Referensi:
2019-08-01
Gunakan perintah berikut untuk memuat kumpulan data ini di TFDS:
ds = tfds.load('huggingface:kilt_wikipedia/2019-08-01')
- Keterangan :
KILT-Wikipedia: Wikipedia pre-processed for KILT.
- Lisensi : Tidak ada lisensi yang diketahui
- Versi : 1.0.0
- Split :
Split | Contoh |
---|---|
'full' | 5903530 |
- Fitur :
{
"kilt_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"feature": {
"paragraph": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"anchors": {
"feature": {
"paragraph_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"start": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"end": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"href": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"categories": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_info": {
"description": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"enwikiquote_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_label": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"aliases": {
"feature": {
"alias": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"history": {
"pageid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"parentid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"revid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"pre_dump": {
"dtype": "bool",
"id": null,
"_type": "Value"
},
"timestamp": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"url": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}