Referencias:
2019-08-01
Utilice el siguiente comando para cargar este conjunto de datos en TFDS:
ds = tfds.load('huggingface:kilt_wikipedia/2019-08-01')
- Descripción:
KILT-Wikipedia: Wikipedia pre-processed for KILT.
- Licencia: Sin licencia conocida
- Versión: 1.0.0
- Divisiones:
División | Ejemplos |
---|---|
'full' | 5903530 |
- Características:
{
"kilt_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"feature": {
"paragraph": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"anchors": {
"feature": {
"paragraph_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"start": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"end": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"href": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"categories": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_info": {
"description": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"enwikiquote_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikidata_label": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"wikipedia_title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"aliases": {
"feature": {
"alias": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"history": {
"pageid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"parentid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"revid": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"pre_dump": {
"dtype": "bool",
"id": null,
"_type": "Value"
},
"timestamp": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"url": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}