Referências:
Use o seguinte comando para carregar esse conjunto de dados no TFDS:
ds = tfds.load('huggingface:tne')
- Descrição :
TNE is an NLU task which focuses on relations between noun phrases (NPs) that can be mediated via prepositions.
The dataset contains 5,497 documents, annotated exhaustively with all possible links between the NPs in each document.
- Licença : MIT
- Versão : 1.1.0
- Divisões :
Divisão | Exemplos |
---|---|
'test' | 500 |
'test_ood' | 509 |
'train' | 3988 |
'validation' | 500 |
- Características :
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"tokens": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"nps": [
{
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"first_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"first_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"np_relations": [
{
"anchor": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"complement": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"preposition": {
"num_classes": 24,
"names": [
"about",
"for",
"with",
"from",
"among",
"by",
"on",
"at",
"during",
"of",
"member(s) of",
"in",
"after",
"under",
"to",
"into",
"before",
"near",
"outside",
"around",
"between",
"against",
"over",
"inside"
],
"id": null,
"_type": "ClassLabel"
},
"complement_coref_cluster_id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"coref": [
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"members": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"np_type": {
"num_classes": 3,
"names": [
"standard",
"time/date/measurement",
"idiomatic"
],
"id": null,
"_type": "ClassLabel"
}
}
],
"metadata": {
"annotators": {
"coref_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"consolidator_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"np-relations_worker": {
"feature": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"url": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"source": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}