Références :
Utilisez la commande suivante pour charger cet ensemble de données dans TFDS :
ds = tfds.load('huggingface:tne')
- Description :
TNE is an NLU task that focuses on relations between noun phrases (NPs) that can be mediated via prepositions.
The dataset contains 5,497 documents, annotated exhaustively with all possible links between the NPs in each document.
- Licence : MIT
- Version : 1.1.0
- Divisions :
Division | Exemples |
---|---|
'test' | 500 |
'test_ood' | 509 |
'train' | 3988 |
'validation' | 500 |
- Caractéristiques :
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"tokens": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"nps": [
{
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"first_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"first_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"np_relations": [
{
"anchor": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"complement": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"preposition": {
"num_classes": 24,
"names": [
"about",
"for",
"with",
"from",
"among",
"by",
"on",
"at",
"during",
"of",
"member(s) of",
"in",
"after",
"under",
"to",
"into",
"before",
"near",
"outside",
"around",
"between",
"against",
"over",
"inside"
],
"id": null,
"_type": "ClassLabel"
},
"complement_coref_cluster_id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"coref": [
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"members": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"np_type": {
"num_classes": 3,
"names": [
"standard",
"time/date/measurement",
"idiomatic"
],
"id": null,
"_type": "ClassLabel"
}
}
],
"metadata": {
"annotators": {
"coref_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"consolidator_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"np-relations_worker": {
"feature": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"url": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"source": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}