参考文献:
次のコマンドを使用して、このデータセットを TFDS で読み込みます。
ds = tfds.load('huggingface:tne')
- 説明:
TNE is an NLU task which focuses on relations between noun phrases (NPs) that can be mediated via prepositions.
The dataset contains 5,497 documents, annotated exhaustively with all possible links between the NPs in each document.
- ライセンス: MIT
- バージョン: 1.1.0
- 分割:
分割 | 例の数 |
---|---|
'test' | 500 |
'test_ood' | 509 |
'train' | 3988 |
'validation' | 500 |
- 特徴:
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"tokens": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"nps": [
{
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"first_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_char": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"first_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"last_token": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"np_relations": [
{
"anchor": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"complement": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"preposition": {
"num_classes": 24,
"names": [
"about",
"for",
"with",
"from",
"among",
"by",
"on",
"at",
"during",
"of",
"member(s) of",
"in",
"after",
"under",
"to",
"into",
"before",
"near",
"outside",
"around",
"between",
"against",
"over",
"inside"
],
"id": null,
"_type": "ClassLabel"
},
"complement_coref_cluster_id": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
],
"coref": [
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"members": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"np_type": {
"num_classes": 3,
"names": [
"standard",
"time/date/measurement",
"idiomatic"
],
"id": null,
"_type": "ClassLabel"
}
}
],
"metadata": {
"annotators": {
"coref_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"consolidator_worker": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"np-relations_worker": {
"feature": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
}
},
"url": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"source": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}