参考文献:

次のコマンドを使用して、このデータセットを TFDS にロードします。

ds = tfds.load('huggingface:tne')
  • 説明
TNE is an NLU task that focuses on relations between noun phrases (NPs) that can be mediated via prepositions.
The dataset contains 5,497 documents, annotated exhaustively with all possible links between the NPs in each document.
  • ライセンス: MIT
  • バージョン: 1.1.0
  • 分割:
スプリット 例数
'test' 500
'test_ood' 509
'train' 3988
'validation' 500
  • 特徴
{
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "text": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "tokens": {
        "feature": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "nps": [
        {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "first_char": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "last_char": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "first_token": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "last_token": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "id": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        }
    ],
    "np_relations": [
        {
            "anchor": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "complement": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "preposition": {
                "num_classes": 24,
                "names": [
                    "about",
                    "for",
                    "with",
                    "from",
                    "among",
                    "by",
                    "on",
                    "at",
                    "during",
                    "of",
                    "member(s) of",
                    "in",
                    "after",
                    "under",
                    "to",
                    "into",
                    "before",
                    "near",
                    "outside",
                    "around",
                    "between",
                    "against",
                    "over",
                    "inside"
                ],
                "id": null,
                "_type": "ClassLabel"
            },
            "complement_coref_cluster_id": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        }
    ],
    "coref": [
        {
            "id": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "members": {
                "feature": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "length": -1,
                "id": null,
                "_type": "Sequence"
            },
            "np_type": {
                "num_classes": 3,
                "names": [
                    "standard",
                    "time/date/measurement",
                    "idiomatic"
                ],
                "id": null,
                "_type": "ClassLabel"
            }
        }
    ],
    "metadata": {
        "annotators": {
            "coref_worker": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "consolidator_worker": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "np-relations_worker": {
                "feature": {
                    "dtype": "int32",
                    "id": null,
                    "_type": "Value"
                },
                "length": -1,
                "id": null,
                "_type": "Sequence"
            }
        },
        "url": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "source": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}