bnl_newspapers

مراجع:

processed

استخدم الأمر التالي لتحميل مجموعة البيانات هذه في TFDS:

ds = tfds.load('huggingface:bnl_newspapers/processed')
  • الوصف:
Digitised historic newspapers from the Bibliothèque nationale (BnL) - the National Library of Luxembourg.
  • الترخيص : CC0
  • الإصدار : 1.17.0
  • الأقسام (Splits):
القسم    عدد الأمثلة
'train' 537558
  • الميزات (Features):
{
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "url": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "ispartof": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "text": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "pub_date": {
        "dtype": "timestamp[s]",
        "id": null,
        "_type": "Value"
    },
    "publisher": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "language": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "article_type": {
        "num_classes": 18,
        "names": [
            "ADVERTISEMENT_SECTION",
            "BIBLIOGRAPHY",
            "CHAPTER",
            "INDEX",
            "CONTRIBUTION",
            "TABLE_OF_CONTENTS",
            "WEATHER",
            "SHIPPING",
            "SECTION",
            "ARTICLE",
            "TITLE_SECTION",
            "DEATH_NOTICE",
            "SUPPLEMENT",
            "TABLE",
            "ADVERTISEMENT",
            "CHART_DIAGRAM",
            "ILLUSTRATION",
            "ISSUE"
        ],
        "names_file": null,
        "id": null,
        "_type": "ClassLabel"
    },
    "extent": {
        "dtype": "int32",
        "id": null,
        "_type": "Value"
    }
}