참고자료:
parsed_pdfs
TFDS에서 이 데이터세트를 로드하려면 다음 명령어를 사용하세요.
ds = tfds.load('huggingface:peer_read/parsed_pdfs')
- 설명 :
PeerRead is a dataset of scientific peer reviews available to help researchers study this important artifact. The dataset consists of over 14K paper drafts and the corresponding accept/reject decisions in top-tier venues including ACL, NIPS and ICLR, as well as over 10K textual peer reviews written by experts for a subset of the papers.
- 라이선스 : Creative Commons Public License
- 버전 : 1.1.0
- 분할 :
분할 | 예시 수 |
---|---|
'test' | 637 |
'train' | 11090 |
'validation' | 637 |
- 특징 :
{
"name": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"metadata": {
"source": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"authors": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"emails": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"sections": {
"feature": {
"heading": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"text": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"references": {
"feature": {
"title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"author": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"venue": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"citeRegEx": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"shortCiteRegEx": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"year": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"referenceMentions": {
"feature": {
"referenceID": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"context": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"startOffset": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"endOffset": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"year": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"abstractText": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"creator": {
"dtype": "string",
"id": null,
"_type": "Value"
}
}
}
reviews
TFDS에서 이 데이터세트를 로드하려면 다음 명령어를 사용하세요.
ds = tfds.load('huggingface:peer_read/reviews')
- 설명 :
PeerRead is a dataset of scientific peer reviews available to help researchers study this important artifact. The dataset consists of over 14K paper drafts and the corresponding accept/reject decisions in top-tier venues including ACL, NIPS and ICLR, as well as over 10K textual peer reviews written by experts for a subset of the papers.
- 라이선스 : Creative Commons Public License
- 버전 : 1.1.0
- 분할 :
분할 | 예시 수 |
---|---|
'test' | 637 |
'train' | 11090 |
'validation' | 637 |
- 특징 :
{
"id": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"conference": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"comments": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"subjects": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"version": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"date_of_submission": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"authors": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"accepted": {
"dtype": "bool",
"id": null,
"_type": "Value"
},
"abstract": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"histories": {
"feature": {
"feature": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"length": -1,
"id": null,
"_type": "Sequence"
},
"reviews": {
"feature": {
"date": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"title": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"other_keys": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"originality": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"comments": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"is_meta_review": {
"dtype": "bool",
"id": null,
"_type": "Value"
},
"is_annotated": {
"dtype": "bool",
"id": null,
"_type": "Value"
},
"recommendation": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"replicability": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"presentation_format": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"clarity": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"meaningful_comparison": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"substance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"reviewer_confidence": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"soundness_correctness": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"appropriateness": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"impact": {
"dtype": "string",
"id": null,
"_type": "Value"
}
},
"length": -1,
"id": null,
"_type": "Sequence"
}
}