তথ্যসূত্র:
TFDS-এ এই ডেটাসেট লোড করতে নিম্নলিখিত কমান্ডটি ব্যবহার করুন:
ds = tfds.load('huggingface:jigsaw_unintended_bias')
- বর্ণনা :
A collection of comments from the defunct Civil Comments platform that have been annotated for their toxicity.
- লাইসেন্স : CC0 (ডেটাসেট এবং অন্তর্নিহিত পাঠ্য উভয়ই)
- সংস্করণ : 1.1.0
- বিভাজন :
| বিভাজন | উদাহরণ |
|---|---|
| 'test_private_leaderboard' | 97320 |
| 'test_public_leaderboard' | 97320 |
| 'train' | 1804874 |
- বৈশিষ্ট্য :
{
"target": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"comment_text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"severe_toxicity": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"obscene": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"identity_attack": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"insult": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"threat": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"asian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"atheist": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"bisexual": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"black": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"buddhist": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"christian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"female": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"heterosexual": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"hindu": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"homosexual_gay_or_lesbian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"intellectual_or_learning_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"jewish": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"latino": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"male": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"muslim": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_gender": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_race_or_ethnicity": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_religion": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_sexual_orientation": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"physical_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"psychiatric_or_mental_illness": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"transgender": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"white": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"created_date": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"publication_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"parent_id": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"article_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"rating": {
"num_classes": 2,
"names": [
"rejected",
"approved"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"funny": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"wow": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"sad": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"likes": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"disagree": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"sexual_explicit": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"identity_annotator_count": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"toxicity_annotator_count": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}