อ้างอิง:
ใช้คำสั่งต่อไปนี้เพื่อโหลดชุดข้อมูลนี้ใน TFDS:
ds = tfds.load('huggingface:jigsaw_unintended_bias')
- คำอธิบาย :
A collection of comments from the defunct Civil Comments platform that have been annotated for their toxicity.
- ใบอนุญาต : CC0 (ทั้งชุดข้อมูลและข้อความพื้นฐาน)
- เวอร์ชัน : 1.1.0
- ชุดข้อมูลย่อย (Splits) :
ชุดข้อมูลย่อย | จำนวนตัวอย่าง |
---|---|
'test_private_leaderboard' | 97320 |
'test_public_leaderboard' | 97320 |
'train' | 1804874 |
- ฟีเจอร์ (Features) :
{
"target": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"comment_text": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"severe_toxicity": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"obscene": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"identity_attack": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"insult": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"threat": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"asian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"atheist": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"bisexual": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"black": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"buddhist": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"christian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"female": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"heterosexual": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"hindu": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"homosexual_gay_or_lesbian": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"intellectual_or_learning_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"jewish": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"latino": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"male": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"muslim": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_gender": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_race_or_ethnicity": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_religion": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"other_sexual_orientation": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"physical_disability": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"psychiatric_or_mental_illness": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"transgender": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"white": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"created_date": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"publication_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"parent_id": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"article_id": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"rating": {
"num_classes": 2,
"names": [
"rejected",
"approved"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"funny": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"wow": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"sad": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"likes": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"disagree": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"sexual_explicit": {
"dtype": "float32",
"id": null,
"_type": "Value"
},
"identity_annotator_count": {
"dtype": "int32",
"id": null,
"_type": "Value"
},
"toxicity_annotator_count": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}