مراجع:
dyda_da
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/dyda_da')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 7740 |
'train' | 87170 |
'validation' | 8069 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_Act": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 4,
"names": [
"commissive",
"directive",
"inform",
"question"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
dyda_e
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/dyda_e')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 7740 |
'train' | 87170 |
'validation' | 8069 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Emotion": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 7,
"names": [
"anger",
"disgust",
"fear",
"happiness",
"no emotion",
"sadness",
"surprise"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
iemocap
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/iemocap')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 2021 |
'train' | 7213 |
'validation' | 805 |
- ویژگی ها :
{
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Emotion": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 11,
"names": [
"ang",
"dis",
"exc",
"fea",
"fru",
"hap",
"neu",
"oth",
"sad",
"sur",
"xxx"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
maptask
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/maptask')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 2894 |
'train' | 20905 |
'validation' | 2963 |
- ویژگی ها :
{
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_Act": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 12,
"names": [
"acknowledge",
"align",
"check",
"clarify",
"explain",
"instruct",
"query_w",
"query_yn",
"ready",
"reply_n",
"reply_w",
"reply_y"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
meld_e
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/meld_e')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 2610 |
'train' | 9989 |
'validation' | 1109 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Emotion": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 7,
"names": [
"anger",
"disgust",
"fear",
"joy",
"neutral",
"sadness",
"surprise"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
meld_s
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/meld_s')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 2610 |
'train' | 9989 |
'validation' | 1109 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sentiment": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 3,
"names": [
"negative",
"neutral",
"positive"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
mrda
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/mrda')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 15470 |
'train' | 83943 |
'validation' | 9815 |
- ویژگی ها :
{
"Utterance_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_Act": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Channel_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 5,
"names": [
"s",
"d",
"b",
"f",
"q"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
oasis
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/oasis')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 1478 |
'train' | 12076 |
'validation' | 1513 |
- ویژگی ها :
{
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_Act": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 42,
"names": [
"accept",
"ackn",
"answ",
"answElab",
"appreciate",
"backch",
"bye",
"complete",
"confirm",
"correct",
"direct",
"directElab",
"echo",
"exclaim",
"expressOpinion",
"expressPossibility",
"expressRegret",
"expressWish",
"greet",
"hold",
"identifySelf",
"inform",
"informCont",
"informDisc",
"informIntent",
"init",
"negate",
"offer",
"pardon",
"raiseIssue",
"refer",
"refuse",
"reqDirect",
"reqInfo",
"reqModal",
"selfTalk",
"suggest",
"thank",
"informIntent-hold",
"correctSelf",
"expressRegret-inform",
"thank-identifySelf"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
sem
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/sem')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 878 |
'train' | 4264 |
'validation' | 485 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"NbPairInSession": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"SpeechTurn": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Speaker": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Sentiment": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 3,
"names": [
"Negative",
"Neutral",
"Positive"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}
swda
برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:
ds = tfds.load('huggingface:silicone/swda')
- توضیحات :
The Sequence labellIng evaLuatIon benChmark fOr spoken laNguagE (SILICONE) benchmark is a collection
of resources for training, evaluating, and analyzing natural language understanding systems
specifically designed for spoken language. All datasets are in the English language and cover a
variety of domains including daily life, scripted scenarios, joint task completion, phone call
conversations, and television dialogue. Some datasets additionally include emotion and/or sentiment
labels.
- مجوز : مجوز شناخته شده ای وجود ندارد
- نسخه : 1.0.0
- تقسیم ها :
تقسیم | نمونه ها |
---|---|
'test' | 2714 |
'train' | 190709 |
'validation' | 21203 |
- ویژگی ها :
{
"Utterance": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_Act": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"From_Caller": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"To_Caller": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Topic": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Dialogue_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Conv_ID": {
"dtype": "string",
"id": null,
"_type": "Value"
},
"Label": {
"num_classes": 46,
"names": [
"sd",
"b",
"sv",
"%",
"aa",
"ba",
"fc",
"qw",
"nn",
"bk",
"h",
"qy^d",
"bh",
"^q",
"bf",
"fo_o_fw_\"_by_bc",
"fo_o_fw_by_bc_\"",
"na",
"ad",
"^2",
"b^m",
"qo",
"qh",
"^h",
"ar",
"ng",
"br",
"no",
"fp",
"qrr",
"arp_nd",
"t3",
"oo_co_cc",
"aap_am",
"t1",
"bd",
"^g",
"qw^d",
"fa",
"ft",
"+",
"x",
"ny",
"sv_fx",
"qy_qr",
"ba_fe"
],
"names_file": null,
"id": null,
"_type": "ClassLabel"
},
"Idx": {
"dtype": "int32",
"id": null,
"_type": "Value"
}
}