subjqa

مراجع:

books (کتاب‌ها)

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/books')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 345
'train' | 1314
'validation' | 256
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}

electronics (الکترونیک)

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/electronics')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 358
'train' | 1295
'validation' | 255
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}

grocery (خواربار)

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/grocery')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 591
'train' | 1124
'validation' | 218
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}

movies (فیلم‌ها)

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/movies')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 291
'train' | 1369
'validation' | 261
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}

restaurants (رستوران‌ها)

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/restaurants')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 266
'train' | 1400
'validation' | 267
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}

tripadvisor

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:subjqa/tripadvisor')
  • توضیحات :
SubjQA is a question answering dataset that focuses on subjective questions and answers.
The dataset consists of roughly 10,000 questions over reviews from 6 different domains: books, movies, grocery,
electronics, TripAdvisor (i.e. hotels), and restaurants.
  • مجوز : مجوز شناخته شده ای وجود ندارد
  • نسخه : 1.1.0
  • تقسیم ها :
تقسیم | تعداد نمونه‌ها
'test' | 512
'train' | 1165
'validation' | 230
  • ویژگی ها :
{
    "domain": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "nn_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_mod": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "query_asp": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "q_reviews_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_subj_level": {
        "dtype": "int64",
        "id": null,
        "_type": "Value"
    },
    "ques_subj_score": {
        "dtype": "float32",
        "id": null,
        "_type": "Value"
    },
    "is_ques_subjective": {
        "dtype": "bool",
        "id": null,
        "_type": "Value"
    },
    "review_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "title": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "context": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "feature": {
            "text": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "answer_start": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "answer_subj_level": {
                "dtype": "int64",
                "id": null,
                "_type": "Value"
            },
            "ans_subj_score": {
                "dtype": "float32",
                "id": null,
                "_type": "Value"
            },
            "is_ans_subjective": {
                "dtype": "bool",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    }
}