nguyennghia0902/asag-unified-phase1-new
收藏 | Hugging Face | 2026-04-22 更新 | 2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/nguyennghia0902/asag-unified-phase1-new
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: feedback_t5
  features:
  - name: sample_id
    dtype: string
  - name: source_dataset
    dtype: string
  - name: original_id
    dtype: string
  - name: question_uid
    dtype: string
  - name: question_id
    dtype: string
  - name: domain
    dtype: string
  - name: subdomain
    dtype: string
  - name: difficulty
    dtype: string
  - name: question
    dtype: string
  - name: reference_answer
    dtype: string
  - name: student_answer
    dtype: string
  - name: alternative_reference_answers
    list: string
  - name: score_raw
    dtype: float64
  - name: score_normalized
    dtype: 'null'
  - name: label_2way
    dtype: string
  - name: label_3way
    dtype: string
  - name: label_5way
    dtype: string
  - name: key_concepts
    list: string
  - name: missing_concepts
    list: string
  - name: extra_incorrect_claims
    list: string
  - name: misconception_tags
    list: string
  - name: misconception_inventory
    list: string
  - name: feedback_short
    dtype: string
  - name: feedback_detailed
    dtype: string
  - name: feedback_type
    dtype: string
  - name: feedback_tone
    dtype: string
  - name: split
    dtype: string
  - name: is_human_annotated
    dtype: bool
  - name: is_synthetic
    dtype: bool
  - name: is_adversarial
    dtype: bool
  - name: perturbation_type
    dtype: string
  - name: adversarial_variant_of
    dtype: string
  - name: student_answer_style
    dtype: string
  - name: annotation_confidence
    dtype: float64
  - name: usable_for_grading
    dtype: bool
  - name: usable_for_feedback
    dtype: bool
  - name: usable_for_misconception_mining
    dtype: bool
  - name: usable_for_robustness_eval
    dtype: bool
  - name: question_len
    dtype: int64
  - name: reference_answer_len
    dtype: int64
  - name: student_answer_len
    dtype: int64
  - name: feedback_detailed_len
    dtype: int64
  - name: t5_input_grounded
    dtype: string
  - name: t5_input_ungrounded
    dtype: string
  - name: t5_target
    dtype: string
  splits:
  - name: train
    num_bytes: 27907687
    num_examples: 7000
  - name: validation
    num_bytes: 3983507
    num_examples: 1000
  download_size: 12256425
  dataset_size: 31891194
- config_name: grading
  features:
  - name: sample_id
    dtype: string
  - name: source_dataset
    dtype: string
  - name: original_id
    dtype: string
  - name: question_uid
    dtype: string
  - name: question_id
    dtype: string
  - name: domain
    dtype: string
  - name: subdomain
    dtype: string
  - name: difficulty
    dtype: string
  - name: question
    dtype: string
  - name: reference_answer
    dtype: string
  - name: student_answer
    dtype: string
  - name: alternative_reference_answers
    list: string
  - name: score_raw
    dtype: float64
  - name: score_normalized
    dtype: 'null'
  - name: label_2way
    dtype: string
  - name: label_3way
    dtype: string
  - name: label_5way
    dtype: string
  - name: key_concepts
    list: string
  - name: missing_concepts
    list: string
  - name: extra_incorrect_claims
    list: string
  - name: misconception_tags
    list: string
  - name: misconception_inventory
    list: string
  - name: feedback_short
    dtype: string
  - name: feedback_detailed
    dtype: string
  - name: feedback_type
    dtype: string
  - name: feedback_tone
    dtype: string
  - name: split
    dtype: string
  - name: is_human_annotated
    dtype: bool
  - name: is_synthetic
    dtype: bool
  - name: is_adversarial
    dtype: bool
  - name: perturbation_type
    dtype: string
  - name: adversarial_variant_of
    dtype: string
  - name: student_answer_style
    dtype: string
  - name: annotation_confidence
    dtype: float64
  - name: usable_for_grading
    dtype: bool
  - name: usable_for_feedback
    dtype: bool
  - name: usable_for_misconception_mining
    dtype: bool
  - name: usable_for_robustness_eval
    dtype: bool
  - name: question_len
    dtype: int64
  - name: reference_answer_len
    dtype: int64
  - name: student_answer_len
    dtype: int64
  - name: feedback_detailed_len
    dtype: int64
  splits:
  - name: train
    num_bytes: 34869607
    num_examples: 23375
  download_size: 13979914
  dataset_size: 34869607
- config_name: unified
  features:
  - name: sample_id
    dtype: string
  - name: source_dataset
    dtype: string
  - name: original_id
    dtype: string
  - name: question_uid
    dtype: string
  - name: question_id
    dtype: string
  - name: domain
    dtype: string
  - name: subdomain
    dtype: string
  - name: difficulty
    dtype: string
  - name: question
    dtype: string
  - name: reference_answer
    dtype: string
  - name: student_answer
    dtype: string
  - name: alternative_reference_answers
    list: string
  - name: score_raw
    dtype: float64
  - name: score_normalized
    dtype: 'null'
  - name: label_2way
    dtype: string
  - name: label_3way
    dtype: string
  - name: label_5way
    dtype: string
  - name: key_concepts
    list: string
  - name: missing_concepts
    list: string
  - name: extra_incorrect_claims
    list: string
  - name: misconception_tags
    list: string
  - name: misconception_inventory
    list: string
  - name: feedback_short
    dtype: string
  - name: feedback_detailed
    dtype: string
  - name: feedback_type
    dtype: string
  - name: feedback_tone
    dtype: string
  - name: split
    dtype: string
  - name: is_human_annotated
    dtype: bool
  - name: is_synthetic
    dtype: bool
  - name: is_adversarial
    dtype: bool
  - name: perturbation_type
    dtype: string
  - name: adversarial_variant_of
    dtype: string
  - name: student_answer_style
    dtype: string
  - name: annotation_confidence
    dtype: float64
  - name: usable_for_grading
    dtype: bool
  - name: usable_for_feedback
    dtype: bool
  - name: usable_for_misconception_mining
    dtype: bool
  - name: usable_for_robustness_eval
    dtype: bool
  - name: question_len
    dtype: int64
  - name: reference_answer_len
    dtype: int64
  - name: student_answer_len
    dtype: int64
  - name: feedback_detailed_len
    dtype: int64
  splits:
  - name: all
    num_bytes: 34869607
    num_examples: 23375
  download_size: 13979914
  dataset_size: 34869607
configs:
- config_name: feedback_t5
  data_files:
  - split: train
    path: feedback_t5/train-*
  - split: validation
    path: feedback_t5/validation-*
- config_name: grading
  data_files:
  - split: train
    path: grading/train-*
- config_name: unified
  data_files:
  - split: all
    path: unified/all-*
---
提供机构:
nguyennghia0902



