atreydesai/augmented-mcqa-together-full-question
收藏 | Hugging Face | 2026-04-03 更新 | 2026-04-12 收录
下载链接:
https://hf-mirror.com/datasets/atreydesai/augmented-mcqa-together-full-question
下载链接
链接失效反馈 | 官方服务:
资源简介:
---
# Dataset card metadata.
# `dataset_info` lists four configs. Each declares the same 32 features and
# the same five splits (2443 examples per split); `dataset_size` is the sum of
# that config's split `num_bytes`.
# `configs` maps each config/split pair to its data-file glob.
dataset_info:
- config_name: vllm_Qwen_Qwen3-4B-Instruct-2507
  features:
  - name: id
    dtype: string
  - name: question_id
    dtype: int64
  - name: dataset_type
    dtype: string
  - name: row_index
    dtype: int64
  - name: sample_id
    dtype: string
  - name: question
    dtype: string
  - name: answer
    dtype: string
  - name: category
    dtype: string
  - name: options
    list: string
  - name: answer_index
    dtype: int64
  - name: choices_human
    list: string
  - name: setting
    dtype: string
  - name: generation_strategy
    dtype: string
  - name: status
    dtype: string
  - name: num_human
    dtype: int64
  - name: num_model
    dtype: int64
  - name: num_choices
    dtype: int64
  - name: human_distractors
    list: string
  - name: model_distractors
    list: string
  - name: distractors
    list: string
  - name: options_randomized
    list: string
  - name: correct_answer_letter
    dtype: string
  - name: evaluation_is_correct
    dtype: bool
  - name: evaluation_score
    dtype: float64
  - name: evaluation_prediction
    dtype: string
  - name: evaluation_prediction_type
    dtype: string
  - name: evaluation_raw_output
    dtype: string
  - name: evaluation_prompt
    dtype: string
  - name: evaluation_status
    dtype: string
  - name: evaluation_question_idx
    dtype: int64
  - name: evaluation_log_path
    dtype: string
  - name: traces
    dtype: string
  splits:
  - name: human_from_scratch
    num_bytes: 6532078
    num_examples: 2443
  - name: model_from_scratch
    num_bytes: 6774066
    num_examples: 2443
  - name: augment_human
    num_bytes: 9617181
    num_examples: 2443
  - name: augment_model
    num_bytes: 10073411
    num_examples: 2443
  - name: augment_ablation
    num_bytes: 9816195
    num_examples: 2443
  download_size: 29162026
  dataset_size: 42812931
- config_name: vllm_allenai_Olmo-3-7B-Instruct
  features:
  - name: id
    dtype: string
  - name: question_id
    dtype: int64
  - name: dataset_type
    dtype: string
  - name: row_index
    dtype: int64
  - name: sample_id
    dtype: string
  - name: question
    dtype: string
  - name: answer
    dtype: string
  - name: category
    dtype: string
  - name: options
    list: string
  - name: answer_index
    dtype: int64
  - name: choices_human
    list: string
  - name: setting
    dtype: string
  - name: generation_strategy
    dtype: string
  - name: status
    dtype: string
  - name: num_human
    dtype: int64
  - name: num_model
    dtype: int64
  - name: num_choices
    dtype: int64
  - name: human_distractors
    list: string
  - name: model_distractors
    list: string
  - name: distractors
    list: string
  - name: options_randomized
    list: string
  - name: correct_answer_letter
    dtype: string
  - name: evaluation_is_correct
    dtype: bool
  - name: evaluation_score
    dtype: float64
  - name: evaluation_prediction
    dtype: string
  - name: evaluation_prediction_type
    dtype: string
  - name: evaluation_raw_output
    dtype: string
  - name: evaluation_prompt
    dtype: string
  - name: evaluation_status
    dtype: string
  - name: evaluation_question_idx
    dtype: int64
  - name: evaluation_log_path
    dtype: string
  - name: traces
    dtype: string
  splits:
  - name: human_from_scratch
    num_bytes: 6505083
    num_examples: 2443
  - name: model_from_scratch
    num_bytes: 6747061
    num_examples: 2443
  - name: augment_human
    num_bytes: 9604914
    num_examples: 2443
  - name: augment_model
    num_bytes: 10061905
    num_examples: 2443
  - name: augment_ablation
    num_bytes: 9804140
    num_examples: 2443
  download_size: 29164377
  dataset_size: 42723103
- config_name: vllm_meta-llama_Llama-3.1-8B-Instruct
  features:
  - name: id
    dtype: string
  - name: question_id
    dtype: int64
  - name: dataset_type
    dtype: string
  - name: row_index
    dtype: int64
  - name: sample_id
    dtype: string
  - name: question
    dtype: string
  - name: answer
    dtype: string
  - name: category
    dtype: string
  - name: options
    list: string
  - name: answer_index
    dtype: int64
  - name: choices_human
    list: string
  - name: setting
    dtype: string
  - name: generation_strategy
    dtype: string
  - name: status
    dtype: string
  - name: num_human
    dtype: int64
  - name: num_model
    dtype: int64
  - name: num_choices
    dtype: int64
  - name: human_distractors
    list: string
  - name: model_distractors
    list: string
  - name: distractors
    list: string
  - name: options_randomized
    list: string
  - name: correct_answer_letter
    dtype: string
  - name: evaluation_is_correct
    dtype: bool
  - name: evaluation_score
    dtype: float64
  - name: evaluation_prediction
    dtype: string
  - name: evaluation_prediction_type
    dtype: string
  - name: evaluation_raw_output
    dtype: string
  - name: evaluation_prompt
    dtype: string
  - name: evaluation_status
    dtype: string
  - name: evaluation_question_idx
    dtype: int64
  - name: evaluation_log_path
    dtype: string
  - name: traces
    dtype: string
  splits:
  - name: human_from_scratch
    num_bytes: 6522094
    num_examples: 2443
  - name: model_from_scratch
    num_bytes: 6764244
    num_examples: 2443
  - name: augment_human
    num_bytes: 9622268
    num_examples: 2443
  - name: augment_model
    num_bytes: 10077821
    num_examples: 2443
  - name: augment_ablation
    num_bytes: 9821337
    num_examples: 2443
  download_size: 29162163
  dataset_size: 42807764
- config_name: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2
  features:
  - name: id
    dtype: string
  - name: question_id
    dtype: int64
  - name: dataset_type
    dtype: string
  - name: row_index
    dtype: int64
  - name: sample_id
    dtype: string
  - name: question
    dtype: string
  - name: answer
    dtype: string
  - name: category
    dtype: string
  - name: options
    list: string
  - name: answer_index
    dtype: int64
  - name: choices_human
    list: string
  - name: setting
    dtype: string
  - name: generation_strategy
    dtype: string
  - name: status
    dtype: string
  - name: num_human
    dtype: int64
  - name: num_model
    dtype: int64
  - name: num_choices
    dtype: int64
  - name: human_distractors
    list: string
  - name: model_distractors
    list: string
  - name: distractors
    list: string
  - name: options_randomized
    list: string
  - name: correct_answer_letter
    dtype: string
  - name: evaluation_is_correct
    dtype: bool
  - name: evaluation_score
    dtype: float64
  - name: evaluation_prediction
    dtype: string
  - name: evaluation_prediction_type
    dtype: string
  - name: evaluation_raw_output
    dtype: string
  - name: evaluation_prompt
    dtype: string
  - name: evaluation_status
    dtype: string
  - name: evaluation_question_idx
    dtype: int64
  - name: evaluation_log_path
    dtype: string
  - name: traces
    dtype: string
  splits:
  - name: human_from_scratch
    num_bytes: 6531827
    num_examples: 2443
  - name: model_from_scratch
    num_bytes: 6773013
    num_examples: 2443
  - name: augment_human
    num_bytes: 9630051
    num_examples: 2443
  - name: augment_model
    num_bytes: 10087781
    num_examples: 2443
  - name: augment_ablation
    num_bytes: 9830115
    num_examples: 2443
  download_size: 29168702
  dataset_size: 42852787
# One entry per config above; each split points at the files under the
# directory named after its config.
configs:
- config_name: vllm_Qwen_Qwen3-4B-Instruct-2507
  data_files:
  - split: human_from_scratch
    path: vllm_Qwen_Qwen3-4B-Instruct-2507/human_from_scratch-*
  - split: model_from_scratch
    path: vllm_Qwen_Qwen3-4B-Instruct-2507/model_from_scratch-*
  - split: augment_ablation
    path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_ablation-*
  - split: augment_human
    path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_human-*
  - split: augment_model
    path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_model-*
- config_name: vllm_allenai_Olmo-3-7B-Instruct
  data_files:
  - split: human_from_scratch
    path: vllm_allenai_Olmo-3-7B-Instruct/human_from_scratch-*
  - split: model_from_scratch
    path: vllm_allenai_Olmo-3-7B-Instruct/model_from_scratch-*
  - split: augment_ablation
    path: vllm_allenai_Olmo-3-7B-Instruct/augment_ablation-*
  - split: augment_human
    path: vllm_allenai_Olmo-3-7B-Instruct/augment_human-*
  - split: augment_model
    path: vllm_allenai_Olmo-3-7B-Instruct/augment_model-*
- config_name: vllm_meta-llama_Llama-3.1-8B-Instruct
  data_files:
  - split: human_from_scratch
    path: vllm_meta-llama_Llama-3.1-8B-Instruct/human_from_scratch-*
  - split: model_from_scratch
    path: vllm_meta-llama_Llama-3.1-8B-Instruct/model_from_scratch-*
  - split: augment_ablation
    path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_ablation-*
  - split: augment_human
    path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_human-*
  - split: augment_model
    path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_model-*
- config_name: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2
  data_files:
  - split: human_from_scratch
    path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/human_from_scratch-*
  - split: model_from_scratch
    path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/model_from_scratch-*
  - split: augment_ablation
    path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_ablation-*
  - split: augment_human
    path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_human-*
  - split: augment_model
    path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_model-*
---
提供机构:
atreydesai



