atreydesai/augmented-mcqa-gemini-choices-only
收藏Hugging Face2026-04-03 更新2026-04-12 收录
下载链接:
https://hf-mirror.com/datasets/atreydesai/augmented-mcqa-gemini-choices-only
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: vllm_Qwen_Qwen3-4B-Instruct-2507
features:
- name: id
dtype: string
- name: question_id
dtype: int64
- name: dataset_type
dtype: string
- name: row_index
dtype: int64
- name: sample_id
dtype: string
- name: question
dtype: string
- name: answer
dtype: string
- name: category
dtype: string
- name: options
list: string
- name: answer_index
dtype: int64
- name: choices_human
list: string
- name: setting
dtype: string
- name: generation_strategy
dtype: string
- name: status
dtype: string
- name: num_human
dtype: int64
- name: num_model
dtype: int64
- name: num_choices
dtype: int64
- name: human_distractors
list: string
- name: model_distractors
list: string
- name: distractors
list: string
- name: options_randomized
list: string
- name: correct_answer_letter
dtype: string
- name: evaluation_is_correct
dtype: bool
- name: evaluation_score
dtype: float64
- name: evaluation_prediction
dtype: string
- name: evaluation_prediction_type
dtype: string
- name: evaluation_raw_output
dtype: string
- name: evaluation_prompt
dtype: string
- name: evaluation_status
dtype: string
- name: evaluation_question_idx
dtype: int64
- name: evaluation_log_path
dtype: string
- name: traces
dtype: string
splits:
- name: human_from_scratch
num_bytes: 6167313
num_examples: 2443
- name: model_from_scratch
num_bytes: 6414356
num_examples: 2443
- name: augment_human
num_bytes: 9531519
num_examples: 2443
- name: augment_model
num_bytes: 9995970
num_examples: 2443
- name: augment_ablation
num_bytes: 9845695
num_examples: 2443
download_size: 27908454
dataset_size: 41954853
- config_name: vllm_allenai_Olmo-3-7B-Instruct
features:
- name: id
dtype: string
- name: question_id
dtype: int64
- name: dataset_type
dtype: string
- name: row_index
dtype: int64
- name: sample_id
dtype: string
- name: question
dtype: string
- name: answer
dtype: string
- name: category
dtype: string
- name: options
list: string
- name: answer_index
dtype: int64
- name: choices_human
list: string
- name: setting
dtype: string
- name: generation_strategy
dtype: string
- name: status
dtype: string
- name: num_human
dtype: int64
- name: num_model
dtype: int64
- name: num_choices
dtype: int64
- name: human_distractors
list: string
- name: model_distractors
list: string
- name: distractors
list: string
- name: options_randomized
list: string
- name: correct_answer_letter
dtype: string
- name: evaluation_is_correct
dtype: bool
- name: evaluation_score
dtype: float64
- name: evaluation_prediction
dtype: string
- name: evaluation_prediction_type
dtype: string
- name: evaluation_raw_output
dtype: string
- name: evaluation_prompt
dtype: string
- name: evaluation_status
dtype: string
- name: evaluation_question_idx
dtype: int64
- name: evaluation_log_path
dtype: string
- name: traces
dtype: string
splits:
- name: human_from_scratch
num_bytes: 6162725
num_examples: 2443
- name: model_from_scratch
num_bytes: 6409777
num_examples: 2443
- name: augment_human
num_bytes: 9526583
num_examples: 2443
- name: augment_model
num_bytes: 9991203
num_examples: 2443
- name: augment_ablation
num_bytes: 9840880
num_examples: 2443
download_size: 27910356
dataset_size: 41931168
- config_name: vllm_meta-llama_Llama-3.1-8B-Instruct
features:
- name: id
dtype: string
- name: question_id
dtype: int64
- name: dataset_type
dtype: string
- name: row_index
dtype: int64
- name: sample_id
dtype: string
- name: question
dtype: string
- name: answer
dtype: string
- name: category
dtype: string
- name: options
list: string
- name: answer_index
dtype: int64
- name: choices_human
list: string
- name: setting
dtype: string
- name: generation_strategy
dtype: string
- name: status
dtype: string
- name: num_human
dtype: int64
- name: num_model
dtype: int64
- name: num_choices
dtype: int64
- name: human_distractors
list: string
- name: model_distractors
list: string
- name: distractors
list: string
- name: options_randomized
list: string
- name: correct_answer_letter
dtype: string
- name: evaluation_is_correct
dtype: bool
- name: evaluation_score
dtype: float64
- name: evaluation_prediction
dtype: string
- name: evaluation_prediction_type
dtype: string
- name: evaluation_raw_output
dtype: string
- name: evaluation_prompt
dtype: string
- name: evaluation_status
dtype: string
- name: evaluation_question_idx
dtype: int64
- name: evaluation_log_path
dtype: string
- name: traces
dtype: string
splits:
- name: human_from_scratch
num_bytes: 6179473
num_examples: 2443
- name: model_from_scratch
num_bytes: 6426501
num_examples: 2443
- name: augment_human
num_bytes: 9543729
num_examples: 2443
- name: augment_model
num_bytes: 10008175
num_examples: 2443
- name: augment_ablation
num_bytes: 9857890
num_examples: 2443
download_size: 27908402
dataset_size: 42015768
- config_name: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2
features:
- name: id
dtype: string
- name: question_id
dtype: int64
- name: dataset_type
dtype: string
- name: row_index
dtype: int64
- name: sample_id
dtype: string
- name: question
dtype: string
- name: answer
dtype: string
- name: category
dtype: string
- name: options
list: string
- name: answer_index
dtype: int64
- name: choices_human
list: string
- name: setting
dtype: string
- name: generation_strategy
dtype: string
- name: status
dtype: string
- name: num_human
dtype: int64
- name: num_model
dtype: int64
- name: num_choices
dtype: int64
- name: human_distractors
list: string
- name: model_distractors
list: string
- name: distractors
list: string
- name: options_randomized
list: string
- name: correct_answer_letter
dtype: string
- name: evaluation_is_correct
dtype: bool
- name: evaluation_score
dtype: float64
- name: evaluation_prediction
dtype: string
- name: evaluation_prediction_type
dtype: string
- name: evaluation_raw_output
dtype: string
- name: evaluation_prompt
dtype: string
- name: evaluation_status
dtype: string
- name: evaluation_question_idx
dtype: int64
- name: evaluation_log_path
dtype: string
- name: traces
dtype: string
splits:
- name: human_from_scratch
num_bytes: 6187374
num_examples: 2443
- name: model_from_scratch
num_bytes: 6433433
num_examples: 2443
- name: augment_human
num_bytes: 9549986
num_examples: 2443
- name: augment_model
num_bytes: 10014460
num_examples: 2443
- name: augment_ablation
num_bytes: 9864522
num_examples: 2443
download_size: 27915656
dataset_size: 42049775
configs:
- config_name: vllm_Qwen_Qwen3-4B-Instruct-2507
data_files:
- split: human_from_scratch
path: vllm_Qwen_Qwen3-4B-Instruct-2507/human_from_scratch-*
- split: model_from_scratch
path: vllm_Qwen_Qwen3-4B-Instruct-2507/model_from_scratch-*
- split: augment_ablation
path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_ablation-*
- split: augment_human
path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_human-*
- split: augment_model
path: vllm_Qwen_Qwen3-4B-Instruct-2507/augment_model-*
- config_name: vllm_allenai_Olmo-3-7B-Instruct
data_files:
- split: human_from_scratch
path: vllm_allenai_Olmo-3-7B-Instruct/human_from_scratch-*
- split: model_from_scratch
path: vllm_allenai_Olmo-3-7B-Instruct/model_from_scratch-*
- split: augment_ablation
path: vllm_allenai_Olmo-3-7B-Instruct/augment_ablation-*
- split: augment_human
path: vllm_allenai_Olmo-3-7B-Instruct/augment_human-*
- split: augment_model
path: vllm_allenai_Olmo-3-7B-Instruct/augment_model-*
- config_name: vllm_meta-llama_Llama-3.1-8B-Instruct
data_files:
- split: human_from_scratch
path: vllm_meta-llama_Llama-3.1-8B-Instruct/human_from_scratch-*
- split: model_from_scratch
path: vllm_meta-llama_Llama-3.1-8B-Instruct/model_from_scratch-*
- split: augment_ablation
path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_ablation-*
- split: augment_human
path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_human-*
- split: augment_model
path: vllm_meta-llama_Llama-3.1-8B-Instruct/augment_model-*
- config_name: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2
data_files:
- split: human_from_scratch
path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/human_from_scratch-*
- split: model_from_scratch
path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/model_from_scratch-*
- split: augment_ablation
path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_ablation-*
- split: augment_human
path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_human-*
- split: augment_model
path: vllm_nvidia_NVIDIA-Nemotron-Nano-9B-v2/augment_model-*
---
提供机构:
atreydesai



