rashadaziz/mrt-traces
收藏Hugging Face2026-04-14 更新2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/rashadaziz/mrt-traces
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: gemma4-31b_mmmlu_ar
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11853271
num_examples: 1000
download_size: 4929447
dataset_size: 11853271
- config_name: gemma4-31b_mmmlu_bn
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 14260602
num_examples: 1000
download_size: 5343460
dataset_size: 14260602
- config_name: gemma4-31b_mmmlu_de
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11592686
num_examples: 1000
download_size: 5079638
dataset_size: 11592686
- config_name: gemma4-31b_mmmlu_en
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11014985
num_examples: 1000
download_size: 4526417
dataset_size: 11014985
- config_name: gemma4-31b_mmmlu_sw
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11522291
num_examples: 1000
download_size: 4899695
dataset_size: 11522291
- config_name: gemma4-31b_mmmlu_zh
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11241615
num_examples: 1000
download_size: 5045736
dataset_size: 11241615
- config_name: qwen3-32b_mmmlu_ar
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 9013409
num_examples: 1000
download_size: 3538393
dataset_size: 9013409
- config_name: qwen3-32b_mmmlu_bn
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11577727
num_examples: 1000
download_size: 4178141
dataset_size: 11577727
- config_name: qwen3-32b_mmmlu_de
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 8965267
num_examples: 1000
download_size: 3582527
dataset_size: 8965267
- config_name: qwen3-32b_mmmlu_en
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 8338982
num_examples: 1000
download_size: 3575682
dataset_size: 8338982
- config_name: qwen3-32b_mmmlu_sw
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 9517839
num_examples: 1000
download_size: 3845568
dataset_size: 9517839
- config_name: qwen3-32b_mmmlu_zh
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 9765874
num_examples: 1000
download_size: 4041334
dataset_size: 9765874
- config_name: qwen3-8b_mmmlu_ar
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11936013
num_examples: 1000
download_size: 4463456
dataset_size: 11936013
- config_name: qwen3-8b_mmmlu_bn
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 14211700
num_examples: 1000
download_size: 4965453
dataset_size: 14211700
- config_name: qwen3-8b_mmmlu_de
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11157539
num_examples: 1000
download_size: 4363953
dataset_size: 11157539
- config_name: qwen3-8b_mmmlu_en
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 11893360
num_examples: 1000
download_size: 4548773
dataset_size: 11893360
- config_name: qwen3-8b_mmmlu_sw
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 14196456
num_examples: 1000
download_size: 5054053
dataset_size: 14196456
- config_name: qwen3-8b_mmmlu_zh
features:
- name: question_id
dtype: string
- name: model
dtype: string
- name: dataset
dtype: string
- name: language
dtype: string
- name: condition
dtype: string
- name: subject
dtype: string
- name: prompt
dtype: string
- name: raw_prompt
dtype: string
- name: raw_response
dtype: string
- name: reasoning_trace
dtype: string
- name: final_answer
dtype: string
- name: correct_answer
dtype: string
- name: is_correct
dtype: bool
- name: completion_tokens
dtype: int64
- name: prompt_tokens
dtype: int64
- name: dominant_language
dtype: string
- name: compliance_rate
dtype: float64
- name: num_switches
dtype: int64
- name: detected_languages
dtype: string
- name: language_switches
dtype: string
splits:
- name: train
num_bytes: 14578827
num_examples: 1000
download_size: 5214922
dataset_size: 14578827
configs:
- config_name: gemma4-31b_mmmlu_ar
data_files:
- split: train
path: gemma4-31b_mmmlu_ar/train-*
- config_name: gemma4-31b_mmmlu_bn
data_files:
- split: train
path: gemma4-31b_mmmlu_bn/train-*
- config_name: gemma4-31b_mmmlu_de
data_files:
- split: train
path: gemma4-31b_mmmlu_de/train-*
- config_name: gemma4-31b_mmmlu_en
data_files:
- split: train
path: gemma4-31b_mmmlu_en/train-*
- config_name: gemma4-31b_mmmlu_sw
data_files:
- split: train
path: gemma4-31b_mmmlu_sw/train-*
- config_name: gemma4-31b_mmmlu_zh
data_files:
- split: train
path: gemma4-31b_mmmlu_zh/train-*
- config_name: qwen3-32b_mmmlu_ar
data_files:
- split: train
path: qwen3-32b_mmmlu_ar/train-*
- config_name: qwen3-32b_mmmlu_bn
data_files:
- split: train
path: qwen3-32b_mmmlu_bn/train-*
- config_name: qwen3-32b_mmmlu_de
data_files:
- split: train
path: qwen3-32b_mmmlu_de/train-*
- config_name: qwen3-32b_mmmlu_en
data_files:
- split: train
path: qwen3-32b_mmmlu_en/train-*
- config_name: qwen3-32b_mmmlu_sw
data_files:
- split: train
path: qwen3-32b_mmmlu_sw/train-*
- config_name: qwen3-32b_mmmlu_zh
data_files:
- split: train
path: qwen3-32b_mmmlu_zh/train-*
- config_name: qwen3-8b_mmmlu_ar
data_files:
- split: train
path: qwen3-8b_mmmlu_ar/train-*
- config_name: qwen3-8b_mmmlu_bn
data_files:
- split: train
path: qwen3-8b_mmmlu_bn/train-*
- config_name: qwen3-8b_mmmlu_de
data_files:
- split: train
path: qwen3-8b_mmmlu_de/train-*
- config_name: qwen3-8b_mmmlu_en
data_files:
- split: train
path: qwen3-8b_mmmlu_en/train-*
- config_name: qwen3-8b_mmmlu_sw
data_files:
- split: train
path: qwen3-8b_mmmlu_sw/train-*
- config_name: qwen3-8b_mmmlu_zh
data_files:
- split: train
path: qwen3-8b_mmmlu_zh/train-*
---
提供机构:
rashadaziz



