ENSEONG/full-math-private-Qwen3-4B-Instruct-2507-bon
收藏Hugging Face2026-03-01 更新2026-03-29 收录
下载链接:
https://hf-mirror.com/datasets/ENSEONG/full-math-private-Qwen3-4B-Instruct-2507-bon
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 733378612
num_examples: 5000
download_size: 155307315
dataset_size: 733378612
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 733092592
num_examples: 5000
download_size: 154966055
dataset_size: 733092592
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 733704827
num_examples: 5000
download_size: 155154761
dataset_size: 733704827
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 734130837
num_examples: 5000
download_size: 171101204
dataset_size: 734130837
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 733880744
num_examples: 5000
download_size: 171103612
dataset_size: 733880744
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 733911272
num_examples: 5000
download_size: 171497320
dataset_size: 733911272
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 734983813
num_examples: 5000
download_size: 181887583
dataset_size: 734983813
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 734591399
num_examples: 5000
download_size: 181709525
dataset_size: 734591399
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 734873581
num_examples: 5000
download_size: 181794108
dataset_size: 734873581
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 735722939
num_examples: 5000
download_size: 189961400
dataset_size: 735722939
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 735333377
num_examples: 5000
download_size: 189696273
dataset_size: 735333377
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 735952383
num_examples: 5000
download_size: 189879824
dataset_size: 735952383
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 736876582
num_examples: 5000
download_size: 196958882
dataset_size: 736876582
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 737406396
num_examples: 5000
download_size: 197041745
dataset_size: 737406396
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 736915225
num_examples: 5000
download_size: 196816865
dataset_size: 736915225
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 738932262
num_examples: 5000
download_size: 203625736
dataset_size: 738932262
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 738690556
num_examples: 5000
download_size: 203433105
dataset_size: 738690556
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 739289707
num_examples: 5000
download_size: 203710182
dataset_size: 739289707
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 741332270
num_examples: 5000
download_size: 209939787
dataset_size: 741332270
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 741122934
num_examples: 5000
download_size: 209910427
dataset_size: 741122934
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 740764842
num_examples: 5000
download_size: 209758588
dataset_size: 740764842
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 743886975
num_examples: 5000
download_size: 215840246
dataset_size: 743886975
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 742851808
num_examples: 5000
download_size: 215545202
dataset_size: 742851808
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 743182052
num_examples: 5000
download_size: 215706753
dataset_size: 743182052
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 746965102
num_examples: 5000
download_size: 221852276
dataset_size: 746965102
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 747001455
num_examples: 5000
download_size: 221871906
dataset_size: 747001455
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 746852823
num_examples: 5000
download_size: 221786377
dataset_size: 746852823
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 750428224
num_examples: 5000
download_size: 228002126
dataset_size: 750428224
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 750254345
num_examples: 5000
download_size: 227983165
dataset_size: 750254345
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 750406278
num_examples: 5000
download_size: 228033763
dataset_size: 750406278
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 755209185
num_examples: 5000
download_size: 234772020
dataset_size: 755209185
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 755304716
num_examples: 5000
download_size: 234895570
dataset_size: 755304716
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 754337973
num_examples: 5000
download_size: 234466354
dataset_size: 754337973
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-0--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 760531562
num_examples: 5000
download_size: 241777790
dataset_size: 760531562
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-42--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 760280791
num_examples: 5000
download_size: 241759682
dataset_size: 760280791
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-64--agg_strategy-last
features:
- name: problem
dtype: string
- name: level
dtype: string
- name: type
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: completions
list: string
- name: scores
list:
list: float32
- name: pred
dtype: string
- name: completion_tokens
list: int64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
splits:
- name: train
num_bytes: 760574921
num_examples: 5000
download_size: 241791391
dataset_size: 760574921
configs:
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.1--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.2--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.3--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.4--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.5--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.6--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.7--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.8--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-0.9--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.0--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.1--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-0--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-0--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-42--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-42--agg_strategy-last/train-*
- config_name: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-64--agg_strategy-last
data_files:
- split: train
path: ENSEONG_math-private--T-1.2--top_p-1.0--n-64--seed-64--agg_strategy-last/train-*
---
提供机构:
ENSEONG



