ENSEONG/grad_weighted_mean-Qwen2.5-1.5B-Instruct-Prm-Skywork-Qwen2.5-1.5B-dvts-completions
收藏Hugging Face2025-12-10 更新2025-12-20 收录
下载链接:
https://hf-mirror.com/datasets/ENSEONG/grad_weighted_mean-Qwen2.5-1.5B-Instruct-Prm-Skywork-Qwen2.5-1.5B-dvts-completions
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-256--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: pass@128
dtype: float64
- name: pass@256
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
- name: pred_weighted@128
dtype: string
- name: pred_maj@128
dtype: string
- name: pred_naive@128
dtype: string
- name: pred_weighted@256
dtype: string
- name: pred_maj@256
dtype: string
- name: pred_naive@256
dtype: string
splits:
- name: train
num_bytes: 214609832
num_examples: 500
download_size: 41246516
dataset_size: 214609832
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.06--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 56977417
num_examples: 500
download_size: 11394219
dataset_size: 56977417
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.1--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 57838038
num_examples: 500
download_size: 11393588
dataset_size: 57838038
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 58061983
num_examples: 500
download_size: 11384044
dataset_size: 58061983
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.18--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 57685444
num_examples: 500
download_size: 11291211
dataset_size: 57685444
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.22--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 57458385
num_examples: 500
download_size: 11189993
dataset_size: 57458385
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.26--entropy_agg-grad_weighted_mean
features:
- name: problem
dtype: string
- name: solution
dtype: string
- name: answer
dtype: string
- name: subject
dtype: string
- name: level
dtype: int64
- name: unique_id
dtype: string
- name: completions
list: string
- name: pred
dtype: string
- name: completion_tokens
dtype: int64
- name: scores
list:
list: float64
- name: entropies
list:
list: float64
- name: preds
list: string
- name: pass@1
dtype: float64
- name: pass@2
dtype: float64
- name: pass@4
dtype: float64
- name: pass@8
dtype: float64
- name: pass@16
dtype: float64
- name: pass@32
dtype: float64
- name: pass@64
dtype: float64
- name: agg_scores
list: float64
- name: pred_weighted@1
dtype: string
- name: pred_maj@1
dtype: string
- name: pred_naive@1
dtype: string
- name: pred_weighted@2
dtype: string
- name: pred_maj@2
dtype: string
- name: pred_naive@2
dtype: string
- name: pred_weighted@4
dtype: string
- name: pred_maj@4
dtype: string
- name: pred_naive@4
dtype: string
- name: pred_weighted@8
dtype: string
- name: pred_maj@8
dtype: string
- name: pred_naive@8
dtype: string
- name: pred_weighted@16
dtype: string
- name: pred_maj@16
dtype: string
- name: pred_naive@16
dtype: string
- name: pred_weighted@32
dtype: string
- name: pred_maj@32
dtype: string
- name: pred_naive@32
dtype: string
- name: pred_weighted@64
dtype: string
- name: pred_maj@64
dtype: string
- name: pred_naive@64
dtype: string
splits:
- name: train
num_bytes: 55576272
num_examples: 500
download_size: 11303808
dataset_size: 55576272
configs:
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-256--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-256--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.06--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.06--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.1--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.1--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.14--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.18--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.18--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.22--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.22--entropy_agg-grad_weighted_mean/train-*
- config_name: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.26--entropy_agg-grad_weighted_mean
data_files:
- split: train
path: HuggingFaceH4_MATH-500--T-0.8--top_p-1.0--n-64--m-4--iters-40--look-0--seed-0--agg_strategy--last--entropy_alpha-0.26--entropy_agg-grad_weighted_mean/train-*
---
提供机构:
ENSEONG



