RyanYr/grpo-dapo_shuffled-02_offline-grpo-dapo-qwen3-1.7B-Base-mbs128-n4-mbs128-n4_matheval
收藏 | Hugging Face | 2026-04-25 更新 | 2026-05-03 收录
下载链接:
https://hf-mirror.com/datasets/RyanYr/grpo-dapo_shuffled-02_offline-grpo-dapo-qwen3-1.7B-Base-mbs128-n4-mbs128-n4_matheval
下载链接
链接失效反馈官方服务:
资源简介:
---
# Dataset card metadata: column schema, per-split statistics, and the
# mapping from split names to data files.
dataset_info:
  # Columns present in every example.
  features:
  - name: data_source
    dtype: string
  - name: problem
    dtype: string
  - name: solution
    dtype: string
  - name: answer
    dtype: string
  # List of messages, each with a `role` and a `content` string.
  - name: prompt
    list:
    - name: role
      dtype: string
    - name: content
      dtype: string
  - name: reward_model
    struct:
    - name: ground_truth
      dtype: string
    - name: style
      dtype: string
  # List of strings.
  - name: responses
    list: string
  # One `mixed.N` and one `hard.N` split for each N in 100, 90, ..., 10.
  # Every `mixed.*` split has 1447 examples; every `hard.*` split has 100.
  splits:
  - name: mixed.100
    num_bytes: 34944964
    num_examples: 1447
  - name: hard.100
    num_bytes: 49537284
    num_examples: 100
  - name: mixed.90
    num_bytes: 31384493
    num_examples: 1447
  - name: hard.90
    num_bytes: 48357788
    num_examples: 100
  - name: mixed.80
    num_bytes: 30970674
    num_examples: 1447
  - name: hard.80
    num_bytes: 47055783
    num_examples: 100
  - name: mixed.70
    num_bytes: 30850570
    num_examples: 1447
  - name: hard.70
    num_bytes: 42870921
    num_examples: 100
  - name: mixed.60
    num_bytes: 33352578
    num_examples: 1447
  - name: hard.60
    num_bytes: 36558434
    num_examples: 100
  - name: mixed.50
    num_bytes: 26299787
    num_examples: 1447
  - name: hard.50
    num_bytes: 34536650
    num_examples: 100
  - name: mixed.40
    num_bytes: 19748549
    num_examples: 1447
  - name: hard.40
    num_bytes: 32833269
    num_examples: 100
  - name: mixed.30
    num_bytes: 8242993
    num_examples: 1447
  - name: hard.30
    num_bytes: 24542506
    num_examples: 100
  - name: mixed.20
    num_bytes: 9638588
    num_examples: 1447
  - name: hard.20
    num_bytes: 28312111
    num_examples: 100
  - name: mixed.10
    num_bytes: 7955543
    num_examples: 1447
  - name: hard.10
    num_bytes: 17058618
    num_examples: 100
  download_size: 584658806
  # Equals the sum of `num_bytes` over all splits listed above.
  dataset_size: 595052103
configs:
- config_name: default
  # Each split is read from the files matching `data/<split name>-*`.
  data_files:
  - split: mixed.100
    path: data/mixed.100-*
  - split: hard.100
    path: data/hard.100-*
  - split: mixed.90
    path: data/mixed.90-*
  - split: hard.90
    path: data/hard.90-*
  - split: mixed.80
    path: data/mixed.80-*
  - split: hard.80
    path: data/hard.80-*
  - split: mixed.70
    path: data/mixed.70-*
  - split: hard.70
    path: data/hard.70-*
  - split: mixed.60
    path: data/mixed.60-*
  - split: hard.60
    path: data/hard.60-*
  - split: mixed.50
    path: data/mixed.50-*
  - split: hard.50
    path: data/hard.50-*
  - split: mixed.40
    path: data/mixed.40-*
  - split: hard.40
    path: data/hard.40-*
  - split: mixed.30
    path: data/mixed.30-*
  - split: hard.30
    path: data/hard.30-*
  - split: mixed.20
    path: data/mixed.20-*
  - split: hard.20
    path: data/hard.20-*
  - split: mixed.10
    path: data/mixed.10-*
  - split: hard.10
    path: data/hard.10-*
---
提供机构:
RyanYr



