RyanYr/pg-dapo_ordered-01_offline-grpo-dapo-qwen3-4B-Base-mbs128-n4-mbs128-n4_matheval
收藏 | Hugging Face | 2026-04-23 更新 | 2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/RyanYr/pg-dapo_ordered-01_offline-grpo-dapo-qwen3-4B-Base-mbs128-n4-mbs128-n4_matheval
下载链接
链接失效反馈 | 官方服务:
资源简介:
---
# Dataset card metadata: the per-example feature schema, the size of every
# split, and the file globs that map each split to its data files.
dataset_info:
  # Columns present in every example.
  features:
    - name: data_source
      dtype: string
    - name: problem
      dtype: string
    - name: solution
      dtype: string
    - name: answer
      dtype: string
    # List of records, each carrying a `role` and a `content` string.
    - name: prompt
      list:
        - name: role
          dtype: string
        - name: content
          dtype: string
    # Nested record with `ground_truth` and `style` string fields.
    - name: reward_model
      struct:
        - name: ground_truth
          dtype: string
        - name: style
          dtype: string
    # List of strings.
    - name: responses
      list: string
  # Splits come in mixed/hard pairs with suffixes .90 down to .10.
  # Every `mixed.*` split has 1447 examples; every `hard.*` split has 100.
  splits:
    - name: mixed.90
      num_bytes: 27206019
      num_examples: 1447
    - name: hard.90
      num_bytes: 55970957
      num_examples: 100
    - name: mixed.80
      num_bytes: 26721484
      num_examples: 1447
    - name: hard.80
      num_bytes: 57092010
      num_examples: 100
    - name: mixed.70
      num_bytes: 26800332
      num_examples: 1447
    - name: hard.70
      num_bytes: 56282983
      num_examples: 100
    - name: mixed.60
      num_bytes: 28071113
      num_examples: 1447
    - name: hard.60
      num_bytes: 54646363
      num_examples: 100
    - name: mixed.50
      num_bytes: 31536926
      num_examples: 1447
    - name: hard.50
      num_bytes: 51774095
      num_examples: 100
    - name: mixed.40
      num_bytes: 30391803
      num_examples: 1447
    - name: hard.40
      num_bytes: 48588656
      num_examples: 100
    - name: mixed.30
      num_bytes: 29576031
      num_examples: 1447
    - name: hard.30
      num_bytes: 50257335
      num_examples: 100
    - name: mixed.20
      num_bytes: 30951759
      num_examples: 1447
    - name: hard.20
      num_bytes: 48744073
      num_examples: 100
    - name: mixed.10
      num_bytes: 18205355
      num_examples: 1447
    - name: hard.10
      num_bytes: 41777854
      num_examples: 100
  download_size: 705256093
  # Equals the sum of `num_bytes` over the 18 splits listed above.
  dataset_size: 714595148
configs:
  # Single configuration; each split is resolved from a `data/<split>-*` glob.
  - config_name: default
    data_files:
      - split: mixed.90
        path: data/mixed.90-*
      - split: hard.90
        path: data/hard.90-*
      - split: mixed.80
        path: data/mixed.80-*
      - split: hard.80
        path: data/hard.80-*
      - split: mixed.70
        path: data/mixed.70-*
      - split: hard.70
        path: data/hard.70-*
      - split: mixed.60
        path: data/mixed.60-*
      - split: hard.60
        path: data/hard.60-*
      - split: mixed.50
        path: data/mixed.50-*
      - split: hard.50
        path: data/hard.50-*
      - split: mixed.40
        path: data/mixed.40-*
      - split: hard.40
        path: data/hard.40-*
      - split: mixed.30
        path: data/mixed.30-*
      - split: hard.30
        path: data/hard.30-*
      - split: mixed.20
        path: data/mixed.20-*
      - split: hard.20
        path: data/hard.20-*
      - split: mixed.10
        path: data/mixed.10-*
      - split: hard.10
        path: data/hard.10-*
---
提供机构:
RyanYr



