RyanYr/pg-dapo_ordered-0_offline-grpo-dapo-qwen3-4B-Base-mbs128-n4-mbs128-n4_matheval
收藏 · Hugging Face · 2026-04-23 更新 · 2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/RyanYr/pg-dapo_ordered-0_offline-grpo-dapo-qwen3-4B-Base-mbs128-n4-mbs128-n4_matheval
下载链接
链接失效反馈官方服务:
资源简介:
---
# Hugging Face dataset-card metadata (YAML front matter).
# The nesting below was restored from a flattened copy in which every line
# sat at column 0; all keys and scalar values are unchanged.
# NOTE(review): confirm the restored nesting against the upstream card.
dataset_info:
  # Column schema: one entry per feature.
  features:
  - name: data_source
    dtype: string
  - name: problem
    dtype: string
  - name: solution
    dtype: string
  - name: answer
    dtype: string
  # List of records, each with string fields `role` and `content`.
  - name: prompt
    list:
    - name: role
      dtype: string
    - name: content
      dtype: string
  # Struct with string fields `ground_truth` and `style`.
  - name: reward_model
    struct:
    - name: ground_truth
      dtype: string
    - name: style
      dtype: string
  # NOTE(review): placed as a top-level feature rather than a member of
  # `reward_model` -- the flattened text cannot distinguish the two; confirm.
  - name: responses
    list: string
  # 15 splits: mixed.N for N = 90..20 and hard.N for N = 90..30 (no hard.20
  # entry is listed). Every mixed.* split has 1447 examples; every hard.*
  # split has 100.
  splits:
  - name: mixed.90
    num_bytes: 27841144
    num_examples: 1447
  - name: hard.90
    num_bytes: 54930755
    num_examples: 100
  - name: mixed.80
    num_bytes: 28627672
    num_examples: 1447
  - name: hard.80
    num_bytes: 55542725
    num_examples: 100
  - name: mixed.70
    num_bytes: 28253643
    num_examples: 1447
  - name: hard.70
    num_bytes: 53299260
    num_examples: 100
  - name: mixed.60
    num_bytes: 31474158
    num_examples: 1447
  - name: hard.60
    num_bytes: 51668684
    num_examples: 100
  - name: mixed.50
    num_bytes: 33780138
    num_examples: 1447
  - name: hard.50
    num_bytes: 50089322
    num_examples: 100
  - name: mixed.40
    num_bytes: 27595511
    num_examples: 1447
  - name: hard.40
    num_bytes: 47220854
    num_examples: 100
  - name: mixed.30
    num_bytes: 29744862
    num_examples: 1447
  - name: hard.30
    num_bytes: 50048103
    num_examples: 100
  - name: mixed.20
    num_bytes: 25206793
    num_examples: 1447
  download_size: 587112465
  # Equals the sum of the 15 `num_bytes` values listed under `splits`.
  dataset_size: 595323624
# A single config, `default`, mapping each split name to its file glob.
configs:
- config_name: default
  data_files:
  - split: mixed.90
    path: data/mixed.90-*
  - split: hard.90
    path: data/hard.90-*
  - split: mixed.80
    path: data/mixed.80-*
  - split: hard.80
    path: data/hard.80-*
  - split: mixed.70
    path: data/mixed.70-*
  - split: hard.70
    path: data/hard.70-*
  - split: mixed.60
    path: data/mixed.60-*
  - split: hard.60
    path: data/hard.60-*
  - split: mixed.50
    path: data/mixed.50-*
  - split: hard.50
    path: data/hard.50-*
  - split: mixed.40
    path: data/mixed.40-*
  - split: hard.40
    path: data/hard.40-*
  - split: mixed.30
    path: data/mixed.30-*
  - split: hard.30
    path: data/hard.30-*
  - split: mixed.20
    path: data/mixed.20-*
---
提供机构:
RyanYr



