RyanYr/grpo-dapo_ordered-01_offline-grpo-dapo-qwen3-1.7B-Base-mbs128-n4-mbs128-n4_matheval
收藏 | Hugging Face | 2026-04-24 更新 | 2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/RyanYr/grpo-dapo_ordered-01_offline-grpo-dapo-qwen3-1.7B-Base-mbs128-n4-mbs128-n4_matheval
下载链接
链接失效反馈官方服务:
资源简介:
---
# Dataset schema and per-split statistics.
dataset_info:
  # Column schema: each entry has a name and either a scalar dtype or a
  # nested list/struct of sub-fields.
  features:
  - name: data_source
    dtype: string
  - name: problem
    dtype: string
  - name: solution
    dtype: string
  - name: answer
    dtype: string
  # prompt is a list of records, each with string fields role and content.
  - name: prompt
    list:
    - name: role
      dtype: string
    - name: content
      dtype: string
  # reward_model is a struct with string fields ground_truth and style.
  - name: reward_model
    struct:
    - name: ground_truth
      dtype: string
    - name: style
      dtype: string
  # responses is a list of strings.
  - name: responses
    list: string
  # One entry per split. Every mixed.* split lists 1447 examples and every
  # hard.* split lists 100; there is a mixed.95 split but no hard.95 entry.
  splits:
  - name: mixed.90
    num_bytes: 38337875
    num_examples: 1447
  - name: hard.90
    num_bytes: 52914131
    num_examples: 100
  - name: mixed.80
    num_bytes: 33410089
    num_examples: 1447
  - name: hard.80
    num_bytes: 51195205
    num_examples: 100
  - name: mixed.70
    num_bytes: 37116577
    num_examples: 1447
  - name: hard.70
    num_bytes: 47181298
    num_examples: 100
  - name: mixed.60
    num_bytes: 27193719
    num_examples: 1447
  - name: hard.60
    num_bytes: 40918608
    num_examples: 100
  - name: mixed.50
    num_bytes: 23557379
    num_examples: 1447
  - name: hard.50
    num_bytes: 38563563
    num_examples: 100
  - name: mixed.40
    num_bytes: 17096676
    num_examples: 1447
  - name: hard.40
    num_bytes: 38022371
    num_examples: 100
  - name: mixed.30
    num_bytes: 9887917
    num_examples: 1447
  - name: hard.30
    num_bytes: 26093948
    num_examples: 100
  - name: mixed.20
    num_bytes: 12316555
    num_examples: 1447
  - name: hard.20
    num_bytes: 26812485
    num_examples: 100
  - name: mixed.10
    num_bytes: 8708057
    num_examples: 1447
  - name: hard.10
    num_bytes: 17660083
    num_examples: 100
  - name: mixed.100
    num_bytes: 30904507
    num_examples: 1447
  - name: hard.100
    num_bytes: 53026529
    num_examples: 100
  - name: mixed.95
    num_bytes: 34289199
    num_examples: 1447
  # NOTE(review): download_size is presumably the on-disk size of the data
  # files in bytes; confirm against the hosting service.
  download_size: 653872829
  # dataset_size equals the sum of num_bytes over all splits listed above.
  dataset_size: 665206771
# A single config named "default"; each split is mapped to a glob of data
# files under data/ whose names start with the split name.
configs:
- config_name: default
  data_files:
  - split: mixed.90
    path: data/mixed.90-*
  - split: hard.90
    path: data/hard.90-*
  - split: mixed.80
    path: data/mixed.80-*
  - split: hard.80
    path: data/hard.80-*
  - split: mixed.70
    path: data/mixed.70-*
  - split: hard.70
    path: data/hard.70-*
  - split: mixed.60
    path: data/mixed.60-*
  - split: hard.60
    path: data/hard.60-*
  - split: mixed.50
    path: data/mixed.50-*
  - split: hard.50
    path: data/hard.50-*
  - split: mixed.40
    path: data/mixed.40-*
  - split: hard.40
    path: data/hard.40-*
  - split: mixed.30
    path: data/mixed.30-*
  - split: hard.30
    path: data/hard.30-*
  - split: mixed.20
    path: data/mixed.20-*
  - split: hard.20
    path: data/hard.20-*
  - split: mixed.10
    path: data/mixed.10-*
  - split: hard.10
    path: data/hard.10-*
  - split: mixed.100
    path: data/mixed.100-*
  - split: hard.100
    path: data/hard.100-*
  - split: mixed.95
    path: data/mixed.95-*
---
提供机构:
RyanYr



