xudongwu/DPR_Pm3B_U10_beta0.10g0.30gamma0.30
收藏 | Hugging Face | 2026-04-27 更新 | 2026-05-03 收录
下载链接:
https://hf-mirror.com/datasets/xudongwu/DPR_Pm3B_U10_beta0.10g0.30gamma0.30
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: Pm3B
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 644108
    num_examples: 100
  download_size: 327130
  dataset_size: 644108
- config_name: Pm3B1e-1KL
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 395453
    num_examples: 100
  download_size: 232034
  dataset_size: 395453
- config_name: Pm3B1e-2KL
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 395950
    num_examples: 100
  download_size: 229822
  dataset_size: 395950
- config_name: Pm3B1e-3KL
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 407753
    num_examples: 100
  download_size: 227324
  dataset_size: 407753
- config_name: Pm3B_lr1e5
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 594129
    num_examples: 100
  download_size: 323526
  dataset_size: 594129
- config_name: Pm3B_lr1e5_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597142
    num_examples: 100
  download_size: 326634
  dataset_size: 597142
- config_name: Pm3B_lr1e5_rk1e-2
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 594391
    num_examples: 100
  download_size: 323698
  dataset_size: 594391
- config_name: Pm3B_lr1e5_rk1e-3
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 593395
    num_examples: 100
  download_size: 323072
  dataset_size: 593395
- config_name: Pm3B_lr1e6
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 595750
    num_examples: 100
  download_size: 322283
  dataset_size: 595750
- config_name: Pm3B_lr1e6_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 595763
    num_examples: 100
  download_size: 322309
  dataset_size: 595763
- config_name: Pm3B_lr2e6
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 592115
    num_examples: 100
  download_size: 322939
  dataset_size: 592115
- config_name: Pm3B_lr2e6_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 592529
    num_examples: 100
  download_size: 323092
  dataset_size: 592529
- config_name: Pm3B_lr4e6
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597569
    num_examples: 100
  download_size: 325063
  dataset_size: 597569
- config_name: Pm3B_lr4e6_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597172
    num_examples: 100
  download_size: 324738
  dataset_size: 597172
- config_name: Pm3B_lr6e6
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597768
    num_examples: 100
  download_size: 326836
  dataset_size: 597768
- config_name: Pm3B_lr6e6_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 595661
    num_examples: 100
  download_size: 326058
  dataset_size: 595661
- config_name: Pm3B_lr6e6_rk1e-2
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597700
    num_examples: 100
  download_size: 326833
  dataset_size: 597700
- config_name: Pm3B_lr6e6_rk1e-3
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 597781
    num_examples: 100
  download_size: 326859
  dataset_size: 597781
- config_name: Pm3B_lr9e6
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 594048
    num_examples: 100
  download_size: 322099
  dataset_size: 594048
- config_name: Pm3B_lr9e6_rk1e-1
  features:
  - name: prompt
    dtype: string
  - name: chosen
    dtype: string
  - name: rejected
    dtype: string
  - name: response
    dtype: string
  - name: reward_score
    dtype: float64
  - name: gpt_score
    dtype: float64
  splits:
  - name: default
    num_bytes: 596091
    num_examples: 100
  download_size: 323532
  dataset_size: 596091
configs:
- config_name: Pm3B
  data_files:
  - split: default
    path: Pm3B/default-*
- config_name: Pm3B1e-1KL
  data_files:
  - split: default
    path: Pm3B1e-1KL/default-*
- config_name: Pm3B1e-2KL
  data_files:
  - split: default
    path: Pm3B1e-2KL/default-*
- config_name: Pm3B1e-3KL
  data_files:
  - split: default
    path: Pm3B1e-3KL/default-*
- config_name: Pm3B_lr1e5
  data_files:
  - split: default
    path: Pm3B_lr1e5/default-*
- config_name: Pm3B_lr1e5_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr1e5_rk1e-1/default-*
- config_name: Pm3B_lr1e5_rk1e-2
  data_files:
  - split: default
    path: Pm3B_lr1e5_rk1e-2/default-*
- config_name: Pm3B_lr1e5_rk1e-3
  data_files:
  - split: default
    path: Pm3B_lr1e5_rk1e-3/default-*
- config_name: Pm3B_lr1e6
  data_files:
  - split: default
    path: Pm3B_lr1e6/default-*
- config_name: Pm3B_lr1e6_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr1e6_rk1e-1/default-*
- config_name: Pm3B_lr2e6
  data_files:
  - split: default
    path: Pm3B_lr2e6/default-*
- config_name: Pm3B_lr2e6_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr2e6_rk1e-1/default-*
- config_name: Pm3B_lr4e6
  data_files:
  - split: default
    path: Pm3B_lr4e6/default-*
- config_name: Pm3B_lr4e6_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr4e6_rk1e-1/default-*
- config_name: Pm3B_lr6e6
  data_files:
  - split: default
    path: Pm3B_lr6e6/default-*
- config_name: Pm3B_lr6e6_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr6e6_rk1e-1/default-*
- config_name: Pm3B_lr6e6_rk1e-2
  data_files:
  - split: default
    path: Pm3B_lr6e6_rk1e-2/default-*
- config_name: Pm3B_lr6e6_rk1e-3
  data_files:
  - split: default
    path: Pm3B_lr6e6_rk1e-3/default-*
- config_name: Pm3B_lr9e6
  data_files:
  - split: default
    path: Pm3B_lr9e6/default-*
- config_name: Pm3B_lr9e6_rk1e-1
  data_files:
  - split: default
    path: Pm3B_lr9e6_rk1e-1/default-*
---
提供机构:
xudongwu



