MLLM-CL/_MLLM_CL_10_percent_noicl
收藏 | Hugging Face | 2026-03-25 更新 | 2026-03-29 收录
下载链接:
https://hf-mirror.com/datasets/MLLM-CL/_MLLM_CL_10_percent_noicl
下载链接
链接失效反馈 | 官方服务:
资源简介:
---
# Per-config schema and split statistics, one entry per config_name.
# In every entry, dataset_size equals the sum of the three splits' num_bytes.
dataset_info:
- config_name: AD
  features:
  - name: question_id
    dtype: string
  - name: answer
    dtype: string
  - name: images
    list: image
  - name: problem
    dtype: string
  - name: messages_noicl
    list:
    - name: content
      dtype: string
    - name: role
      dtype: string
  splits:
  - name: train
    num_bytes: 109212284
    num_examples: 5400
  - name: val
    num_bytes: 121304530
    num_examples: 6000
  - name: test
    num_bytes: 202195277
    num_examples: 10000
  download_size: 425119979
  dataset_size: 432712091
- config_name: Fin
  features:
  - name: question_id
    dtype: string
  - name: answer
    dtype: string
  - name: images
    list: image
  - name: problem
    dtype: string
  # NOTE(review): _drop appears only in the Fin and Sci configs - confirm it
  # is intended to be part of the published schema.
  - name: _drop
    dtype: bool
  - name: messages_noicl
    list:
    - name: content
      dtype: string
    - name: role
      dtype: string
  splits:
  - name: train
    num_bytes: 60538293
    num_examples: 2610
  - name: val
    num_bytes: 67715421
    num_examples: 2929
  - name: test
    num_bytes: 232399980
    num_examples: 10000
  download_size: 356602056
  dataset_size: 360653694
- config_name: Med
  features:
  - name: question_id
    dtype: string
  - name: answer
    dtype: string
  - name: images
    list: image
  - name: problem
    dtype: string
  - name: messages_noicl
    list:
    - name: content
      dtype: string
    - name: role
      dtype: string
  splits:
  - name: train
    num_bytes: 72621437
    num_examples: 2056
  - name: val
    num_bytes: 80922960
    num_examples: 2285
  - name: test
    num_bytes: 350138897
    num_examples: 9790
  download_size: 503121205
  dataset_size: 503683294
- config_name: RS
  features:
  # NOTE(review): question_id is int64 here but string in every other
  # config - confirm the mismatch is intended.
  - name: question_id
    dtype: int64
  - name: answer
    dtype: string
  - name: images
    list: image
  - name: problem
    dtype: string
  - name: messages_noicl
    list:
    - name: content
      dtype: string
    - name: role
      dtype: string
  splits:
  - name: train
    num_bytes: 254320906
    num_examples: 5400
  - name: val
    num_bytes: 283179122
    num_examples: 6000
  - name: test
    num_bytes: 467561784
    num_examples: 10000
  download_size: 1003359287
  dataset_size: 1005061812
- config_name: Sci
  features:
  - name: answer
    dtype: string
  - name: question_id
    dtype: string
  - name: images
    list: image
  - name: problem
    dtype: string
  # NOTE(review): _drop appears only in the Fin and Sci configs - confirm it
  # is intended to be part of the published schema.
  - name: _drop
    dtype: bool
  - name: messages_noicl
    list:
    - name: content
      dtype: string
    - name: role
      dtype: string
  splits:
  - name: train
    num_bytes: 65010067
    num_examples: 2768
  - name: val
    num_bytes: 72341159
    num_examples: 3075
  - name: test
    num_bytes: 181342560
    num_examples: 7687
  download_size: 317163133
  dataset_size: 318693786
# Maps each config to the path patterns backing its train/val/test splits.
# Each config's files sit under a directory named after the config.
configs:
- config_name: AD
  data_files:
  - split: train
    path: AD/train-*
  - split: val
    path: AD/val-*
  - split: test
    path: AD/test-*
- config_name: Fin
  data_files:
  - split: train
    path: Fin/train-*
  - split: val
    path: Fin/val-*
  - split: test
    path: Fin/test-*
- config_name: Med
  data_files:
  - split: train
    path: Med/train-*
  - split: val
    path: Med/val-*
  - split: test
    path: Med/test-*
- config_name: RS
  data_files:
  - split: train
    path: RS/train-*
  - split: val
    path: RS/val-*
  - split: test
    path: RS/test-*
- config_name: Sci
  data_files:
  - split: train
    path: Sci/train-*
  - split: val
    path: Sci/val-*
  - split: test
    path: Sci/test-*
---
提供机构:
MLLM-CL



