Mantis-VL/MIQA_sample
收藏 · Hugging Face · 2024-04-18 更新 · 2024-06-22 收录
下载链接:
https://hf-mirror.com/datasets/Mantis-VL/MIQA_sample
下载链接
链接失效反馈 · 官方服务:
资源简介:
---
dataset_info:
- config_name: ai2d
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 20775020
num_examples: 100
download_size: 6169456
dataset_size: 20775020
- config_name: birds-to-words
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 52982608
num_examples: 100
- name: val
num_bytes: 46432837
num_examples: 100
download_size: 12218041
dataset_size: 99415445
- config_name: chartqa
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 4337107
num_examples: 100
download_size: 3068927
dataset_size: 4337107
- config_name: contrastive_caption
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 165093781
num_examples: 100
download_size: 164841716
dataset_size: 165093781
- config_name: dreamsim
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 306032936
num_examples: 100
- name: val
num_bytes: 311397198
num_examples: 100
download_size: 617404160
dataset_size: 617430134
- config_name: dvqa
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 2034018
num_examples: 100
download_size: 1926679
dataset_size: 2034018
- config_name: iconqa
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 2164110
num_examples: 100
download_size: 2131110
dataset_size: 2164110
- config_name: imagecode
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 666177106
num_examples: 100
download_size: 292302633
dataset_size: 666177106
- config_name: llava_665k_merged
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 108540294
num_examples: 100
download_size: 108356138
dataset_size: 108540294
- config_name: lrv
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 93669796
num_examples: 100
download_size: 93173296
dataset_size: 93669796
- config_name: nlvr2
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 181066810
num_examples: 100
- name: val
num_bytes: 149112471
num_examples: 100
download_size: 522012811
dataset_size: 330179281
- config_name: nlvr2_true
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 192702837
num_examples: 100
- name: val
num_bytes: 170950141
num_examples: 100
download_size: 313699742
dataset_size: 363652978
- config_name: spot-the-diff
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 19601605
num_examples: 100
download_size: 18313879
dataset_size: 19601605
- config_name: synthetic
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 182464879
num_examples: 100
download_size: 182400902
dataset_size: 182464879
- config_name: synthetic_from_caption
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 104823288
num_examples: 100
download_size: 104575349
dataset_size: 104823288
- config_name: visual_story_telling
features:
- name: id
dtype: string
- name: images
sequence:
image:
decode: false
- name: conversation
list:
- name: role
dtype: string
- name: content
dtype: string
- name: source
dtype: string
splits:
- name: train
num_bytes: 166151848
num_examples: 100
download_size: 166034399
dataset_size: 166151848
configs:
- config_name: ai2d
data_files:
- split: train
path: ai2d/train-*
- config_name: birds-to-words
data_files:
- split: train
path: birds-to-words/train-*
- split: val
path: birds-to-words/val-*
- config_name: chartqa
data_files:
- split: train
path: chartqa/train-*
- config_name: contrastive_caption
data_files:
- split: train
path: contrastive_caption/train-*
- config_name: dreamsim
data_files:
- split: train
path: dreamsim/train-*
- split: val
path: dreamsim/val-*
- config_name: dvqa
data_files:
- split: train
path: dvqa/train-*
- config_name: iconqa
data_files:
- split: train
path: iconqa/train-*
- config_name: imagecode
data_files:
- split: train
path: imagecode/train-*
- config_name: llava_665k_merged
data_files:
- split: train
path: llava_665k_merged/train-*
- config_name: lrv
data_files:
- split: train
path: lrv/train-*
- config_name: nlvr2
data_files:
- split: train
path: nlvr2/train-*
- split: val
path: nlvr2/val-*
- config_name: nlvr2_true
data_files:
- split: train
path: nlvr2_true/train-*
- split: val
path: nlvr2_true/val-*
- config_name: spot-the-diff
data_files:
- split: train
path: spot-the-diff/train-*
- config_name: synthetic
data_files:
- split: train
path: synthetic/train-*
- config_name: synthetic_from_caption
data_files:
- split: train
path: synthetic_from_caption/train-*
- config_name: visual_story_telling
data_files:
- split: train
path: visual_story_telling/train-*
---
提供机构:
Mantis-VL
原始信息汇总
数据集概述
数据集配置
ai2d
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 20775020 bytes
- 下载大小: 6169456 bytes
- 数据集大小: 20775020 bytes
birds-to-words
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 52982608 bytes
  - val: 100 examples, 46432837 bytes
- 下载大小: 12218041 bytes
- 数据集大小: 99415445 bytes
chartqa
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 4337107 bytes
- 下载大小: 3068927 bytes
- 数据集大小: 4337107 bytes
contrastive_caption
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 165093781 bytes
- 下载大小: 164841716 bytes
- 数据集大小: 165093781 bytes
dreamsim
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 306032936 bytes
  - val: 100 examples, 311397198 bytes
- 下载大小: 617404160 bytes
- 数据集大小: 617430134 bytes
dvqa
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 2034018 bytes
- 下载大小: 1926679 bytes
- 数据集大小: 2034018 bytes
iconqa
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 2164110 bytes
- 下载大小: 2131110 bytes
- 数据集大小: 2164110 bytes
imagecode
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 666177106 bytes
- 下载大小: 292302633 bytes
- 数据集大小: 666177106 bytes
llava_665k_merged
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 108540294 bytes
- 下载大小: 108356138 bytes
- 数据集大小: 108540294 bytes
lrv
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 93669796 bytes
- 下载大小: 93173296 bytes
- 数据集大小: 93669796 bytes
nlvr2
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 181066810 bytes
  - val: 100 examples, 149112471 bytes
- 下载大小: 522012811 bytes
- 数据集大小: 330179281 bytes
nlvr2_true
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 192702837 bytes
  - val: 100 examples, 170950141 bytes
- 下载大小: 313699742 bytes
- 数据集大小: 363652978 bytes
spot-the-diff
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 19601605 bytes
- 下载大小: 18313879 bytes
- 数据集大小: 19601605 bytes
synthetic
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 182464879 bytes
- 下载大小: 182400902 bytes
- 数据集大小: 182464879 bytes
synthetic_from_caption
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 104823288 bytes
- 下载大小: 104575349 bytes
- 数据集大小: 104823288 bytes
visual_story_telling
- 特征:
  - id: string
  - images: sequence of images (decode: false)
  - conversation: list of
    - role: string
    - content: string
  - source: string
- 分割:
  - train: 100 examples, 166151848 bytes
- 下载大小: 166034399 bytes
- 数据集大小: 166151848 bytes



