omai-research/parallel_mmarco_query
收藏 | Hugging Face | 2026-03-18 更新 | 2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/omai-research/parallel_mmarco_query
下载链接
链接失效反馈官方服务:
资源简介:
---
# Per-config metadata: one entry per config_name (a language code).
# Every entry declares the same three string columns (id, english,
# non_english) and a single "train" split, followed by its size fields.
dataset_info:
- config_name: ar
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 88600888
    num_examples: 808260
  download_size: 39849109
  dataset_size: 88600888
- config_name: de
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 75869567
    num_examples: 802334
  download_size: 38142449
  dataset_size: 75869567
- config_name: es
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 78220534
    num_examples: 808731
  download_size: 38116874
  dataset_size: 78220534
- config_name: fr
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 79613641
    num_examples: 808731
  download_size: 38466446
  dataset_size: 79613641
- config_name: hi
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 119266572
    num_examples: 808730
  download_size: 45802571
  dataset_size: 119266572
- config_name: id
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 73613285
    num_examples: 808731
  download_size: 35794230
  dataset_size: 73613285
- config_name: it
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 76679431
    num_examples: 808731
  download_size: 37784301
  dataset_size: 76679431
- config_name: ja
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 82783201
    num_examples: 808731
  download_size: 38904588
  dataset_size: 82783201
- config_name: nl
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 74980220
    num_examples: 808731
  download_size: 36837854
  dataset_size: 74980220
- config_name: pt
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 76036729
    num_examples: 808731
  download_size: 37502252
  dataset_size: 76036729
- config_name: ru
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 99152481
    num_examples: 808731
  download_size: 43999455
  dataset_size: 99152481
- config_name: vi
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 82407365
    num_examples: 808731
  download_size: 38646494
  dataset_size: 82407365
- config_name: zh
  features:
  - name: id
    dtype: string
  - name: english
    dtype: string
  - name: non_english
    dtype: string
  splits:
  - name: train
    num_bytes: 68323213
    num_examples: 808731
  download_size: 35275415
  dataset_size: 68323213
# Maps each config_name to the files backing its "train" split,
# selected by the glob <config_name>/train-*.
configs:
- config_name: ar
  data_files:
  - split: train
    path: ar/train-*
- config_name: de
  data_files:
  - split: train
    path: de/train-*
- config_name: es
  data_files:
  - split: train
    path: es/train-*
- config_name: fr
  data_files:
  - split: train
    path: fr/train-*
- config_name: hi
  data_files:
  - split: train
    path: hi/train-*
- config_name: id
  data_files:
  - split: train
    path: id/train-*
- config_name: it
  data_files:
  - split: train
    path: it/train-*
- config_name: ja
  data_files:
  - split: train
    path: ja/train-*
- config_name: nl
  data_files:
  - split: train
    path: nl/train-*
- config_name: pt
  data_files:
  - split: train
    path: pt/train-*
- config_name: ru
  data_files:
  - split: train
    path: ru/train-*
- config_name: vi
  data_files:
  - split: train
    path: vi/train-*
- config_name: zh
  data_files:
  - split: train
    path: zh/train-*
---
提供机构:
omai-research



