amanuelbyte/african-multilingual-translation-merged
收藏 | Hugging Face | 2026-02-02 更新 | 2026-03-29 收录
下载链接:
https://hf-mirror.com/datasets/amanuelbyte/african-multilingual-translation-merged
下载链接
链接失效反馈官方服务:
资源简介:
---
# Dataset card metadata: per-config schema/size information (`dataset_info`)
# followed by the mapping from each config to its data files (`configs`).
dataset_info:
# Merged config: one column per language plus `lang_pair`.
# Its num_examples (713382) equals the sum of the eight en-* configs below.
- config_name: default
  features:
  - name: en
    dtype: string
  - name: ha
    dtype: string
  - name: lang_pair
    dtype: string
  - name: yo
    dtype: string
  - name: zu
    dtype: string
  - name: arz
    dtype: string
  - name: wo
    dtype: string
  - name: af
    dtype: string
  - name: sw
    dtype: string
  - name: so
    dtype: string
  splits:
  - name: train
    num_bytes: 252042251
    num_examples: 713382
  download_size: 137121346
  dataset_size: 252042251
# Per-pair configs: each has `en`, one target-language column, and `lang_pair`.
- config_name: en-af
  features:
  - name: en
    dtype: string
  - name: af
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 38292399
    num_examples: 161644
  download_size: 24032623
  dataset_size: 38292399
- config_name: en-arz
  features:
  - name: en
    dtype: string
  - name: arz
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 69257920
    num_examples: 84170
  download_size: 38161575
  dataset_size: 69257920
- config_name: en-ha
  features:
  - name: en
    dtype: string
  - name: ha
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 50384319
    num_examples: 155881
  download_size: 31353602
  dataset_size: 50384319
- config_name: en-so
  features:
  - name: en
    dtype: string
  - name: so
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 12008726
    num_examples: 43657
  download_size: 6922120
  dataset_size: 12008726
- config_name: en-sw
  features:
  - name: en
    dtype: string
  - name: sw
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 36618867
    num_examples: 181045
  download_size: 21955758
  dataset_size: 36618867
# Note: this config name uses `wol`, while its target column is named `wo`.
- config_name: en-wol
  features:
  - name: en
    dtype: string
  - name: wo
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 6563684
    num_examples: 31170
  download_size: 3741528
  dataset_size: 6563684
- config_name: en-yo
  features:
  - name: en
    dtype: string
  - name: yo
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 6969249
    num_examples: 22626
  download_size: 4009629
  dataset_size: 6969249
- config_name: en-zu
  features:
  - name: en
    dtype: string
  - name: zu
    dtype: string
  - name: lang_pair
    dtype: string
  splits:
  - name: train
    num_bytes: 11348145
    num_examples: 33189
  download_size: 6994564
  dataset_size: 11348145
# File layout: every config exposes a single `train` split read from a
# glob under a directory named after the config (`data/` for `default`).
configs:
- config_name: default
  data_files:
  - split: train
    path: data/train-*
- config_name: en-af
  data_files:
  - split: train
    path: en-af/train-*
- config_name: en-arz
  data_files:
  - split: train
    path: en-arz/train-*
- config_name: en-ha
  data_files:
  - split: train
    path: en-ha/train-*
- config_name: en-so
  data_files:
  - split: train
    path: en-so/train-*
- config_name: en-sw
  data_files:
  - split: train
    path: en-sw/train-*
- config_name: en-wol
  data_files:
  - split: train
    path: en-wol/train-*
- config_name: en-yo
  data_files:
  - split: train
    path: en-yo/train-*
- config_name: en-zu
  data_files:
  - split: train
    path: en-zu/train-*
---
提供机构:
amanuelbyte



