Scicom-intl/Evaluation-Multilingual-VC
收藏Hugging Face2026-04-08 更新2026-04-05 收录
下载链接:
https://hf-mirror.com/datasets/Scicom-intl/Evaluation-Multilingual-VC
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: af
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 43171
num_examples: 131
download_size: 26894
dataset_size: 43171
- config_name: am
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 111762
num_examples: 252
download_size: 52103
dataset_size: 111762
- config_name: ar
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 153332
num_examples: 500
download_size: 78928
dataset_size: 153332
- config_name: as
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 168833
num_examples: 379
download_size: 67550
dataset_size: 168833
- config_name: az
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 31429
num_examples: 95
download_size: 20500
dataset_size: 31429
- config_name: ba
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 173784
num_examples: 500
download_size: 95186
dataset_size: 173784
- config_name: be
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 211146
num_examples: 500
download_size: 142100
dataset_size: 211146
- config_name: bg
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 199362
num_examples: 500
download_size: 83163
dataset_size: 199362
- config_name: bn
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 259922
num_examples: 500
download_size: 154522
dataset_size: 259922
- config_name: br
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 124718
num_examples: 500
download_size: 48360
dataset_size: 124718
- config_name: ca
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154756
num_examples: 500
download_size: 106709
dataset_size: 154756
- config_name: combine_filtered_whisper_large_v3
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
- name: __index_level_0__
dtype: int64
splits:
- name: train
num_bytes: 11750786
num_examples: 34142
download_size: 5707734
dataset_size: 11750786
- config_name: cs
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 150414
num_examples: 500
download_size: 79034
dataset_size: 150414
- config_name: cy
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 140916
num_examples: 500
download_size: 83342
dataset_size: 140916
- config_name: da
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 141496
num_examples: 500
download_size: 60567
dataset_size: 141496
- config_name: de
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 157780
num_examples: 500
download_size: 96637
dataset_size: 157780
- config_name: el
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 164978
num_examples: 500
download_size: 70737
dataset_size: 164978
- config_name: en
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154956
num_examples: 500
download_size: 123429
dataset_size: 154956
- config_name: es
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 159310
num_examples: 500
download_size: 127634
dataset_size: 159310
- config_name: et
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 192432
num_examples: 500
download_size: 115598
dataset_size: 192432
- config_name: eu
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 157874
num_examples: 500
download_size: 121857
dataset_size: 157874
- config_name: fa
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 164342
num_examples: 500
download_size: 107535
dataset_size: 164342
- config_name: fi
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 150388
num_examples: 500
download_size: 68045
dataset_size: 150388
- config_name: fr
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 159688
num_examples: 500
download_size: 101578
dataset_size: 159688
- config_name: gl
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 151134
num_examples: 500
download_size: 113306
dataset_size: 151134
- config_name: ha
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 138696
num_examples: 500
download_size: 54484
dataset_size: 138696
- config_name: he
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 143348
num_examples: 392
download_size: 64484
dataset_size: 143348
- config_name: hi
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 196502
num_examples: 500
download_size: 78253
dataset_size: 196502
- config_name: ht
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 1335
num_examples: 5
download_size: 4497
dataset_size: 1335
- config_name: hu
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 157988
num_examples: 500
download_size: 75134
dataset_size: 157988
- config_name: hy-AM
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 210470
num_examples: 500
download_size: 86716
dataset_size: 210470
- config_name: id
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 135458
num_examples: 500
download_size: 62223
dataset_size: 135458
- config_name: is
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 2949
num_examples: 9
download_size: 5789
dataset_size: 2949
- config_name: it
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 161018
num_examples: 500
download_size: 117370
dataset_size: 161018
- config_name: ja
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154228
num_examples: 500
download_size: 114670
dataset_size: 154228
- config_name: ka
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 267546
num_examples: 500
download_size: 99309
dataset_size: 267546
- config_name: kk
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 170704
num_examples: 500
download_size: 74734
dataset_size: 170704
- config_name: ko
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 157144
num_examples: 472
download_size: 76690
dataset_size: 157144
- config_name: lo
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 12716
num_examples: 26
download_size: 10533
dataset_size: 12716
- config_name: lt
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154422
num_examples: 500
download_size: 74269
dataset_size: 154422
- config_name: lv
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 144804
num_examples: 500
download_size: 97059
dataset_size: 144804
- config_name: mk
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 195724
num_examples: 500
download_size: 86164
dataset_size: 195724
- config_name: ml
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 220380
num_examples: 500
download_size: 81007
dataset_size: 220380
- config_name: mn
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 212668
num_examples: 500
download_size: 104772
dataset_size: 212668
- config_name: mr
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 261024
num_examples: 500
download_size: 98828
dataset_size: 261024
- config_name: mt
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 149290
num_examples: 500
download_size: 67310
dataset_size: 149290
- config_name: ne-NP
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 108282
num_examples: 287
download_size: 43784
dataset_size: 108282
- config_name: nl
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 157258
num_examples: 500
download_size: 72000
dataset_size: 157258
- config_name: nn-NO
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 119872
num_examples: 423
download_size: 50899
dataset_size: 119872
- config_name: oc
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 77096
num_examples: 274
download_size: 44681
dataset_size: 77096
- config_name: pa-IN
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 184206
num_examples: 500
download_size: 68472
dataset_size: 184206
- config_name: pl
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 148288
num_examples: 500
download_size: 107231
dataset_size: 148288
- config_name: ps
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 163576
num_examples: 500
download_size: 82090
dataset_size: 163576
- config_name: pt
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 136488
num_examples: 500
download_size: 85595
dataset_size: 136488
- config_name: ro
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 144052
num_examples: 500
download_size: 61955
dataset_size: 144052
- config_name: ru
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 194342
num_examples: 500
download_size: 99263
dataset_size: 194342
- config_name: sd
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 13140
num_examples: 40
download_size: 10094
dataset_size: 13140
- config_name: sk
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 128640
num_examples: 500
download_size: 58544
dataset_size: 128640
- config_name: sl
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 130246
num_examples: 500
download_size: 75838
dataset_size: 130246
- config_name: sq
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154310
num_examples: 500
download_size: 67317
dataset_size: 154310
- config_name: sr
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 133670
num_examples: 500
download_size: 50678
dataset_size: 133670
- config_name: sv-SE
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 135556
num_examples: 500
download_size: 61512
dataset_size: 135556
- config_name: sw
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 151132
num_examples: 500
download_size: 89571
dataset_size: 151132
- config_name: ta
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 271944
num_examples: 500
download_size: 104866
dataset_size: 271944
- config_name: te
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 24254
num_examples: 66
download_size: 15702
dataset_size: 24254
- config_name: tg
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 23429
num_examples: 69
download_size: 13999
dataset_size: 23429
- config_name: th
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 198024
num_examples: 500
download_size: 120588
dataset_size: 198024
- config_name: tk
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 156434
num_examples: 500
download_size: 73494
dataset_size: 156434
- config_name: tr
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 136928
num_examples: 500
download_size: 58023
dataset_size: 136928
- config_name: tt
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 166124
num_examples: 500
download_size: 68140
dataset_size: 166124
- config_name: uk
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 168632
num_examples: 500
download_size: 70160
dataset_size: 168632
- config_name: ur
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 169392
num_examples: 500
download_size: 83520
dataset_size: 169392
- config_name: uz
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 152696
num_examples: 500
download_size: 86881
dataset_size: 152696
- config_name: vi
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 137488
num_examples: 500
download_size: 57518
dataset_size: 137488
- config_name: yi
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 77794
num_examples: 222
download_size: 37069
dataset_size: 77794
- config_name: yo
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 179016
num_examples: 500
download_size: 79252
dataset_size: 179016
- config_name: zh-CN
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 154040
num_examples: 500
download_size: 112578
dataset_size: 154040
- config_name: zh-HK
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 132888
num_examples: 500
download_size: 69061
dataset_size: 132888
- config_name: zh-TW
features:
- name: language
dtype: string
- name: source_text
dtype: string
- name: target_text
dtype: string
- name: upvotes
dtype: int64
- name: speaker_id
dtype: string
- name: audio_filename
dtype: string
splits:
- name: train
num_bytes: 122076
num_examples: 500
download_size: 63304
dataset_size: 122076
configs:
- config_name: af
data_files:
- split: train
path: af/train-*
- config_name: am
data_files:
- split: train
path: am/train-*
- config_name: ar
data_files:
- split: train
path: ar/train-*
- config_name: as
data_files:
- split: train
path: as/train-*
- config_name: az
data_files:
- split: train
path: az/train-*
- config_name: ba
data_files:
- split: train
path: ba/train-*
- config_name: be
data_files:
- split: train
path: be/train-*
- config_name: bg
data_files:
- split: train
path: bg/train-*
- config_name: bn
data_files:
- split: train
path: bn/train-*
- config_name: br
data_files:
- split: train
path: br/train-*
- config_name: ca
data_files:
- split: train
path: ca/train-*
- config_name: combine_filtered_whisper_large_v3
data_files:
- split: train
path: combine_filtered_whisper_large_v3/train-*
- config_name: cs
data_files:
- split: train
path: cs/train-*
- config_name: cy
data_files:
- split: train
path: cy/train-*
- config_name: da
data_files:
- split: train
path: da/train-*
- config_name: de
data_files:
- split: train
path: de/train-*
- config_name: el
data_files:
- split: train
path: el/train-*
- config_name: en
data_files:
- split: train
path: en/train-*
- config_name: es
data_files:
- split: train
path: es/train-*
- config_name: et
data_files:
- split: train
path: et/train-*
- config_name: eu
data_files:
- split: train
path: eu/train-*
- config_name: fa
data_files:
- split: train
path: fa/train-*
- config_name: fi
data_files:
- split: train
path: fi/train-*
- config_name: fr
data_files:
- split: train
path: fr/train-*
- config_name: gl
data_files:
- split: train
path: gl/train-*
- config_name: ha
data_files:
- split: train
path: ha/train-*
- config_name: he
data_files:
- split: train
path: he/train-*
- config_name: hi
data_files:
- split: train
path: hi/train-*
- config_name: ht
data_files:
- split: train
path: ht/train-*
- config_name: hu
data_files:
- split: train
path: hu/train-*
- config_name: hy-AM
data_files:
- split: train
path: hy-AM/train-*
- config_name: id
data_files:
- split: train
path: id/train-*
- config_name: is
data_files:
- split: train
path: is/train-*
- config_name: it
data_files:
- split: train
path: it/train-*
- config_name: ja
data_files:
- split: train
path: ja/train-*
- config_name: ka
data_files:
- split: train
path: ka/train-*
- config_name: kk
data_files:
- split: train
path: kk/train-*
- config_name: ko
data_files:
- split: train
path: ko/train-*
- config_name: lo
data_files:
- split: train
path: lo/train-*
- config_name: lt
data_files:
- split: train
path: lt/train-*
- config_name: lv
data_files:
- split: train
path: lv/train-*
- config_name: mk
data_files:
- split: train
path: mk/train-*
- config_name: ml
data_files:
- split: train
path: ml/train-*
- config_name: mn
data_files:
- split: train
path: mn/train-*
- config_name: mr
data_files:
- split: train
path: mr/train-*
- config_name: mt
data_files:
- split: train
path: mt/train-*
- config_name: ne-NP
data_files:
- split: train
path: ne-NP/train-*
- config_name: nl
data_files:
- split: train
path: nl/train-*
- config_name: nn-NO
data_files:
- split: train
path: nn-NO/train-*
- config_name: oc
data_files:
- split: train
path: oc/train-*
- config_name: pa-IN
data_files:
- split: train
path: pa-IN/train-*
- config_name: pl
data_files:
- split: train
path: pl/train-*
- config_name: ps
data_files:
- split: train
path: ps/train-*
- config_name: pt
data_files:
- split: train
path: pt/train-*
- config_name: ro
data_files:
- split: train
path: ro/train-*
- config_name: ru
data_files:
- split: train
path: ru/train-*
- config_name: sd
data_files:
- split: train
path: sd/train-*
- config_name: sk
data_files:
- split: train
path: sk/train-*
- config_name: sl
data_files:
- split: train
path: sl/train-*
- config_name: sq
data_files:
- split: train
path: sq/train-*
- config_name: sr
data_files:
- split: train
path: sr/train-*
- config_name: sv-SE
data_files:
- split: train
path: sv-SE/train-*
- config_name: sw
data_files:
- split: train
path: sw/train-*
- config_name: ta
data_files:
- split: train
path: ta/train-*
- config_name: te
data_files:
- split: train
path: te/train-*
- config_name: tg
data_files:
- split: train
path: tg/train-*
- config_name: th
data_files:
- split: train
path: th/train-*
- config_name: tk
data_files:
- split: train
path: tk/train-*
- config_name: tr
data_files:
- split: train
path: tr/train-*
- config_name: tt
data_files:
- split: train
path: tt/train-*
- config_name: uk
data_files:
- split: train
path: uk/train-*
- config_name: ur
data_files:
- split: train
path: ur/train-*
- config_name: uz
data_files:
- split: train
path: uz/train-*
- config_name: vi
data_files:
- split: train
path: vi/train-*
- config_name: yi
data_files:
- split: train
path: yi/train-*
- config_name: yo
data_files:
- split: train
path: yo/train-*
- config_name: zh-CN
data_files:
- split: train
path: zh-CN/train-*
- config_name: zh-HK
data_files:
- split: train
path: zh-HK/train-*
- config_name: zh-TW
data_files:
- split: train
path: zh-TW/train-*
---
# Evaluation-Multilingual-VC
This evaluation set is built from the dataset https://huggingface.co/datasets/sarulab-speech/commonvoice22_sidon as follows:
1. Keep only the languages that are supported by Whisper Large V3, so that WER can be evaluated automatically.
2. Take only the test set, sorted by upvotes.
3. Because voice conversion (VC) requires source text, source audio, and target text, we make sure the target text is not the same as the source text; the target text is taken from other rows.
4. Keep at most the first 500 rows for each language (some languages have fewer rows available).
See the related GitHub issue at https://github.com/Scicom-AI-Enterprise-Organization/Multilingual-TTS/issues/4
提供机构:
Scicom-intl



