asahi417/seamless-align-enA-zhA.speaker-embedding.metavoice
收藏Hugging Face2024-06-10 更新2024-06-12 收录
下载链接:
https://hf-mirror.com/datasets/asahi417/seamless-align-enA-zhA.speaker-embedding.metavoice
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: subset_1
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4178187
num_examples: 1962
download_size: 4697629
dataset_size: 4178187
- config_name: subset_10
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4325241
num_examples: 2031
download_size: 4800589
dataset_size: 4325241
- config_name: subset_100
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4027109
num_examples: 1891
download_size: 4560652
dataset_size: 4027109
- config_name: subset_101
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4014383
num_examples: 1885
download_size: 4536325
dataset_size: 4014383
- config_name: subset_102
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3967490
num_examples: 1863
download_size: 4469938
dataset_size: 3967490
- config_name: subset_103
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3963253
num_examples: 1861
download_size: 4478877
dataset_size: 3963253
- config_name: subset_104
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3993050
num_examples: 1875
download_size: 4511226
dataset_size: 3993050
- config_name: subset_105
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3984522
num_examples: 1871
download_size: 4511926
dataset_size: 3984522
- config_name: subset_106
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3971782
num_examples: 1865
download_size: 4471550
dataset_size: 3971782
- config_name: subset_107
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3914294
num_examples: 1838
download_size: 4423934
dataset_size: 3914294
- config_name: subset_108
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3961153
num_examples: 1860
download_size: 4492033
dataset_size: 3961153
- config_name: subset_109
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3973882
num_examples: 1866
download_size: 4493942
dataset_size: 3973882
- config_name: subset_11
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4246495
num_examples: 1994
download_size: 4741778
dataset_size: 4246495
- config_name: subset_110
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3924898
num_examples: 1843
download_size: 4441323
dataset_size: 3924898
- config_name: subset_111
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3929176
num_examples: 1845
download_size: 4448621
dataset_size: 3929176
- config_name: subset_112
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3927021
num_examples: 1844
download_size: 4426963
dataset_size: 3927021
- config_name: subset_113
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3916382
num_examples: 1839
download_size: 4398593
dataset_size: 3916382
- config_name: subset_114
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941981
num_examples: 1851
download_size: 4461303
dataset_size: 3941981
- config_name: subset_115
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3878073
num_examples: 1821
download_size: 4404239
dataset_size: 3878073
- config_name: subset_116
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3912139
num_examples: 1837
download_size: 4430164
dataset_size: 3912139
- config_name: subset_117
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3948349
num_examples: 1854
download_size: 4469661
dataset_size: 3948349
- config_name: subset_118
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3863163
num_examples: 1814
download_size: 4364133
dataset_size: 3863163
- config_name: subset_119
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3882316
num_examples: 1823
download_size: 4379942
dataset_size: 3882316
- config_name: subset_12
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4331586
num_examples: 2034
download_size: 4836292
dataset_size: 4331586
- config_name: subset_120
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3907865
num_examples: 1835
download_size: 4409783
dataset_size: 3907865
- config_name: subset_121
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3901433
num_examples: 1832
download_size: 4418517
dataset_size: 3901433
- config_name: subset_122
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3884420
num_examples: 1824
download_size: 4394720
dataset_size: 3884420
- config_name: subset_123
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3833362
num_examples: 1800
download_size: 4350568
dataset_size: 3833362
- config_name: subset_124
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3897236
num_examples: 1830
download_size: 4419742
dataset_size: 3897236
- config_name: subset_125
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3956878
num_examples: 1858
download_size: 4481236
dataset_size: 3956878
- config_name: subset_126
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4020747
num_examples: 1888
download_size: 4545634
dataset_size: 4020747
- config_name: subset_127
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3903622
num_examples: 1833
download_size: 4413827
dataset_size: 3903622
- config_name: subset_128
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3907878
num_examples: 1835
download_size: 4443312
dataset_size: 3907878
- config_name: subset_129
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4014361
num_examples: 1885
download_size: 4548907
dataset_size: 4014361
- config_name: subset_13
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4304007
num_examples: 2021
download_size: 4793364
dataset_size: 4304007
- config_name: subset_130
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3892980
num_examples: 1828
download_size: 4414004
dataset_size: 3892980
- config_name: subset_131
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3861034
num_examples: 1813
download_size: 4364749
dataset_size: 3861034
- config_name: subset_132
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3969623
num_examples: 1864
download_size: 4490749
dataset_size: 3969623
- config_name: subset_133
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3927002
num_examples: 1844
download_size: 4454561
dataset_size: 3927002
- config_name: subset_134
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3888723
num_examples: 1826
download_size: 4387273
dataset_size: 3888723
- config_name: subset_135
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946193
num_examples: 1853
download_size: 4466376
dataset_size: 3946193
- config_name: subset_136
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4005802
num_examples: 1881
download_size: 4516739
dataset_size: 4005802
- config_name: subset_137
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3912113
num_examples: 1837
download_size: 4409777
dataset_size: 3912113
- config_name: subset_138
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3980331
num_examples: 1869
download_size: 4518150
dataset_size: 3980331
- config_name: subset_139
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3897214
num_examples: 1830
download_size: 4424350
dataset_size: 3897214
- config_name: subset_14
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4284823
num_examples: 2012
download_size: 4780394
dataset_size: 4284823
- config_name: subset_140
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3865298
num_examples: 1815
download_size: 4383355
dataset_size: 3865298
- config_name: subset_141
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3863138
num_examples: 1814
download_size: 4378991
dataset_size: 3863138
- config_name: subset_142
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941932
num_examples: 1851
download_size: 4462305
dataset_size: 3941932
- config_name: subset_143
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3816274
num_examples: 1792
download_size: 4315940
dataset_size: 3816274
- config_name: subset_144
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3952625
num_examples: 1856
download_size: 4487018
dataset_size: 3952625
- config_name: subset_145
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3939816
num_examples: 1850
download_size: 4456912
dataset_size: 3939816
- config_name: subset_146
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3933396
num_examples: 1847
download_size: 4469369
dataset_size: 3933396
- config_name: subset_147
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941987
num_examples: 1851
download_size: 4469830
dataset_size: 3941987
- config_name: subset_148
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3935566
num_examples: 1848
download_size: 4451955
dataset_size: 3935566
- config_name: subset_149
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3980338
num_examples: 1869
download_size: 4494478
dataset_size: 3980338
- config_name: subset_15
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4280609
num_examples: 2010
download_size: 4767151
dataset_size: 4280609
- config_name: subset_150
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3973881
num_examples: 1866
download_size: 4514133
dataset_size: 3973881
- config_name: subset_151
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965399
num_examples: 1862
download_size: 4490172
dataset_size: 3965399
- config_name: subset_152
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3886579
num_examples: 1825
download_size: 4394685
dataset_size: 3886579
- config_name: subset_153
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3958963
num_examples: 1859
download_size: 4477250
dataset_size: 3958963
- config_name: subset_154
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965398
num_examples: 1862
download_size: 4488087
dataset_size: 3965398
- config_name: subset_155
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3890831
num_examples: 1827
download_size: 4406592
dataset_size: 3890831
- config_name: subset_156
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3905718
num_examples: 1834
download_size: 4433415
dataset_size: 3905718
- config_name: subset_157
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3963239
num_examples: 1861
download_size: 4485797
dataset_size: 3963239
- config_name: subset_158
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3797118
num_examples: 1783
download_size: 4323023
dataset_size: 3797118
- config_name: subset_159
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3522395
num_examples: 1654
download_size: 3983351
dataset_size: 3522395
- config_name: subset_16
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4203842
num_examples: 1974
download_size: 4674710
dataset_size: 4203842
- config_name: subset_160
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920591
num_examples: 1841
download_size: 4459541
dataset_size: 3920591
- config_name: subset_161
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3914235
num_examples: 1838
download_size: 4438402
dataset_size: 3914235
- config_name: subset_162
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3933447
num_examples: 1847
download_size: 4461740
dataset_size: 3933447
- config_name: subset_163
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3967452
num_examples: 1863
download_size: 4480965
dataset_size: 3967452
- config_name: subset_164
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3918535
num_examples: 1840
download_size: 4446956
dataset_size: 3918535
- config_name: subset_165
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3882282
num_examples: 1823
download_size: 4407215
dataset_size: 3882282
- config_name: subset_166
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3971782
num_examples: 1865
download_size: 4502080
dataset_size: 3971782
- config_name: subset_167
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946191
num_examples: 1853
download_size: 4473493
dataset_size: 3946191
- config_name: subset_168
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3984525
num_examples: 1871
download_size: 4516780
dataset_size: 3984525
- config_name: subset_169
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3929181
num_examples: 1845
download_size: 4464766
dataset_size: 3929181
- config_name: subset_17
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4269920
num_examples: 2005
download_size: 4729110
dataset_size: 4269920
- config_name: subset_170
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3997287
num_examples: 1877
download_size: 4536240
dataset_size: 3997287
- config_name: subset_171
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3967458
num_examples: 1863
download_size: 4499111
dataset_size: 3967458
- config_name: subset_172
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920644
num_examples: 1841
download_size: 4447845
dataset_size: 3920644
- config_name: subset_173
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3931252
num_examples: 1846
download_size: 4461468
dataset_size: 3931252
- config_name: subset_174
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3903611
num_examples: 1833
download_size: 4439543
dataset_size: 3903611
- config_name: subset_175
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3897177
num_examples: 1830
download_size: 4425662
dataset_size: 3897177
- config_name: subset_176
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3852513
num_examples: 1809
download_size: 4370480
dataset_size: 3852513
- config_name: subset_177
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920662
num_examples: 1841
download_size: 4453192
dataset_size: 3920662
- config_name: subset_178
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3995181
num_examples: 1876
download_size: 4530153
dataset_size: 3995181
- config_name: subset_179
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3967492
num_examples: 1863
download_size: 4513985
dataset_size: 3967492
- config_name: subset_18
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4116568
num_examples: 1933
download_size: 4594572
dataset_size: 4116568
- config_name: subset_180
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4042040
num_examples: 1898
download_size: 4583599
dataset_size: 4042040
- config_name: subset_181
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3954739
num_examples: 1857
download_size: 4492894
dataset_size: 3954739
- config_name: subset_182
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3954729
num_examples: 1857
download_size: 4501872
dataset_size: 3954729
- config_name: subset_183
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3907866
num_examples: 1835
download_size: 4442919
dataset_size: 3907866
- config_name: subset_184
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3878054
num_examples: 1821
download_size: 4407701
dataset_size: 3878054
- config_name: subset_185
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3878057
num_examples: 1821
download_size: 4393433
dataset_size: 3878057
- config_name: subset_186
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3933446
num_examples: 1847
download_size: 4470446
dataset_size: 3933446
- config_name: subset_187
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3892985
num_examples: 1828
download_size: 4426915
dataset_size: 3892985
- config_name: subset_188
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3912085
num_examples: 1837
download_size: 4437644
dataset_size: 3912085
- config_name: subset_189
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3993013
num_examples: 1875
download_size: 4538458
dataset_size: 3993013
- config_name: subset_19
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4222992
num_examples: 1983
download_size: 4693656
dataset_size: 4222992
- config_name: subset_190
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3952597
num_examples: 1856
download_size: 4486320
dataset_size: 3952597
- config_name: subset_191
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3916360
num_examples: 1839
download_size: 4472494
dataset_size: 3916360
- config_name: subset_192
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941948
num_examples: 1851
download_size: 4488515
dataset_size: 3941948
- config_name: subset_193
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3944106
num_examples: 1852
download_size: 4491042
dataset_size: 3944106
- config_name: subset_194
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3892926
num_examples: 1828
download_size: 4427493
dataset_size: 3892926
- config_name: subset_195
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3924924
num_examples: 1843
download_size: 4449654
dataset_size: 3924924
- config_name: subset_196
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3973905
num_examples: 1866
download_size: 4523453
dataset_size: 3973905
- config_name: subset_197
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4010113
num_examples: 1883
download_size: 4540997
dataset_size: 4010113
- config_name: subset_198
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3954738
num_examples: 1857
download_size: 4485967
dataset_size: 3954738
- config_name: subset_199
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3937694
num_examples: 1849
download_size: 4462153
dataset_size: 3937694
- config_name: subset_2
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4369800
num_examples: 2052
download_size: 4867963
dataset_size: 4369800
- config_name: subset_20
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4171928
num_examples: 1959
download_size: 4646912
dataset_size: 4171928
- config_name: subset_200
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3973865
num_examples: 1866
download_size: 4513266
dataset_size: 3973865
- config_name: subset_201
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3822671
num_examples: 1795
download_size: 4342855
dataset_size: 3822671
- config_name: subset_202
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4014358
num_examples: 1885
download_size: 4566589
dataset_size: 4014358
- config_name: subset_203
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3973933
num_examples: 1866
download_size: 4501959
dataset_size: 3973933
- config_name: subset_204
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3927077
num_examples: 1844
download_size: 4463041
dataset_size: 3927077
- config_name: subset_205
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946178
num_examples: 1853
download_size: 4487476
dataset_size: 3946178
- config_name: subset_206
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3914235
num_examples: 1838
download_size: 4455684
dataset_size: 3914235
- config_name: subset_207
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946172
num_examples: 1853
download_size: 4449611
dataset_size: 3946172
- config_name: subset_208
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3871705
num_examples: 1818
download_size: 4402969
dataset_size: 3871705
- config_name: subset_209
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3841814
num_examples: 1804
download_size: 4369195
dataset_size: 3841814
- config_name: subset_21
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4118712
num_examples: 1934
download_size: 4588878
dataset_size: 4118712
- config_name: subset_210
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3950491
num_examples: 1855
download_size: 4509194
dataset_size: 3950491
- config_name: subset_211
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3948332
num_examples: 1854
download_size: 4480066
dataset_size: 3948332
- config_name: subset_212
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3882293
num_examples: 1823
download_size: 4428676
dataset_size: 3882293
- config_name: subset_213
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3880184
num_examples: 1822
download_size: 4422675
dataset_size: 3880184
- config_name: subset_214
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946189
num_examples: 1853
download_size: 4476066
dataset_size: 3946189
- config_name: subset_215
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3958985
num_examples: 1859
download_size: 4486652
dataset_size: 3958985
- config_name: subset_216
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3922788
num_examples: 1842
download_size: 4462326
dataset_size: 3922788
- config_name: subset_217
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3931284
num_examples: 1846
download_size: 4463257
dataset_size: 3931284
- config_name: subset_218
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3924922
num_examples: 1843
download_size: 4461436
dataset_size: 3924922
- config_name: subset_219
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3912140
num_examples: 1837
download_size: 4452782
dataset_size: 3912140
- config_name: subset_22
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4086781
num_examples: 1919
download_size: 4555671
dataset_size: 4086781
- config_name: subset_220
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3907844
num_examples: 1835
download_size: 4456633
dataset_size: 3907844
- config_name: subset_221
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3875914
num_examples: 1820
download_size: 4406770
dataset_size: 3875914
- config_name: subset_222
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3897262
num_examples: 1830
download_size: 4419169
dataset_size: 3897262
- config_name: subset_223
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3865339
num_examples: 1815
download_size: 4394728
dataset_size: 3865339
- config_name: subset_224
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3963248
num_examples: 1861
download_size: 4513186
dataset_size: 3963248
- config_name: subset_225
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3922794
num_examples: 1842
download_size: 4462363
dataset_size: 3922794
- config_name: subset_226
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3997319
num_examples: 1877
download_size: 4539293
dataset_size: 3997319
- config_name: subset_227
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3886555
num_examples: 1825
download_size: 4440053
dataset_size: 3886555
- config_name: subset_228
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3905734
num_examples: 1834
download_size: 4431978
dataset_size: 3905734
- config_name: subset_229
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3822648
num_examples: 1795
download_size: 4364932
dataset_size: 3822648
- config_name: subset_23
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4163439
num_examples: 1955
download_size: 4639321
dataset_size: 4163439
- config_name: subset_230
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3969602
num_examples: 1864
download_size: 4512705
dataset_size: 3969602
- config_name: subset_231
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3980251
num_examples: 1869
download_size: 4535199
dataset_size: 3980251
- config_name: subset_232
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3922741
num_examples: 1842
download_size: 4451425
dataset_size: 3922741
- config_name: subset_233
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3954694
num_examples: 1857
download_size: 4480780
dataset_size: 3954694
- config_name: subset_234
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4003704
num_examples: 1880
download_size: 4563279
dataset_size: 4003704
- config_name: subset_235
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3950465
num_examples: 1855
download_size: 4486880
dataset_size: 3950465
- config_name: subset_236
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941944
num_examples: 1851
download_size: 4485154
dataset_size: 3941944
- config_name: subset_237
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3910028
num_examples: 1836
download_size: 4465013
dataset_size: 3910028
- config_name: subset_238
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3967506
num_examples: 1863
download_size: 4511180
dataset_size: 3967506
- config_name: subset_239
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3961104
num_examples: 1860
download_size: 4509657
dataset_size: 3961104
- config_name: subset_24
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4071850
num_examples: 1912
download_size: 4527047
dataset_size: 4071850
- config_name: subset_240
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3852458
num_examples: 1809
download_size: 4377612
dataset_size: 3852458
- config_name: subset_241
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3997314
num_examples: 1877
download_size: 4546043
dataset_size: 3997314
- config_name: subset_242
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3912051
num_examples: 1837
download_size: 4442026
dataset_size: 3912051
- config_name: subset_243
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920664
num_examples: 1841
download_size: 4461208
dataset_size: 3920664
- config_name: subset_244
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3858888
num_examples: 1812
download_size: 4390074
dataset_size: 3858888
- config_name: subset_245
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3895060
num_examples: 1829
download_size: 4445332
dataset_size: 3895060
- config_name: subset_246
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3914234
num_examples: 1838
download_size: 4461816
dataset_size: 3914234
- config_name: subset_247
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965383
num_examples: 1862
download_size: 4507572
dataset_size: 3965383
- config_name: subset_248
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3858859
num_examples: 1812
download_size: 4387000
dataset_size: 3858859
- config_name: subset_249
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920661
num_examples: 1841
download_size: 4469529
dataset_size: 3920661
- config_name: subset_25
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4099555
num_examples: 1925
download_size: 4581046
dataset_size: 4099555
- config_name: subset_250
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3952593
num_examples: 1856
download_size: 4482753
dataset_size: 3952593
- config_name: subset_251
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3929181
num_examples: 1845
download_size: 4481442
dataset_size: 3929181
- config_name: subset_252
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3916392
num_examples: 1839
download_size: 4457059
dataset_size: 3916392
- config_name: subset_253
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3956838
num_examples: 1858
download_size: 4505032
dataset_size: 3956838
- config_name: subset_254
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3880219
num_examples: 1822
download_size: 4417613
dataset_size: 3880219
- config_name: subset_255
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3854586
num_examples: 1810
download_size: 4395848
dataset_size: 3854586
- config_name: subset_256
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3841832
num_examples: 1804
download_size: 4369513
dataset_size: 3841832
- config_name: subset_257
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3929167
num_examples: 1845
download_size: 4492989
dataset_size: 3929167
- config_name: subset_258
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3262592
num_examples: 1532
download_size: 3701989
dataset_size: 3262592
- config_name: subset_26
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3901481
num_examples: 1832
download_size: 4311857
dataset_size: 3901481
- config_name: subset_27
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965320
num_examples: 1862
download_size: 4430759
dataset_size: 3965320
- config_name: subset_28
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3895084
num_examples: 1829
download_size: 4340415
dataset_size: 3895084
- config_name: subset_29
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3892975
num_examples: 1828
download_size: 4318680
dataset_size: 3892975
- config_name: subset_3
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4431628
num_examples: 2081
download_size: 4966869
dataset_size: 4431628
- config_name: subset_30
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3835498
num_examples: 1801
download_size: 4281873
dataset_size: 3835498
- config_name: subset_31
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4054798
num_examples: 1904
download_size: 4496214
dataset_size: 4054798
- config_name: subset_32
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4054822
num_examples: 1904
download_size: 4513790
dataset_size: 4054822
- config_name: subset_33
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3990934
num_examples: 1874
download_size: 4437287
dataset_size: 3990934
- config_name: subset_34
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4114420
num_examples: 1932
download_size: 4579959
dataset_size: 4114420
- config_name: subset_35
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4050566
num_examples: 1902
download_size: 4520439
dataset_size: 4050566
- config_name: subset_36
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3997269
num_examples: 1877
download_size: 4447861
dataset_size: 3997269
- config_name: subset_37
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965427
num_examples: 1862
download_size: 4432883
dataset_size: 3965427
- config_name: subset_38
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3999457
num_examples: 1878
download_size: 4476936
dataset_size: 3999457
- config_name: subset_39
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4001533
num_examples: 1879
download_size: 4470186
dataset_size: 4001533
- config_name: subset_4
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4476450
num_examples: 2102
download_size: 5030150
dataset_size: 4476450
- config_name: subset_40
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4086790
num_examples: 1919
download_size: 4571581
dataset_size: 4086790
- config_name: subset_41
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3892923
num_examples: 1828
download_size: 4354924
dataset_size: 3892923
- config_name: subset_42
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4012239
num_examples: 1884
download_size: 4484321
dataset_size: 4012239
- config_name: subset_43
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3990913
num_examples: 1874
download_size: 4471867
dataset_size: 3990913
- config_name: subset_44
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4033497
num_examples: 1894
download_size: 4511726
dataset_size: 4033497
- config_name: subset_45
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3980255
num_examples: 1869
download_size: 4452648
dataset_size: 3980255
- config_name: subset_46
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4044187
num_examples: 1899
download_size: 4538178
dataset_size: 4044187
- config_name: subset_47
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4073995
num_examples: 1913
download_size: 4570180
dataset_size: 4073995
- config_name: subset_48
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4093119
num_examples: 1922
download_size: 4583803
dataset_size: 4093119
- config_name: subset_49
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4039908
num_examples: 1897
download_size: 4514178
dataset_size: 4039908
- config_name: subset_5
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4355079
num_examples: 2045
download_size: 4884571
dataset_size: 4355079
- config_name: subset_50
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4012219
num_examples: 1884
download_size: 4502782
dataset_size: 4012219
- config_name: subset_51
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4084659
num_examples: 1918
download_size: 4558399
dataset_size: 4084659
- config_name: subset_52
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4003682
num_examples: 1880
download_size: 4487520
dataset_size: 4003682
- config_name: subset_53
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4039906
num_examples: 1897
download_size: 4541726
dataset_size: 4039906
- config_name: subset_54
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4048421
num_examples: 1901
download_size: 4544679
dataset_size: 4048421
- config_name: subset_55
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4025029
num_examples: 1890
download_size: 4522404
dataset_size: 4025029
- config_name: subset_56
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941960
num_examples: 1851
download_size: 4410785
dataset_size: 3941960
- config_name: subset_57
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4054851
num_examples: 1904
download_size: 4548575
dataset_size: 4054851
- config_name: subset_58
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3939833
num_examples: 1850
download_size: 4406872
dataset_size: 3939833
- config_name: subset_59
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3993068
num_examples: 1875
download_size: 4488270
dataset_size: 3993068
- config_name: subset_6
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4450910
num_examples: 2090
download_size: 4965530
dataset_size: 4450910
- config_name: subset_60
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4005848
num_examples: 1881
download_size: 4485984
dataset_size: 4005848
- config_name: subset_61
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3937712
num_examples: 1849
download_size: 4414337
dataset_size: 3937712
- config_name: subset_62
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4035647
num_examples: 1895
download_size: 4545020
dataset_size: 4035647
- config_name: subset_63
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3990889
num_examples: 1874
download_size: 4486649
dataset_size: 3990889
- config_name: subset_64
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4007953
num_examples: 1882
download_size: 4502204
dataset_size: 4007953
- config_name: subset_65
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3984553
num_examples: 1871
download_size: 4481377
dataset_size: 3984553
- config_name: subset_66
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3939779
num_examples: 1850
download_size: 4424157
dataset_size: 3939779
- config_name: subset_67
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4037797
num_examples: 1896
download_size: 4543192
dataset_size: 4037797
- config_name: subset_68
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3939779
num_examples: 1850
download_size: 4434890
dataset_size: 3939779
- config_name: subset_69
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3948315
num_examples: 1854
download_size: 4441361
dataset_size: 3948315
- config_name: subset_7
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4506317
num_examples: 2116
download_size: 5030760
dataset_size: 4506317
- config_name: subset_70
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3941940
num_examples: 1851
download_size: 4430099
dataset_size: 3941940
- config_name: subset_71
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3995210
num_examples: 1876
download_size: 4501659
dataset_size: 3995210
- config_name: subset_72
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3920652
num_examples: 1841
download_size: 4414862
dataset_size: 3920652
- config_name: subset_73
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4007956
num_examples: 1882
download_size: 4502400
dataset_size: 4007956
- config_name: subset_74
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3971734
num_examples: 1865
download_size: 4476370
dataset_size: 3971734
- config_name: subset_75
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3935530
num_examples: 1848
download_size: 4432666
dataset_size: 3935530
- config_name: subset_76
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4033502
num_examples: 1894
download_size: 4541035
dataset_size: 4033502
- config_name: subset_77
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3993045
num_examples: 1875
download_size: 4489295
dataset_size: 3993045
- config_name: subset_78
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4116558
num_examples: 1933
download_size: 4614583
dataset_size: 4116558
- config_name: subset_79
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4046356
num_examples: 1900
download_size: 4547353
dataset_size: 4046356
- config_name: subset_8
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4461547
num_examples: 2095
download_size: 4986927
dataset_size: 4461547
- config_name: subset_80
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3878043
num_examples: 1821
download_size: 4383077
dataset_size: 3878043
- config_name: subset_81
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3988808
num_examples: 1873
download_size: 4484453
dataset_size: 3988808
- config_name: subset_82
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3965357
num_examples: 1862
download_size: 4484442
dataset_size: 3965357
- config_name: subset_83
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3982476
num_examples: 1870
download_size: 4481647
dataset_size: 3982476
- config_name: subset_84
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3922804
num_examples: 1842
download_size: 4440677
dataset_size: 3922804
- config_name: subset_85
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3982432
num_examples: 1870
download_size: 4472981
dataset_size: 3982432
- config_name: subset_86
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3914237
num_examples: 1838
download_size: 4398357
dataset_size: 3914237
- config_name: subset_87
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3944076
num_examples: 1852
download_size: 4433099
dataset_size: 3944076
- config_name: subset_88
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3976044
num_examples: 1867
download_size: 4476987
dataset_size: 3976044
- config_name: subset_89
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4052693
num_examples: 1903
download_size: 4572829
dataset_size: 4052693
- config_name: subset_9
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4414720
num_examples: 2073
download_size: 4927600
dataset_size: 4414720
- config_name: subset_90
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3888677
num_examples: 1826
download_size: 4407736
dataset_size: 3888677
- config_name: subset_91
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3944085
num_examples: 1852
download_size: 4456701
dataset_size: 3944085
- config_name: subset_92
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3944038
num_examples: 1852
download_size: 4450011
dataset_size: 3944038
- config_name: subset_93
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3897292
num_examples: 1830
download_size: 4402330
dataset_size: 3897292
- config_name: subset_94
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3935585
num_examples: 1848
download_size: 4445449
dataset_size: 3935585
- config_name: subset_95
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3954723
num_examples: 1857
download_size: 4470714
dataset_size: 3954723
- config_name: subset_96
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4014372
num_examples: 1885
download_size: 4523979
dataset_size: 4014372
- config_name: subset_97
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3980263
num_examples: 1869
download_size: 4478908
dataset_size: 3980263
- config_name: subset_98
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: zhA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3961128
num_examples: 1860
download_size: 4450075
dataset_size: 3961128
- config_name: subset_99
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: zhA.id
dtype: string
- name: zhA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: zhA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 4078229
num_examples: 1915
download_size: 4618170
dataset_size: 4078229
configs:
- config_name: subset_1
data_files:
- split: train
path: subset_1/train-*
- config_name: subset_10
data_files:
- split: train
path: subset_10/train-*
- config_name: subset_100
data_files:
- split: train
path: subset_100/train-*
- config_name: subset_101
data_files:
- split: train
path: subset_101/train-*
- config_name: subset_102
data_files:
- split: train
path: subset_102/train-*
- config_name: subset_103
data_files:
- split: train
path: subset_103/train-*
- config_name: subset_104
data_files:
- split: train
path: subset_104/train-*
- config_name: subset_105
data_files:
- split: train
path: subset_105/train-*
- config_name: subset_106
data_files:
- split: train
path: subset_106/train-*
- config_name: subset_107
data_files:
- split: train
path: subset_107/train-*
- config_name: subset_108
data_files:
- split: train
path: subset_108/train-*
- config_name: subset_109
data_files:
- split: train
path: subset_109/train-*
- config_name: subset_11
data_files:
- split: train
path: subset_11/train-*
- config_name: subset_110
data_files:
- split: train
path: subset_110/train-*
- config_name: subset_111
data_files:
- split: train
path: subset_111/train-*
- config_name: subset_112
data_files:
- split: train
path: subset_112/train-*
- config_name: subset_113
data_files:
- split: train
path: subset_113/train-*
- config_name: subset_114
data_files:
- split: train
path: subset_114/train-*
- config_name: subset_115
data_files:
- split: train
path: subset_115/train-*
- config_name: subset_116
data_files:
- split: train
path: subset_116/train-*
- config_name: subset_117
data_files:
- split: train
path: subset_117/train-*
- config_name: subset_118
data_files:
- split: train
path: subset_118/train-*
- config_name: subset_119
data_files:
- split: train
path: subset_119/train-*
- config_name: subset_12
data_files:
- split: train
path: subset_12/train-*
- config_name: subset_120
data_files:
- split: train
path: subset_120/train-*
- config_name: subset_121
data_files:
- split: train
path: subset_121/train-*
- config_name: subset_122
data_files:
- split: train
path: subset_122/train-*
- config_name: subset_123
data_files:
- split: train
path: subset_123/train-*
- config_name: subset_124
data_files:
- split: train
path: subset_124/train-*
- config_name: subset_125
data_files:
- split: train
path: subset_125/train-*
- config_name: subset_126
data_files:
- split: train
path: subset_126/train-*
- config_name: subset_127
data_files:
- split: train
path: subset_127/train-*
- config_name: subset_128
data_files:
- split: train
path: subset_128/train-*
- config_name: subset_129
data_files:
- split: train
path: subset_129/train-*
- config_name: subset_13
data_files:
- split: train
path: subset_13/train-*
- config_name: subset_130
data_files:
- split: train
path: subset_130/train-*
- config_name: subset_131
data_files:
- split: train
path: subset_131/train-*
- config_name: subset_132
data_files:
- split: train
path: subset_132/train-*
- config_name: subset_133
data_files:
- split: train
path: subset_133/train-*
- config_name: subset_134
data_files:
- split: train
path: subset_134/train-*
- config_name: subset_135
data_files:
- split: train
path: subset_135/train-*
- config_name: subset_136
data_files:
- split: train
path: subset_136/train-*
- config_name: subset_137
data_files:
- split: train
path: subset_137/train-*
- config_name: subset_138
data_files:
- split: train
path: subset_138/train-*
- config_name: subset_139
data_files:
- split: train
path: subset_139/train-*
- config_name: subset_14
data_files:
- split: train
path: subset_14/train-*
- config_name: subset_140
data_files:
- split: train
path: subset_140/train-*
- config_name: subset_141
data_files:
- split: train
path: subset_141/train-*
- config_name: subset_142
data_files:
- split: train
path: subset_142/train-*
- config_name: subset_143
data_files:
- split: train
path: subset_143/train-*
- config_name: subset_144
data_files:
- split: train
path: subset_144/train-*
- config_name: subset_145
data_files:
- split: train
path: subset_145/train-*
- config_name: subset_146
data_files:
- split: train
path: subset_146/train-*
- config_name: subset_147
data_files:
- split: train
path: subset_147/train-*
- config_name: subset_148
data_files:
- split: train
path: subset_148/train-*
- config_name: subset_149
data_files:
- split: train
path: subset_149/train-*
- config_name: subset_15
data_files:
- split: train
path: subset_15/train-*
- config_name: subset_150
data_files:
- split: train
path: subset_150/train-*
- config_name: subset_151
data_files:
- split: train
path: subset_151/train-*
- config_name: subset_152
data_files:
- split: train
path: subset_152/train-*
- config_name: subset_153
data_files:
- split: train
path: subset_153/train-*
- config_name: subset_154
data_files:
- split: train
path: subset_154/train-*
- config_name: subset_155
data_files:
- split: train
path: subset_155/train-*
- config_name: subset_156
data_files:
- split: train
path: subset_156/train-*
- config_name: subset_157
data_files:
- split: train
path: subset_157/train-*
- config_name: subset_158
data_files:
- split: train
path: subset_158/train-*
- config_name: subset_159
data_files:
- split: train
path: subset_159/train-*
- config_name: subset_16
data_files:
- split: train
path: subset_16/train-*
- config_name: subset_160
data_files:
- split: train
path: subset_160/train-*
- config_name: subset_161
data_files:
- split: train
path: subset_161/train-*
- config_name: subset_162
data_files:
- split: train
path: subset_162/train-*
- config_name: subset_163
data_files:
- split: train
path: subset_163/train-*
- config_name: subset_164
data_files:
- split: train
path: subset_164/train-*
- config_name: subset_165
data_files:
- split: train
path: subset_165/train-*
- config_name: subset_166
data_files:
- split: train
path: subset_166/train-*
- config_name: subset_167
data_files:
- split: train
path: subset_167/train-*
- config_name: subset_168
data_files:
- split: train
path: subset_168/train-*
- config_name: subset_169
data_files:
- split: train
path: subset_169/train-*
- config_name: subset_17
data_files:
- split: train
path: subset_17/train-*
- config_name: subset_170
data_files:
- split: train
path: subset_170/train-*
- config_name: subset_171
data_files:
- split: train
path: subset_171/train-*
- config_name: subset_172
data_files:
- split: train
path: subset_172/train-*
- config_name: subset_173
data_files:
- split: train
path: subset_173/train-*
- config_name: subset_174
data_files:
- split: train
path: subset_174/train-*
- config_name: subset_175
data_files:
- split: train
path: subset_175/train-*
- config_name: subset_176
data_files:
- split: train
path: subset_176/train-*
- config_name: subset_177
data_files:
- split: train
path: subset_177/train-*
- config_name: subset_178
data_files:
- split: train
path: subset_178/train-*
- config_name: subset_179
data_files:
- split: train
path: subset_179/train-*
- config_name: subset_18
data_files:
- split: train
path: subset_18/train-*
- config_name: subset_180
data_files:
- split: train
path: subset_180/train-*
- config_name: subset_181
data_files:
- split: train
path: subset_181/train-*
- config_name: subset_182
data_files:
- split: train
path: subset_182/train-*
- config_name: subset_183
data_files:
- split: train
path: subset_183/train-*
- config_name: subset_184
data_files:
- split: train
path: subset_184/train-*
- config_name: subset_185
data_files:
- split: train
path: subset_185/train-*
- config_name: subset_186
data_files:
- split: train
path: subset_186/train-*
- config_name: subset_187
data_files:
- split: train
path: subset_187/train-*
- config_name: subset_188
data_files:
- split: train
path: subset_188/train-*
- config_name: subset_189
data_files:
- split: train
path: subset_189/train-*
- config_name: subset_19
data_files:
- split: train
path: subset_19/train-*
- config_name: subset_190
data_files:
- split: train
path: subset_190/train-*
- config_name: subset_191
data_files:
- split: train
path: subset_191/train-*
- config_name: subset_192
data_files:
- split: train
path: subset_192/train-*
- config_name: subset_193
data_files:
- split: train
path: subset_193/train-*
- config_name: subset_194
data_files:
- split: train
path: subset_194/train-*
- config_name: subset_195
data_files:
- split: train
path: subset_195/train-*
- config_name: subset_196
data_files:
- split: train
path: subset_196/train-*
- config_name: subset_197
data_files:
- split: train
path: subset_197/train-*
- config_name: subset_198
data_files:
- split: train
path: subset_198/train-*
- config_name: subset_199
data_files:
- split: train
path: subset_199/train-*
- config_name: subset_2
data_files:
- split: train
path: subset_2/train-*
- config_name: subset_20
data_files:
- split: train
path: subset_20/train-*
- config_name: subset_200
data_files:
- split: train
path: subset_200/train-*
- config_name: subset_201
data_files:
- split: train
path: subset_201/train-*
- config_name: subset_202
data_files:
- split: train
path: subset_202/train-*
- config_name: subset_203
data_files:
- split: train
path: subset_203/train-*
- config_name: subset_204
data_files:
- split: train
path: subset_204/train-*
- config_name: subset_205
data_files:
- split: train
path: subset_205/train-*
- config_name: subset_206
data_files:
- split: train
path: subset_206/train-*
- config_name: subset_207
data_files:
- split: train
path: subset_207/train-*
- config_name: subset_208
data_files:
- split: train
path: subset_208/train-*
- config_name: subset_209
data_files:
- split: train
path: subset_209/train-*
- config_name: subset_21
data_files:
- split: train
path: subset_21/train-*
- config_name: subset_210
data_files:
- split: train
path: subset_210/train-*
- config_name: subset_211
data_files:
- split: train
path: subset_211/train-*
- config_name: subset_212
data_files:
- split: train
path: subset_212/train-*
- config_name: subset_213
data_files:
- split: train
path: subset_213/train-*
- config_name: subset_214
data_files:
- split: train
path: subset_214/train-*
- config_name: subset_215
data_files:
- split: train
path: subset_215/train-*
- config_name: subset_216
data_files:
- split: train
path: subset_216/train-*
- config_name: subset_217
data_files:
- split: train
path: subset_217/train-*
- config_name: subset_218
data_files:
- split: train
path: subset_218/train-*
- config_name: subset_219
data_files:
- split: train
path: subset_219/train-*
- config_name: subset_22
data_files:
- split: train
path: subset_22/train-*
- config_name: subset_220
data_files:
- split: train
path: subset_220/train-*
- config_name: subset_221
data_files:
- split: train
path: subset_221/train-*
- config_name: subset_222
data_files:
- split: train
path: subset_222/train-*
- config_name: subset_223
data_files:
- split: train
path: subset_223/train-*
- config_name: subset_224
data_files:
- split: train
path: subset_224/train-*
- config_name: subset_225
data_files:
- split: train
path: subset_225/train-*
- config_name: subset_226
data_files:
- split: train
path: subset_226/train-*
- config_name: subset_227
data_files:
- split: train
path: subset_227/train-*
- config_name: subset_228
data_files:
- split: train
path: subset_228/train-*
- config_name: subset_229
data_files:
- split: train
path: subset_229/train-*
- config_name: subset_23
data_files:
- split: train
path: subset_23/train-*
- config_name: subset_230
data_files:
- split: train
path: subset_230/train-*
- config_name: subset_231
data_files:
- split: train
path: subset_231/train-*
- config_name: subset_232
data_files:
- split: train
path: subset_232/train-*
- config_name: subset_233
data_files:
- split: train
path: subset_233/train-*
- config_name: subset_234
data_files:
- split: train
path: subset_234/train-*
- config_name: subset_235
data_files:
- split: train
path: subset_235/train-*
- config_name: subset_236
data_files:
- split: train
path: subset_236/train-*
- config_name: subset_237
data_files:
- split: train
path: subset_237/train-*
- config_name: subset_238
data_files:
- split: train
path: subset_238/train-*
- config_name: subset_239
data_files:
- split: train
path: subset_239/train-*
- config_name: subset_24
data_files:
- split: train
path: subset_24/train-*
- config_name: subset_240
data_files:
- split: train
path: subset_240/train-*
- config_name: subset_241
data_files:
- split: train
path: subset_241/train-*
- config_name: subset_242
data_files:
- split: train
path: subset_242/train-*
- config_name: subset_243
data_files:
- split: train
path: subset_243/train-*
- config_name: subset_244
data_files:
- split: train
path: subset_244/train-*
- config_name: subset_245
data_files:
- split: train
path: subset_245/train-*
- config_name: subset_246
data_files:
- split: train
path: subset_246/train-*
- config_name: subset_247
data_files:
- split: train
path: subset_247/train-*
- config_name: subset_248
data_files:
- split: train
path: subset_248/train-*
- config_name: subset_249
data_files:
- split: train
path: subset_249/train-*
- config_name: subset_25
data_files:
- split: train
path: subset_25/train-*
- config_name: subset_250
data_files:
- split: train
path: subset_250/train-*
- config_name: subset_251
data_files:
- split: train
path: subset_251/train-*
- config_name: subset_252
data_files:
- split: train
path: subset_252/train-*
- config_name: subset_253
data_files:
- split: train
path: subset_253/train-*
- config_name: subset_254
data_files:
- split: train
path: subset_254/train-*
- config_name: subset_255
data_files:
- split: train
path: subset_255/train-*
- config_name: subset_256
data_files:
- split: train
path: subset_256/train-*
- config_name: subset_257
data_files:
- split: train
path: subset_257/train-*
- config_name: subset_258
data_files:
- split: train
path: subset_258/train-*
- config_name: subset_26
data_files:
- split: train
path: subset_26/train-*
- config_name: subset_27
data_files:
- split: train
path: subset_27/train-*
- config_name: subset_28
data_files:
- split: train
path: subset_28/train-*
- config_name: subset_29
data_files:
- split: train
path: subset_29/train-*
- config_name: subset_3
data_files:
- split: train
path: subset_3/train-*
- config_name: subset_30
data_files:
- split: train
path: subset_30/train-*
- config_name: subset_31
data_files:
- split: train
path: subset_31/train-*
- config_name: subset_32
data_files:
- split: train
path: subset_32/train-*
- config_name: subset_33
data_files:
- split: train
path: subset_33/train-*
- config_name: subset_34
data_files:
- split: train
path: subset_34/train-*
- config_name: subset_35
data_files:
- split: train
path: subset_35/train-*
- config_name: subset_36
data_files:
- split: train
path: subset_36/train-*
- config_name: subset_37
data_files:
- split: train
path: subset_37/train-*
- config_name: subset_38
data_files:
- split: train
path: subset_38/train-*
- config_name: subset_39
data_files:
- split: train
path: subset_39/train-*
- config_name: subset_4
data_files:
- split: train
path: subset_4/train-*
- config_name: subset_40
data_files:
- split: train
path: subset_40/train-*
- config_name: subset_41
data_files:
- split: train
path: subset_41/train-*
- config_name: subset_42
data_files:
- split: train
path: subset_42/train-*
- config_name: subset_43
data_files:
- split: train
path: subset_43/train-*
- config_name: subset_44
data_files:
- split: train
path: subset_44/train-*
- config_name: subset_45
data_files:
- split: train
path: subset_45/train-*
- config_name: subset_46
data_files:
- split: train
path: subset_46/train-*
- config_name: subset_47
data_files:
- split: train
path: subset_47/train-*
- config_name: subset_48
data_files:
- split: train
path: subset_48/train-*
- config_name: subset_49
data_files:
- split: train
path: subset_49/train-*
- config_name: subset_5
data_files:
- split: train
path: subset_5/train-*
- config_name: subset_50
data_files:
- split: train
path: subset_50/train-*
- config_name: subset_51
data_files:
- split: train
path: subset_51/train-*
- config_name: subset_52
data_files:
- split: train
path: subset_52/train-*
- config_name: subset_53
data_files:
- split: train
path: subset_53/train-*
- config_name: subset_54
data_files:
- split: train
path: subset_54/train-*
- config_name: subset_55
data_files:
- split: train
path: subset_55/train-*
- config_name: subset_56
data_files:
- split: train
path: subset_56/train-*
- config_name: subset_57
data_files:
- split: train
path: subset_57/train-*
- config_name: subset_58
data_files:
- split: train
path: subset_58/train-*
- config_name: subset_59
data_files:
- split: train
path: subset_59/train-*
- config_name: subset_6
data_files:
- split: train
path: subset_6/train-*
- config_name: subset_60
data_files:
- split: train
path: subset_60/train-*
- config_name: subset_61
data_files:
- split: train
path: subset_61/train-*
- config_name: subset_62
data_files:
- split: train
path: subset_62/train-*
- config_name: subset_63
data_files:
- split: train
path: subset_63/train-*
- config_name: subset_64
data_files:
- split: train
path: subset_64/train-*
- config_name: subset_65
data_files:
- split: train
path: subset_65/train-*
- config_name: subset_66
data_files:
- split: train
path: subset_66/train-*
- config_name: subset_67
data_files:
- split: train
path: subset_67/train-*
- config_name: subset_68
data_files:
- split: train
path: subset_68/train-*
- config_name: subset_69
data_files:
- split: train
path: subset_69/train-*
- config_name: subset_7
data_files:
- split: train
path: subset_7/train-*
- config_name: subset_70
data_files:
- split: train
path: subset_70/train-*
- config_name: subset_71
data_files:
- split: train
path: subset_71/train-*
- config_name: subset_72
data_files:
- split: train
path: subset_72/train-*
- config_name: subset_73
data_files:
- split: train
path: subset_73/train-*
- config_name: subset_74
data_files:
- split: train
path: subset_74/train-*
- config_name: subset_75
data_files:
- split: train
path: subset_75/train-*
- config_name: subset_76
data_files:
- split: train
path: subset_76/train-*
- config_name: subset_77
data_files:
- split: train
path: subset_77/train-*
- config_name: subset_78
data_files:
- split: train
path: subset_78/train-*
- config_name: subset_79
data_files:
- split: train
path: subset_79/train-*
- config_name: subset_8
data_files:
- split: train
path: subset_8/train-*
- config_name: subset_80
data_files:
- split: train
path: subset_80/train-*
- config_name: subset_81
data_files:
- split: train
path: subset_81/train-*
- config_name: subset_82
data_files:
- split: train
path: subset_82/train-*
- config_name: subset_83
data_files:
- split: train
path: subset_83/train-*
- config_name: subset_84
data_files:
- split: train
path: subset_84/train-*
- config_name: subset_85
data_files:
- split: train
path: subset_85/train-*
- config_name: subset_86
data_files:
- split: train
path: subset_86/train-*
- config_name: subset_87
data_files:
- split: train
path: subset_87/train-*
- config_name: subset_88
data_files:
- split: train
path: subset_88/train-*
- config_name: subset_89
data_files:
- split: train
path: subset_89/train-*
- config_name: subset_9
data_files:
- split: train
path: subset_9/train-*
- config_name: subset_90
data_files:
- split: train
path: subset_90/train-*
- config_name: subset_91
data_files:
- split: train
path: subset_91/train-*
- config_name: subset_92
data_files:
- split: train
path: subset_92/train-*
- config_name: subset_93
data_files:
- split: train
path: subset_93/train-*
- config_name: subset_94
data_files:
- split: train
path: subset_94/train-*
- config_name: subset_95
data_files:
- split: train
path: subset_95/train-*
- config_name: subset_96
data_files:
- split: train
path: subset_96/train-*
- config_name: subset_97
data_files:
- split: train
path: subset_97/train-*
- config_name: subset_98
data_files:
- split: train
path: subset_98/train-*
- config_name: subset_99
data_files:
- split: train
path: subset_99/train-*
---
提供机构:
asahi417
原始信息汇总
数据集概述
数据集配置
-
subset_1
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1962 examples, 4178187 bytes
- 下载大小: 4697629 bytes
- 数据集大小: 4178187 bytes
- 特征:
-
subset_10
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 2031 examples, 4325241 bytes
- 下载大小: 4800589 bytes
- 数据集大小: 4325241 bytes
- 特征:
-
subset_100
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1891 examples, 4027109 bytes
- 下载大小: 4560652 bytes
- 数据集大小: 4027109 bytes
- 特征:
-
subset_101
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1885 examples, 4014383 bytes
- 下载大小: 4536325 bytes
- 数据集大小: 4014383 bytes
- 特征:
-
subset_102
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1863 examples, 3967490 bytes
- 下载大小: 4469938 bytes
- 数据集大小: 3967490 bytes
- 特征:
-
subset_103
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1861 examples, 3963253 bytes
- 下载大小: 4478877 bytes
- 数据集大小: 3963253 bytes
- 特征:
-
subset_104
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1875 examples, 3993050 bytes
- 下载大小: 4511226 bytes
- 数据集大小: 3993050 bytes
- 特征:
-
subset_105
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1871 examples, 3984522 bytes
- 下载大小: 4511926 bytes
- 数据集大小: 3984522 bytes
- 特征:
-
subset_106
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1865 examples, 3971782 bytes
- 下载大小: 4471550 bytes
- 数据集大小: 3971782 bytes
- 特征:
-
subset_107
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1838 examples, 3914294 bytes
- 下载大小: 4423934 bytes
- 数据集大小: 3914294 bytes
- 特征:
-
subset_108
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1860 examples, 3961153 bytes
- 下载大小: 4492033 bytes
- 数据集大小: 3961153 bytes
- 特征:
-
subset_109
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1866 examples, 3973882 bytes
- 下载大小: 4493942 bytes
- 数据集大小: 3973882 bytes
- 特征:
-
subset_11
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1994 examples, 4246495 bytes
- 下载大小: 4741778 bytes
- 数据集大小: 4246495 bytes
- 特征:
-
subset_110
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1843 examples, 3924898 bytes
- 下载大小: 4441323 bytes
- 数据集大小: 3924898 bytes
- 特征:
-
subset_111
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1845 examples, 3929176 bytes
- 下载大小: 4448621 bytes
- 数据集大小: 3929176 bytes
- 特征:
-
subset_112
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1844 examples, 3927021 bytes
- 下载大小: 4426963 bytes
- 数据集大小: 3927021 bytes
- 特征:
-
subset_113
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1839 examples, 3916382 bytes
- 下载大小: 4398593 bytes
- 数据集大小: 3916382 bytes
- 特征:
-
subset_114
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1851 examples, 3941981 bytes
- 下载大小: 4461303 bytes
- 数据集大小: 3941981 bytes
- 特征:
-
subset_115
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1821 examples, 3878073 bytes
- 下载大小: 4404239 bytes
- 数据集大小: 3878073 bytes
- 特征:
-
subset_116
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1837 examples, 3912139 bytes
- 下载大小: 4430164 bytes
- 数据集大小: 3912139 bytes
- 特征:
-
subset_117
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1854 examples, 3948349 bytes
- 下载大小: 4469661 bytes
- 数据集大小: 3948349 bytes
- 特征:
-
subset_118
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- enA.audio.speaker_embedding: sequence: float32
- zhA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1814 examples, 3863163 bytes
- 下载大小: 4364133 bytes
- 数据集大小: 3863163 bytes
- 特征:
-
subset_119
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 1823 examples, 3882316 bytes
- 下载大小: 4379942 bytes
- 数据集大小: 3882316 bytes
- 特征:
-
subset_12
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zhA.laser_score: float64
- zhA.audio.speaker_embedding: sequence: float32
- enA.audio.speaker_embedding: sequence: float32
- 分割:
- train: 2034 examples, 4331586 bytes
- 下载大小: 4836292 bytes
- 数据集大小: 4331586 bytes
- 特征:
-
subset_120
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- zhA.id: string
- zh
- 特征:



