asahi417/seamless-align-enA-viA.speaker-embedding.metavoice
收藏Hugging Face2024-06-02 更新2024-06-12 收录
下载链接:
https://hf-mirror.com/datasets/asahi417/seamless-align-enA-viA.speaker-embedding.metavoice
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: subset_1
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3946355
num_examples: 1853
download_size: 4372012
dataset_size: 3946355
- config_name: subset_10
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2321244
num_examples: 1090
download_size: 2465259
dataset_size: 2321244
- config_name: subset_100
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3352018
num_examples: 1574
download_size: 3717499
dataset_size: 3352018
- config_name: subset_101
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3396787
num_examples: 1595
download_size: 3755313
dataset_size: 3396787
- config_name: subset_102
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3390391
num_examples: 1592
download_size: 3747644
dataset_size: 3390391
- config_name: subset_103
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3322254
num_examples: 1560
download_size: 3684229
dataset_size: 3322254
- config_name: subset_104
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3234911
num_examples: 1519
download_size: 3578891
dataset_size: 3234911
- config_name: subset_105
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3343509
num_examples: 1570
download_size: 3687977
dataset_size: 3343509
- config_name: subset_106
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3332893
num_examples: 1565
download_size: 3692437
dataset_size: 3332893
- config_name: subset_107
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3341440
num_examples: 1569
download_size: 3708966
dataset_size: 3341440
- config_name: subset_108
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3384039
num_examples: 1589
download_size: 3746884
dataset_size: 3384039
- config_name: subset_109
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3373339
num_examples: 1584
download_size: 3735430
dataset_size: 3373339
- config_name: subset_11
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2440568
num_examples: 1146
download_size: 2630332
dataset_size: 2440568
- config_name: subset_110
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3254084
num_examples: 1528
download_size: 3591910
dataset_size: 3254084
- config_name: subset_111
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3213652
num_examples: 1509
download_size: 3569229
dataset_size: 3213652
- config_name: subset_112
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3275401
num_examples: 1538
download_size: 3631987
dataset_size: 3275401
- config_name: subset_113
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3292418
num_examples: 1546
download_size: 3651878
dataset_size: 3292418
- config_name: subset_114
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3264757
num_examples: 1533
download_size: 3614785
dataset_size: 3264757
- config_name: subset_115
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3307270
num_examples: 1553
download_size: 3668905
dataset_size: 3307270
- config_name: subset_116
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3288150
num_examples: 1544
download_size: 3667788
dataset_size: 3288150
- config_name: subset_117
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3347771
num_examples: 1572
download_size: 3712765
dataset_size: 3347771
- config_name: subset_118
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3298832
num_examples: 1549
download_size: 3674748
dataset_size: 3298832
- config_name: subset_119
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3383976
num_examples: 1589
download_size: 3743077
dataset_size: 3383976
- config_name: subset_12
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2361739
num_examples: 1109
download_size: 2543444
dataset_size: 2361739
- config_name: subset_120
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3379722
num_examples: 1587
download_size: 3728761
dataset_size: 3379722
- config_name: subset_121
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3394661
num_examples: 1594
download_size: 3748465
dataset_size: 3394661
- config_name: subset_122
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3390395
num_examples: 1592
download_size: 3767643
dataset_size: 3390395
- config_name: subset_123
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3347759
num_examples: 1572
download_size: 3684615
dataset_size: 3347759
- config_name: subset_124
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3300937
num_examples: 1550
download_size: 3660984
dataset_size: 3300937
- config_name: subset_125
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3330736
num_examples: 1564
download_size: 3700309
dataset_size: 3330736
- config_name: subset_126
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3332893
num_examples: 1565
download_size: 3694337
dataset_size: 3332893
- config_name: subset_127
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3352047
num_examples: 1574
download_size: 3733701
dataset_size: 3352047
- config_name: subset_128
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3383973
num_examples: 1589
download_size: 3742855
dataset_size: 3383973
- config_name: subset_129
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3456342
num_examples: 1623
download_size: 3824614
dataset_size: 3456342
- config_name: subset_13
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2442651
num_examples: 1147
download_size: 2622566
dataset_size: 2442651
- config_name: subset_130
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3356311
num_examples: 1576
download_size: 3715538
dataset_size: 3356311
- config_name: subset_131
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3377592
num_examples: 1586
download_size: 3742444
dataset_size: 3377592
- config_name: subset_132
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3335047
num_examples: 1566
download_size: 3688756
dataset_size: 3335047
- config_name: subset_133
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3369083
num_examples: 1582
download_size: 3738767
dataset_size: 3369083
- config_name: subset_134
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3200845
num_examples: 1503
download_size: 3556465
dataset_size: 3200845
- config_name: subset_135
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3151869
num_examples: 1480
download_size: 3517348
dataset_size: 3151869
- config_name: subset_136
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3396766
num_examples: 1595
download_size: 3748631
dataset_size: 3396766
- config_name: subset_137
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3454317
num_examples: 1622
download_size: 3816794
dataset_size: 3454317
- config_name: subset_138
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3396760
num_examples: 1595
download_size: 3781606
dataset_size: 3396760
- config_name: subset_139
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3366945
num_examples: 1581
download_size: 3742818
dataset_size: 3366945
- config_name: subset_14
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2466081
num_examples: 1158
download_size: 2653868
dataset_size: 2466081
- config_name: subset_140
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3352035
num_examples: 1574
download_size: 3709704
dataset_size: 3352035
- config_name: subset_141
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3305223
num_examples: 1552
download_size: 3689934
dataset_size: 3305223
- config_name: subset_142
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3443625
num_examples: 1617
download_size: 3822762
dataset_size: 3443625
- config_name: subset_143
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3437243
num_examples: 1614
download_size: 3826040
dataset_size: 3437243
- config_name: subset_144
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3507446
num_examples: 1647
download_size: 3903543
dataset_size: 3507446
- config_name: subset_145
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3392544
num_examples: 1593
download_size: 3781804
dataset_size: 3392544
- config_name: subset_146
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3413815
num_examples: 1603
download_size: 3790645
dataset_size: 3413815
- config_name: subset_147
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3452143
num_examples: 1621
download_size: 3826197
dataset_size: 3452143
- config_name: subset_148
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3420196
num_examples: 1606
download_size: 3798264
dataset_size: 3420196
- config_name: subset_149
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 404623
num_examples: 190
download_size: 438210
dataset_size: 404623
- config_name: subset_15
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2570457
num_examples: 1207
download_size: 2770690
dataset_size: 2570457
- config_name: subset_16
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2472469
num_examples: 1161
download_size: 2679339
dataset_size: 2472469
- config_name: subset_17
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2549099
num_examples: 1197
download_size: 2750754
dataset_size: 2549099
- config_name: subset_18
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2689715
num_examples: 1263
download_size: 2903357
dataset_size: 2689715
- config_name: subset_19
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2574673
num_examples: 1209
download_size: 2777056
dataset_size: 2574673
- config_name: subset_2
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3188077
num_examples: 1497
download_size: 3466458
dataset_size: 3188077
- config_name: subset_20
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2547040
num_examples: 1196
download_size: 2744853
dataset_size: 2547040
- config_name: subset_21
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2630082
num_examples: 1235
download_size: 2849490
dataset_size: 2630082
- config_name: subset_22
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2574650
num_examples: 1209
download_size: 2794817
dataset_size: 2574650
- config_name: subset_23
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2651349
num_examples: 1245
download_size: 2856738
dataset_size: 2651349
- config_name: subset_24
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2683297
num_examples: 1260
download_size: 2889919
dataset_size: 2683297
- config_name: subset_25
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2747201
num_examples: 1290
download_size: 2982113
dataset_size: 2747201
- config_name: subset_26
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2843001
num_examples: 1335
download_size: 3086417
dataset_size: 2843001
- config_name: subset_27
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2698266
num_examples: 1267
download_size: 2927220
dataset_size: 2698266
- config_name: subset_28
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2787633
num_examples: 1309
download_size: 3024846
dataset_size: 2787633
- config_name: subset_29
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2779174
num_examples: 1305
download_size: 3019625
dataset_size: 2779174
- config_name: subset_3
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2821732
num_examples: 1325
download_size: 3022175
dataset_size: 2821732
- config_name: subset_30
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2796171
num_examples: 1313
download_size: 3017758
dataset_size: 2796171
- config_name: subset_31
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2877116
num_examples: 1351
download_size: 3102010
dataset_size: 2877116
- config_name: subset_32
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2885620
num_examples: 1355
download_size: 3123190
dataset_size: 2885620
- config_name: subset_33
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2875026
num_examples: 1350
download_size: 3126671
dataset_size: 2875026
- config_name: subset_34
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2955913
num_examples: 1388
download_size: 3213770
dataset_size: 2955913
- config_name: subset_35
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2828085
num_examples: 1328
download_size: 3051138
dataset_size: 2828085
- config_name: subset_36
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2919700
num_examples: 1371
download_size: 3191550
dataset_size: 2919700
- config_name: subset_37
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2909088
num_examples: 1366
download_size: 3150727
dataset_size: 2909088
- config_name: subset_38
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2800429
num_examples: 1315
download_size: 3037157
dataset_size: 2800429
- config_name: subset_39
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2770624
num_examples: 1301
download_size: 3012017
dataset_size: 2770624
- config_name: subset_4
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2493778
num_examples: 1171
download_size: 2737069
dataset_size: 2493778
- config_name: subset_40
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2866468
num_examples: 1346
download_size: 3107410
dataset_size: 2866468
- config_name: subset_41
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2653505
num_examples: 1246
download_size: 2884102
dataset_size: 2653505
- config_name: subset_42
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2966548
num_examples: 1393
download_size: 3212888
dataset_size: 2966548
- config_name: subset_43
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2958082
num_examples: 1389
download_size: 3208780
dataset_size: 2958082
- config_name: subset_44
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2977224
num_examples: 1398
download_size: 3238666
dataset_size: 2977224
- config_name: subset_45
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3009155
num_examples: 1413
download_size: 3300403
dataset_size: 3009155
- config_name: subset_46
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2847300
num_examples: 1337
download_size: 3107182
dataset_size: 2847300
- config_name: subset_47
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2990012
num_examples: 1404
download_size: 3263138
dataset_size: 2990012
- config_name: subset_48
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2951646
num_examples: 1386
download_size: 3201977
dataset_size: 2951646
- config_name: subset_49
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3041077
num_examples: 1428
download_size: 3341894
dataset_size: 3041077
- config_name: subset_5
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2406488
num_examples: 1130
download_size: 2621237
dataset_size: 2406488
- config_name: subset_50
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2960211
num_examples: 1390
download_size: 3209904
dataset_size: 2960211
- config_name: subset_51
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3070926
num_examples: 1442
download_size: 3359544
dataset_size: 3070926
- config_name: subset_52
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3139077
num_examples: 1474
download_size: 3441154
dataset_size: 3139077
- config_name: subset_53
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3045373
num_examples: 1430
download_size: 3339780
dataset_size: 3045373
- config_name: subset_54
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3122075
num_examples: 1466
download_size: 3409121
dataset_size: 3122075
- config_name: subset_55
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3073063
num_examples: 1443
download_size: 3387666
dataset_size: 3073063
- config_name: subset_56
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3041116
num_examples: 1428
download_size: 3330036
dataset_size: 3041116
- config_name: subset_57
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3107165
num_examples: 1459
download_size: 3408106
dataset_size: 3107165
- config_name: subset_58
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3194471
num_examples: 1500
download_size: 3506168
dataset_size: 3194471
- config_name: subset_59
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3107112
num_examples: 1459
download_size: 3404140
dataset_size: 3107112
- config_name: subset_6
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2402244
num_examples: 1128
download_size: 2605454
dataset_size: 2402244
- config_name: subset_60
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3102871
num_examples: 1457
download_size: 3422379
dataset_size: 3102871
- config_name: subset_61
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3100763
num_examples: 1456
download_size: 3407939
dataset_size: 3100763
- config_name: subset_62
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3045393
num_examples: 1430
download_size: 3343316
dataset_size: 3045393
- config_name: subset_63
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2930352
num_examples: 1376
download_size: 3211827
dataset_size: 2930352
- config_name: subset_64
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3051754
num_examples: 1433
download_size: 3349211
dataset_size: 3051754
- config_name: subset_65
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3087970
num_examples: 1450
download_size: 3416928
dataset_size: 3087970
- config_name: subset_66
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3096487
num_examples: 1454
download_size: 3408748
dataset_size: 3096487
- config_name: subset_67
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3136944
num_examples: 1473
download_size: 3458292
dataset_size: 3136944
- config_name: subset_68
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3119929
num_examples: 1465
download_size: 3426628
dataset_size: 3119929
- config_name: subset_69
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3113500
num_examples: 1462
download_size: 3419868
dataset_size: 3113500
- config_name: subset_7
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2323384
num_examples: 1091
download_size: 2499611
dataset_size: 2323384
- config_name: subset_70
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3168870
num_examples: 1488
download_size: 3471365
dataset_size: 3168870
- config_name: subset_71
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3141169
num_examples: 1475
download_size: 3454916
dataset_size: 3141169
- config_name: subset_72
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3190197
num_examples: 1498
download_size: 3523199
dataset_size: 3190197
- config_name: subset_73
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3260444
num_examples: 1531
download_size: 3587708
dataset_size: 3260444
- config_name: subset_74
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3290291
num_examples: 1545
download_size: 3611135
dataset_size: 3290291
- config_name: subset_75
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3254106
num_examples: 1528
download_size: 3590004
dataset_size: 3254106
- config_name: subset_76
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3162527
num_examples: 1485
download_size: 3489091
dataset_size: 3162527
- config_name: subset_77
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3154031
num_examples: 1481
download_size: 3463153
dataset_size: 3154031
- config_name: subset_78
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2989986
num_examples: 1404
download_size: 3301715
dataset_size: 2989986
- config_name: subset_79
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3139068
num_examples: 1474
download_size: 3456080
dataset_size: 3139068
- config_name: subset_8
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2257344
num_examples: 1060
download_size: 2436583
dataset_size: 2257344
- config_name: subset_80
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3170988
num_examples: 1489
download_size: 3497335
dataset_size: 3170988
- config_name: subset_81
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3168930
num_examples: 1488
download_size: 3504770
dataset_size: 3168930
- config_name: subset_82
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3213614
num_examples: 1509
download_size: 3551115
dataset_size: 3213614
- config_name: subset_83
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3198684
num_examples: 1502
download_size: 3528756
dataset_size: 3198684
- config_name: subset_84
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3234909
num_examples: 1519
download_size: 3570752
dataset_size: 3234909
- config_name: subset_85
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3177416
num_examples: 1492
download_size: 3507713
dataset_size: 3177416
- config_name: subset_86
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3296666
num_examples: 1548
download_size: 3649844
dataset_size: 3296666
- config_name: subset_87
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3273204
num_examples: 1537
download_size: 3606911
dataset_size: 3273204
- config_name: subset_88
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3286009
num_examples: 1543
download_size: 3634550
dataset_size: 3286009
- config_name: subset_89
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3247642
num_examples: 1525
download_size: 3592506
dataset_size: 3247642
- config_name: subset_9
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 2208415
num_examples: 1037
download_size: 2373841
dataset_size: 2208415
- config_name: subset_90
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3194451
num_examples: 1500
download_size: 3518694
dataset_size: 3194451
- config_name: subset_91
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3230670
num_examples: 1517
download_size: 3567949
dataset_size: 3230670
- config_name: subset_92
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3211474
num_examples: 1508
download_size: 3549585
dataset_size: 3211474
- config_name: subset_93
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3277520
num_examples: 1539
download_size: 3606838
dataset_size: 3277520
- config_name: subset_94
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3320107
num_examples: 1559
download_size: 3673961
dataset_size: 3320107
- config_name: subset_95
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3226358
num_examples: 1515
download_size: 3556487
dataset_size: 3226358
- config_name: subset_96
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: viA.audio.speaker_embedding
sequence: float32
- name: enA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3264715
num_examples: 1533
download_size: 3630906
dataset_size: 3264715
- config_name: subset_97
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3322215
num_examples: 1560
download_size: 3647262
dataset_size: 3322215
- config_name: subset_98
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3241249
num_examples: 1522
download_size: 3578435
dataset_size: 3241249
- config_name: subset_99
features:
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.laser_score
dtype: float64
- name: enA.audio.speaker_embedding
sequence: float32
- name: viA.audio.speaker_embedding
sequence: float32
splits:
- name: train
num_bytes: 3328599
num_examples: 1563
download_size: 3692070
dataset_size: 3328599
configs:
- config_name: subset_1
data_files:
- split: train
path: subset_1/train-*
- config_name: subset_10
data_files:
- split: train
path: subset_10/train-*
- config_name: subset_100
data_files:
- split: train
path: subset_100/train-*
- config_name: subset_101
data_files:
- split: train
path: subset_101/train-*
- config_name: subset_102
data_files:
- split: train
path: subset_102/train-*
- config_name: subset_103
data_files:
- split: train
path: subset_103/train-*
- config_name: subset_104
data_files:
- split: train
path: subset_104/train-*
- config_name: subset_105
data_files:
- split: train
path: subset_105/train-*
- config_name: subset_106
data_files:
- split: train
path: subset_106/train-*
- config_name: subset_107
data_files:
- split: train
path: subset_107/train-*
- config_name: subset_108
data_files:
- split: train
path: subset_108/train-*
- config_name: subset_109
data_files:
- split: train
path: subset_109/train-*
- config_name: subset_11
data_files:
- split: train
path: subset_11/train-*
- config_name: subset_110
data_files:
- split: train
path: subset_110/train-*
- config_name: subset_111
data_files:
- split: train
path: subset_111/train-*
- config_name: subset_112
data_files:
- split: train
path: subset_112/train-*
- config_name: subset_113
data_files:
- split: train
path: subset_113/train-*
- config_name: subset_114
data_files:
- split: train
path: subset_114/train-*
- config_name: subset_115
data_files:
- split: train
path: subset_115/train-*
- config_name: subset_116
data_files:
- split: train
path: subset_116/train-*
- config_name: subset_117
data_files:
- split: train
path: subset_117/train-*
- config_name: subset_118
data_files:
- split: train
path: subset_118/train-*
- config_name: subset_119
data_files:
- split: train
path: subset_119/train-*
- config_name: subset_12
data_files:
- split: train
path: subset_12/train-*
- config_name: subset_120
data_files:
- split: train
path: subset_120/train-*
- config_name: subset_121
data_files:
- split: train
path: subset_121/train-*
- config_name: subset_122
data_files:
- split: train
path: subset_122/train-*
- config_name: subset_123
data_files:
- split: train
path: subset_123/train-*
- config_name: subset_124
data_files:
- split: train
path: subset_124/train-*
- config_name: subset_125
data_files:
- split: train
path: subset_125/train-*
- config_name: subset_126
data_files:
- split: train
path: subset_126/train-*
- config_name: subset_127
data_files:
- split: train
path: subset_127/train-*
- config_name: subset_128
data_files:
- split: train
path: subset_128/train-*
- config_name: subset_129
data_files:
- split: train
path: subset_129/train-*
- config_name: subset_13
data_files:
- split: train
path: subset_13/train-*
- config_name: subset_130
data_files:
- split: train
path: subset_130/train-*
- config_name: subset_131
data_files:
- split: train
path: subset_131/train-*
- config_name: subset_132
data_files:
- split: train
path: subset_132/train-*
- config_name: subset_133
data_files:
- split: train
path: subset_133/train-*
- config_name: subset_134
data_files:
- split: train
path: subset_134/train-*
- config_name: subset_135
data_files:
- split: train
path: subset_135/train-*
- config_name: subset_136
data_files:
- split: train
path: subset_136/train-*
- config_name: subset_137
data_files:
- split: train
path: subset_137/train-*
- config_name: subset_138
data_files:
- split: train
path: subset_138/train-*
- config_name: subset_139
data_files:
- split: train
path: subset_139/train-*
- config_name: subset_14
data_files:
- split: train
path: subset_14/train-*
- config_name: subset_140
data_files:
- split: train
path: subset_140/train-*
- config_name: subset_141
data_files:
- split: train
path: subset_141/train-*
- config_name: subset_142
data_files:
- split: train
path: subset_142/train-*
- config_name: subset_143
data_files:
- split: train
path: subset_143/train-*
- config_name: subset_144
data_files:
- split: train
path: subset_144/train-*
- config_name: subset_145
data_files:
- split: train
path: subset_145/train-*
- config_name: subset_146
data_files:
- split: train
path: subset_146/train-*
- config_name: subset_147
data_files:
- split: train
path: subset_147/train-*
- config_name: subset_148
data_files:
- split: train
path: subset_148/train-*
- config_name: subset_149
data_files:
- split: train
path: subset_149/train-*
- config_name: subset_15
data_files:
- split: train
path: subset_15/train-*
- config_name: subset_16
data_files:
- split: train
path: subset_16/train-*
- config_name: subset_17
data_files:
- split: train
path: subset_17/train-*
- config_name: subset_18
data_files:
- split: train
path: subset_18/train-*
- config_name: subset_19
data_files:
- split: train
path: subset_19/train-*
- config_name: subset_2
data_files:
- split: train
path: subset_2/train-*
- config_name: subset_20
data_files:
- split: train
path: subset_20/train-*
- config_name: subset_21
data_files:
- split: train
path: subset_21/train-*
- config_name: subset_22
data_files:
- split: train
path: subset_22/train-*
- config_name: subset_23
data_files:
- split: train
path: subset_23/train-*
- config_name: subset_24
data_files:
- split: train
path: subset_24/train-*
- config_name: subset_25
data_files:
- split: train
path: subset_25/train-*
- config_name: subset_26
data_files:
- split: train
path: subset_26/train-*
- config_name: subset_27
data_files:
- split: train
path: subset_27/train-*
- config_name: subset_28
data_files:
- split: train
path: subset_28/train-*
- config_name: subset_29
data_files:
- split: train
path: subset_29/train-*
- config_name: subset_3
data_files:
- split: train
path: subset_3/train-*
- config_name: subset_30
data_files:
- split: train
path: subset_30/train-*
- config_name: subset_31
data_files:
- split: train
path: subset_31/train-*
- config_name: subset_32
data_files:
- split: train
path: subset_32/train-*
- config_name: subset_33
data_files:
- split: train
path: subset_33/train-*
- config_name: subset_34
data_files:
- split: train
path: subset_34/train-*
- config_name: subset_35
data_files:
- split: train
path: subset_35/train-*
- config_name: subset_36
data_files:
- split: train
path: subset_36/train-*
- config_name: subset_37
data_files:
- split: train
path: subset_37/train-*
- config_name: subset_38
data_files:
- split: train
path: subset_38/train-*
- config_name: subset_39
data_files:
- split: train
path: subset_39/train-*
- config_name: subset_4
data_files:
- split: train
path: subset_4/train-*
- config_name: subset_40
data_files:
- split: train
path: subset_40/train-*
- config_name: subset_41
data_files:
- split: train
path: subset_41/train-*
- config_name: subset_42
data_files:
- split: train
path: subset_42/train-*
- config_name: subset_43
data_files:
- split: train
path: subset_43/train-*
- config_name: subset_44
data_files:
- split: train
path: subset_44/train-*
- config_name: subset_45
data_files:
- split: train
path: subset_45/train-*
- config_name: subset_46
data_files:
- split: train
path: subset_46/train-*
- config_name: subset_47
data_files:
- split: train
path: subset_47/train-*
- config_name: subset_48
data_files:
- split: train
path: subset_48/train-*
- config_name: subset_49
data_files:
- split: train
path: subset_49/train-*
- config_name: subset_5
data_files:
- split: train
path: subset_5/train-*
- config_name: subset_50
data_files:
- split: train
path: subset_50/train-*
- config_name: subset_51
data_files:
- split: train
path: subset_51/train-*
- config_name: subset_52
data_files:
- split: train
path: subset_52/train-*
- config_name: subset_53
data_files:
- split: train
path: subset_53/train-*
- config_name: subset_54
data_files:
- split: train
path: subset_54/train-*
- config_name: subset_55
data_files:
- split: train
path: subset_55/train-*
- config_name: subset_56
data_files:
- split: train
path: subset_56/train-*
- config_name: subset_57
data_files:
- split: train
path: subset_57/train-*
- config_name: subset_58
data_files:
- split: train
path: subset_58/train-*
- config_name: subset_59
data_files:
- split: train
path: subset_59/train-*
- config_name: subset_6
data_files:
- split: train
path: subset_6/train-*
- config_name: subset_60
data_files:
- split: train
path: subset_60/train-*
- config_name: subset_61
data_files:
- split: train
path: subset_61/train-*
- config_name: subset_62
data_files:
- split: train
path: subset_62/train-*
- config_name: subset_63
data_files:
- split: train
path: subset_63/train-*
- config_name: subset_64
data_files:
- split: train
path: subset_64/train-*
- config_name: subset_65
data_files:
- split: train
path: subset_65/train-*
- config_name: subset_66
data_files:
- split: train
path: subset_66/train-*
- config_name: subset_67
data_files:
- split: train
path: subset_67/train-*
- config_name: subset_68
data_files:
- split: train
path: subset_68/train-*
- config_name: subset_69
data_files:
- split: train
path: subset_69/train-*
- config_name: subset_7
data_files:
- split: train
path: subset_7/train-*
- config_name: subset_70
data_files:
- split: train
path: subset_70/train-*
- config_name: subset_71
data_files:
- split: train
path: subset_71/train-*
- config_name: subset_72
data_files:
- split: train
path: subset_72/train-*
- config_name: subset_73
data_files:
- split: train
path: subset_73/train-*
- config_name: subset_74
data_files:
- split: train
path: subset_74/train-*
- config_name: subset_75
data_files:
- split: train
path: subset_75/train-*
- config_name: subset_76
data_files:
- split: train
path: subset_76/train-*
- config_name: subset_77
data_files:
- split: train
path: subset_77/train-*
- config_name: subset_78
data_files:
- split: train
path: subset_78/train-*
- config_name: subset_79
data_files:
- split: train
path: subset_79/train-*
- config_name: subset_8
data_files:
- split: train
path: subset_8/train-*
- config_name: subset_80
data_files:
- split: train
path: subset_80/train-*
- config_name: subset_81
data_files:
- split: train
path: subset_81/train-*
- config_name: subset_82
data_files:
- split: train
path: subset_82/train-*
- config_name: subset_83
data_files:
- split: train
path: subset_83/train-*
- config_name: subset_84
data_files:
- split: train
path: subset_84/train-*
- config_name: subset_85
data_files:
- split: train
path: subset_85/train-*
- config_name: subset_86
data_files:
- split: train
path: subset_86/train-*
- config_name: subset_87
data_files:
- split: train
path: subset_87/train-*
- config_name: subset_88
data_files:
- split: train
path: subset_88/train-*
- config_name: subset_89
data_files:
- split: train
path: subset_89/train-*
- config_name: subset_9
data_files:
- split: train
path: subset_9/train-*
- config_name: subset_90
data_files:
- split: train
path: subset_90/train-*
- config_name: subset_91
data_files:
- split: train
path: subset_91/train-*
- config_name: subset_92
data_files:
- split: train
path: subset_92/train-*
- config_name: subset_93
data_files:
- split: train
path: subset_93/train-*
- config_name: subset_94
data_files:
- split: train
path: subset_94/train-*
- config_name: subset_95
data_files:
- split: train
path: subset_95/train-*
- config_name: subset_96
data_files:
- split: train
path: subset_96/train-*
- config_name: subset_97
data_files:
- split: train
path: subset_97/train-*
- config_name: subset_98
data_files:
- split: train
path: subset_98/train-*
- config_name: subset_99
data_files:
- split: train
path: subset_99/train-*
---
数据集信息:
- 配置名称:subset_1
特征:
- 字段名:line_no,数据类型:int64(64位整数)
- 字段名:enA.id,数据类型:string(字符串),表示英语(enA)侧样本的标识符
- 字段名:enA.laser_score,数据类型:float64(64位浮点数),表示英语(enA)侧样本的LASER评分
- 字段名:viA.id,数据类型:string(字符串),表示越南语(viA)侧样本的标识符
- 字段名:viA.laser_score,数据类型:float64(64位浮点数),表示越南语(viA)侧样本的LASER评分
- 字段名:enA.audio.speaker_embedding,数据类型:float32序列(32位浮点数序列),表示英语(enA)侧音频的说话人嵌入
- 字段名:viA.audio.speaker_embedding,数据类型:float32序列(32位浮点数序列),表示越南语(viA)侧音频的说话人嵌入
数据拆分:
- 拆分名称:train(训练集),字节数:3946355,样本数量:1853
下载大小:4372012,数据集大小:3946355
- 配置名称:subset_10
特征与subset_1一致
数据拆分:
- 拆分名称:train(训练集),字节数:2321244,样本数量:1090
下载大小:2465259,数据集大小:2321244
- 配置名称:subset_100
特征字段与subset_1相同,但最后两个字段的顺序互换(viA.audio.speaker_embedding 在前,enA.audio.speaker_embedding 在后)
数据拆分:
- 拆分名称:train(训练集),字节数:3352018,样本数量:1574
下载大小:3717499,数据集大小:3352018
...(其余配置子集均遵循上述结构,特征字段与subset_1一致,仅数据拆分的字节数、样本数量、下载大小及数据集大小存在差异)
配置项:
- 配置名称:subset_1,数据文件:
- 拆分:train(训练集),路径:subset_1/train-*
- 配置名称:subset_10,数据文件:
- 拆分:train(训练集),路径:subset_10/train-*
- 配置名称:subset_100,数据文件:
- 拆分:train(训练集),路径:subset_100/train-*
...(其余配置项均遵循上述结构,对应各自的子集路径)
提供机构:
asahi417
原始信息汇总
数据集概述
子集1 (subset_1)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1853 examples, 3946355 bytes
- 下载大小: 4372012 bytes
- 数据集大小: 3946355 bytes
子集10 (subset_10)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1090 examples, 2321244 bytes
- 下载大小: 2465259 bytes
- 数据集大小: 2321244 bytes
子集100 (subset_100)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- viA.audio.speaker_embedding: sequence of float32
- enA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1574 examples, 3352018 bytes
- 下载大小: 3717499 bytes
- 数据集大小: 3352018 bytes
子集101 (subset_101)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- viA.audio.speaker_embedding: sequence of float32
- enA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1595 examples, 3396787 bytes
- 下载大小: 3755313 bytes
- 数据集大小: 3396787 bytes
子集102 (subset_102)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1592 examples, 3390391 bytes
- 下载大小: 3747644 bytes
- 数据集大小: 3390391 bytes
子集103 (subset_103)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1560 examples, 3322254 bytes
- 下载大小: 3684229 bytes
- 数据集大小: 3322254 bytes
子集104 (subset_104)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1519 examples, 3234911 bytes
- 下载大小: 3578891 bytes
- 数据集大小: 3234911 bytes
子集105 (subset_105)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1570 examples, 3343509 bytes
- 下载大小: 3687977 bytes
- 数据集大小: 3343509 bytes
子集106 (subset_106)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1565 examples, 3332893 bytes
- 下载大小: 3692437 bytes
- 数据集大小: 3332893 bytes
子集107 (subset_107)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1569 examples, 3341440 bytes
- 下载大小: 3708966 bytes
- 数据集大小: 3341440 bytes
子集108 (subset_108)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1589 examples, 3384039 bytes
- 下载大小: 3746884 bytes
- 数据集大小: 3384039 bytes
子集109 (subset_109)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1584 examples, 3373339 bytes
- 下载大小: 3735430 bytes
- 数据集大小: 3373339 bytes
子集11 (subset_11)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1146 examples, 2440568 bytes
- 下载大小: 2630332 bytes
- 数据集大小: 2440568 bytes
子集110 (subset_110)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1528 examples, 3254084 bytes
- 下载大小: 3591910 bytes
- 数据集大小: 3254084 bytes
子集111 (subset_111)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1509 examples, 3213652 bytes
- 下载大小: 3569229 bytes
- 数据集大小: 3213652 bytes
子集112 (subset_112)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1538 examples, 3275401 bytes
- 下载大小: 3631987 bytes
- 数据集大小: 3275401 bytes
子集113 (subset_113)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1546 examples, 3292418 bytes
- 下载大小: 3651878 bytes
- 数据集大小: 3292418 bytes
子集114 (subset_114)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1533 examples, 3264757 bytes
- 下载大小: 3614785 bytes
- 数据集大小: 3264757 bytes
子集115 (subset_115)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1553 examples, 3307270 bytes
- 下载大小: 3668905 bytes
- 数据集大小: 3307270 bytes
子集116 (subset_116)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1544 examples, 3288150 bytes
- 下载大小: 3667788 bytes
- 数据集大小: 3288150 bytes
子集117 (subset_117)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1572 examples, 3347771 bytes
- 下载大小: 3712765 bytes
- 数据集大小: 3347771 bytes
子集118 (subset_118)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1549 examples, 3298832 bytes
- 下载大小: 3674748 bytes
- 数据集大小: 3298832 bytes
子集119 (subset_119)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1589 examples, 3383976 bytes
- 下载大小: 3743077 bytes
- 数据集大小: 3383976 bytes
子集12 (subset_12)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- viA.laser_score: float64
- enA.audio.speaker_embedding: sequence of float32
- viA.audio.speaker_embedding: sequence of float32
- 分割:
- train: 1109 examples, 2361739 bytes
- 下载大小: 2543444 bytes
- 数据集大小: 2361739 bytes
子集120 (subset_120)
- 特征:
- line_no: int64
- enA.id: string
- enA.laser_score: float64
- viA.id: string
- vi



