asahi417/seamless-align-enA-viA
收藏Hugging Face2024-06-01 更新2024-06-12 收录
下载链接:
https://hf-mirror.com/datasets/asahi417/seamless-align-enA-viA
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: subset_1
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 310875698.231
num_examples: 1873
download_size: 308530375
dataset_size: 310875698.231
- config_name: subset_10
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 149955109.948
num_examples: 1092
download_size: 146857826
dataset_size: 149955109.948
- config_name: subset_100
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 223956333.212
num_examples: 1579
download_size: 226057233
dataset_size: 223956333.212
- config_name: subset_101
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 231032122.276
num_examples: 1602
download_size: 227637023
dataset_size: 231032122.276
- config_name: subset_102
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 232900680.766
num_examples: 1602
download_size: 231018926
dataset_size: 232900680.766
- config_name: subset_103
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227524749.978
num_examples: 1566
download_size: 225183888
dataset_size: 227524749.978
- config_name: subset_104
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 219203850.624
num_examples: 1533
download_size: 216784773
dataset_size: 219203850.624
- config_name: subset_105
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 229345952.545
num_examples: 1579
download_size: 223684351
dataset_size: 229345952.545
- config_name: subset_106
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227860903.064
num_examples: 1572
download_size: 225460466
dataset_size: 227860903.064
- config_name: subset_107
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 230034699.8
num_examples: 1580
download_size: 229436008
dataset_size: 230034699.8
- config_name: subset_108
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 229984236.205
num_examples: 1595
download_size: 227003908
dataset_size: 229984236.205
- config_name: subset_109
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 230223518.904
num_examples: 1592
download_size: 229888287
dataset_size: 230223518.904
- config_name: subset_11
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 159427053.981
num_examples: 1149
download_size: 157508759
dataset_size: 159427053.981
- config_name: subset_110
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 221202904.385
num_examples: 1545
download_size: 216917344
dataset_size: 221202904.385
- config_name: subset_111
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 222022142.521
num_examples: 1541
download_size: 221692410
dataset_size: 222022142.521
- config_name: subset_112
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 223541761.058
num_examples: 1574
download_size: 222885517
dataset_size: 223541761.058
- config_name: subset_113
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227046162.64
num_examples: 1570
download_size: 225591085
dataset_size: 227046162.64
- config_name: subset_114
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227709702.89
num_examples: 1546
download_size: 226767725
dataset_size: 227709702.89
- config_name: subset_115
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 228926744.736
num_examples: 1566
download_size: 224568565
dataset_size: 228926744.736
- config_name: subset_116
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227653832.943
num_examples: 1561
download_size: 232146377
dataset_size: 227653832.943
- config_name: subset_117
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227743285.512
num_examples: 1582
download_size: 224092845
dataset_size: 227743285.512
- config_name: subset_118
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227900796.96
num_examples: 1560
download_size: 230509185
dataset_size: 227900796.96
- config_name: subset_119
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 223083481.146
num_examples: 1597
download_size: 226456315
dataset_size: 223083481.146
- config_name: subset_12
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 149419294.92
num_examples: 1116
download_size: 145387701
dataset_size: 149419294.92
- config_name: subset_120
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 226304614.435
num_examples: 1595
download_size: 224233079
dataset_size: 226304614.435
- config_name: subset_121
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 230882729.604
num_examples: 1609
download_size: 229141571
dataset_size: 230882729.604
- config_name: subset_122
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 238447274.748
num_examples: 1613
download_size: 234558465
dataset_size: 238447274.748
- config_name: subset_123
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 232748237.677
num_examples: 1591
download_size: 226306521
dataset_size: 232748237.677
- config_name: subset_124
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 231983208.555
num_examples: 1565
download_size: 227923039
dataset_size: 231983208.555
- config_name: subset_125
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 227690230.136
num_examples: 1576
download_size: 230570896
dataset_size: 227690230.136
- config_name: subset_126
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 235160086.532
num_examples: 1572
download_size: 233481121
dataset_size: 235160086.532
- config_name: subset_127
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 240618942.242
num_examples: 1581
download_size: 237076316
dataset_size: 240618942.242
- config_name: subset_128
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 230061431.695
num_examples: 1599
download_size: 229299204
dataset_size: 230061431.695
- config_name: subset_129
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 234189078.41
num_examples: 1630
download_size: 232346165
dataset_size: 234189078.41
- config_name: subset_13
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 152914560.13
num_examples: 1154
download_size: 148938968
dataset_size: 152914560.13
- config_name: subset_130
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 233080252.61
num_examples: 1586
download_size: 230235284
dataset_size: 233080252.61
- config_name: subset_131
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 228739289.225
num_examples: 1595
download_size: 231496717
dataset_size: 228739289.225
- config_name: subset_132
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 226494815.064
num_examples: 1576
download_size: 227722327
dataset_size: 226494815.064
- config_name: subset_133
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 233293851.104
num_examples: 1603
download_size: 235022943
dataset_size: 233293851.104
- config_name: subset_134
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 231775389.503
num_examples: 1511
download_size: 230666679
dataset_size: 231775389.503
- config_name: subset_135
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 225773678.04
num_examples: 1484
download_size: 225762769
dataset_size: 225773678.04
- config_name: subset_136
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 232262750.32
num_examples: 1604
download_size: 229876414
dataset_size: 232262750.32
- config_name: subset_137
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 240627285.857
num_examples: 1633
download_size: 236622510
dataset_size: 240627285.857
- config_name: subset_138
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 239299377.065
num_examples: 1601
download_size: 238661872
dataset_size: 239299377.065
- config_name: subset_139
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 234999461.34
num_examples: 1588
download_size: 234537745
dataset_size: 234999461.34
- config_name: subset_14
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 154341555.289
num_examples: 1161
download_size: 151311166
dataset_size: 154341555.289
- config_name: subset_140
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 228155801.9
num_examples: 1578
download_size: 230951364
dataset_size: 228155801.9
- config_name: subset_141
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 236897269.32
num_examples: 1560
download_size: 232718766
dataset_size: 236897269.32
- config_name: subset_142
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 240248711.52
num_examples: 1624
download_size: 240163141
dataset_size: 240248711.52
- config_name: subset_143
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 244276889.66
num_examples: 1620
download_size: 243264596
dataset_size: 244276889.66
- config_name: subset_144
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 247766886.287
num_examples: 1653
download_size: 246696467
dataset_size: 247766886.287
- config_name: subset_145
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 239955104.664
num_examples: 1599
download_size: 241078776
dataset_size: 239955104.664
- config_name: subset_146
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 235630392.648
num_examples: 1608
download_size: 239247793
dataset_size: 235630392.648
- config_name: subset_147
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 250432343.098
num_examples: 1626
download_size: 246276516
dataset_size: 250432343.098
- config_name: subset_148
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 239373922.616
num_examples: 1609
download_size: 237156605
dataset_size: 239373922.616
- config_name: subset_149
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 28850858.0
num_examples: 190
download_size: 28752902
dataset_size: 28850858.0
- config_name: subset_15
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 158704821.112
num_examples: 1212
download_size: 156250069
dataset_size: 158704821.112
- config_name: subset_16
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 155209942.72
num_examples: 1161
download_size: 154114284
dataset_size: 155209942.72
- config_name: subset_17
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 163391398.17
num_examples: 1205
download_size: 159061334
dataset_size: 163391398.17
- config_name: subset_18
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 163791628.69
num_examples: 1271
download_size: 161745864
dataset_size: 163791628.69
- config_name: subset_19
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 155977557.193
num_examples: 1211
download_size: 155982997
dataset_size: 155977557.193
- config_name: subset_2
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 255383348.999
num_examples: 1501
download_size: 242972339
dataset_size: 255383348.999
- config_name: subset_20
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 156223584.554
num_examples: 1202
download_size: 153141144
dataset_size: 156223584.554
- config_name: subset_21
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 161855596.52
num_examples: 1240
download_size: 158053336
dataset_size: 161855596.52
- config_name: subset_22
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 158406301.458
num_examples: 1213
download_size: 157210561
dataset_size: 158406301.458
- config_name: subset_23
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 167749186.202
num_examples: 1249
download_size: 162940216
dataset_size: 167749186.202
- config_name: subset_24
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 165062454.332
num_examples: 1262
download_size: 159480676
dataset_size: 165062454.332
- config_name: subset_25
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 170347855.908
num_examples: 1298
download_size: 168544155
dataset_size: 170347855.908
- config_name: subset_26
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 173806911.921
num_examples: 1343
download_size: 172313240
dataset_size: 173806911.921
- config_name: subset_27
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 161992905.943
num_examples: 1273
download_size: 162178088
dataset_size: 161992905.943
- config_name: subset_28
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 178872749.754
num_examples: 1318
download_size: 173492414
dataset_size: 178872749.754
- config_name: subset_29
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 171459561.584
num_examples: 1312
download_size: 169633295
dataset_size: 171459561.584
- config_name: subset_3
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 214986145.46
num_examples: 1332
download_size: 204928920
dataset_size: 214986145.46
- config_name: subset_30
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 169084862.305
num_examples: 1317
download_size: 168033628
dataset_size: 169084862.305
- config_name: subset_31
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 173661661.416
num_examples: 1364
download_size: 173691965
dataset_size: 173661661.416
- config_name: subset_32
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 175707583.6
num_examples: 1368
download_size: 173173915
dataset_size: 175707583.6
- config_name: subset_33
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 177043168.56
num_examples: 1360
download_size: 175684340
dataset_size: 177043168.56
- config_name: subset_34
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 188630816.356
num_examples: 1397
download_size: 185736894
dataset_size: 188630816.356
- config_name: subset_35
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 171525586.072
num_examples: 1333
download_size: 170348116
dataset_size: 171525586.072
- config_name: subset_36
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 184316589.125
num_examples: 1379
download_size: 181497104
dataset_size: 184316589.125
- config_name: subset_37
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 178336192.292
num_examples: 1372
download_size: 176190963
dataset_size: 178336192.292
- config_name: subset_38
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 173407451.331
num_examples: 1327
download_size: 172073991
dataset_size: 173407451.331
- config_name: subset_39
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 173654076.07
num_examples: 1331
download_size: 171034686
dataset_size: 173654076.07
- config_name: subset_4
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 179584766.498
num_examples: 1178
download_size: 179984981
dataset_size: 179584766.498
- config_name: subset_40
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 175794155.758
num_examples: 1383
download_size: 177307587
dataset_size: 175794155.758
- config_name: subset_41
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 170720868.75
num_examples: 1250
download_size: 167296596
dataset_size: 170720868.75
- config_name: subset_42
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 185513579.8
num_examples: 1400
download_size: 182885965
dataset_size: 185513579.8
- config_name: subset_43
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 184311653.184
num_examples: 1396
download_size: 181481075
dataset_size: 184311653.184
- config_name: subset_44
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 186517797.03
num_examples: 1402
download_size: 183790122
dataset_size: 186517797.03
- config_name: subset_45
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 183945771.902
num_examples: 1414
download_size: 179222296
dataset_size: 183945771.902
- config_name: subset_46
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 180070600.582
num_examples: 1337
download_size: 178093153
dataset_size: 180070600.582
- config_name: subset_47
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 189947264.796
num_examples: 1409
download_size: 186216439
dataset_size: 189947264.796
- config_name: subset_48
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 180627530.832
num_examples: 1394
download_size: 178288704
dataset_size: 180627530.832
- config_name: subset_49
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 194018383.292
num_examples: 1433
download_size: 191076814
dataset_size: 194018383.292
- config_name: subset_5
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 168546325.752
num_examples: 1134
download_size: 165637463
dataset_size: 168546325.752
- config_name: subset_50
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 189554636.862
num_examples: 1394
download_size: 184194064
dataset_size: 189554636.862
- config_name: subset_51
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 189978986.936
num_examples: 1448
download_size: 189082336
dataset_size: 189978986.936
- config_name: subset_52
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 195071287.01
num_examples: 1485
download_size: 192959284
dataset_size: 195071287.01
- config_name: subset_53
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 190700114.36
num_examples: 1436
download_size: 192189922
dataset_size: 190700114.36
- config_name: subset_54
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 199075823.168
num_examples: 1476
download_size: 194708868
dataset_size: 199075823.168
- config_name: subset_55
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 201781391.278
num_examples: 1453
download_size: 197619384
dataset_size: 201781391.278
- config_name: subset_56
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 192917911.061
num_examples: 1439
download_size: 192868347
dataset_size: 192917911.061
- config_name: subset_57
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 200590538.34
num_examples: 1471
download_size: 198683663
dataset_size: 200590538.34
- config_name: subset_58
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 207156961.878
num_examples: 1514
download_size: 204447380
dataset_size: 207156961.878
- config_name: subset_59
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 192300733.396
num_examples: 1468
download_size: 191662863
dataset_size: 192300733.396
- config_name: subset_6
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 164417811.176
num_examples: 1134
download_size: 159909521
dataset_size: 164417811.176
- config_name: subset_60
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 200504150.708
num_examples: 1463
download_size: 198903349
dataset_size: 200504150.708
- config_name: subset_61
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 200144302.296
num_examples: 1464
download_size: 199524937
dataset_size: 200144302.296
- config_name: subset_62
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 191833280.981
num_examples: 1441
download_size: 192598762
dataset_size: 191833280.981
- config_name: subset_63
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 193231323.876
num_examples: 1412
download_size: 192662466
dataset_size: 193231323.876
- config_name: subset_64
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 196705041.688
num_examples: 1464
download_size: 194107017
dataset_size: 196705041.688
- config_name: subset_65
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 206332923.223
num_examples: 1473
download_size: 201801672
dataset_size: 206332923.223
- config_name: subset_66
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 202892778.525
num_examples: 1467
download_size: 203314969
dataset_size: 202892778.525
- config_name: subset_67
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 203069236.868
num_examples: 1487
download_size: 203543875
dataset_size: 203069236.868
- config_name: subset_68
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 198375621.523
num_examples: 1469
download_size: 196283029
dataset_size: 198375621.523
- config_name: subset_69
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 199518624.828
num_examples: 1466
download_size: 196677881
dataset_size: 199518624.828
- config_name: subset_7
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 153526686.74
num_examples: 1094
download_size: 150771966
dataset_size: 153526686.74
- config_name: subset_70
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 202239623.877
num_examples: 1499
download_size: 201622627
dataset_size: 202239623.877
- config_name: subset_71
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 209077684.12
num_examples: 1480
download_size: 202612617
dataset_size: 209077684.12
- config_name: subset_72
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 205634031.938
num_examples: 1502
download_size: 206548831
dataset_size: 205634031.938
- config_name: subset_73
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 205620277.541
num_examples: 1537
download_size: 207235674
dataset_size: 205620277.541
- config_name: subset_74
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 211365289.656
num_examples: 1552
download_size: 208397439
dataset_size: 211365289.656
- config_name: subset_75
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 212772877.29
num_examples: 1530
download_size: 210498834
dataset_size: 212772877.29
- config_name: subset_76
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 206112786.005
num_examples: 1489
download_size: 201788032
dataset_size: 206112786.005
- config_name: subset_77
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 209897856.5
num_examples: 1500
download_size: 207377057
dataset_size: 209897856.5
- config_name: subset_78
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 201569744.389
num_examples: 1409
download_size: 198686702
dataset_size: 201569744.389
- config_name: subset_79
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 200293245.652
num_examples: 1483
download_size: 201312816
dataset_size: 200293245.652
- config_name: subset_8
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 147022997.888
num_examples: 1064
download_size: 144672115
dataset_size: 147022997.888
- config_name: subset_80
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 208273325.696
num_examples: 1499
download_size: 206010953
dataset_size: 208273325.696
- config_name: subset_81
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 209944487.192
num_examples: 1504
download_size: 208664089
dataset_size: 209944487.192
- config_name: subset_82
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 215803715.633
num_examples: 1519
download_size: 216023812
dataset_size: 215803715.633
- config_name: subset_83
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 203900631.708
num_examples: 1514
download_size: 207380169
dataset_size: 203900631.708
- config_name: subset_84
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 213353996.584
num_examples: 1528
download_size: 211661519
dataset_size: 213353996.584
- config_name: subset_85
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 211206252.884
num_examples: 1508
download_size: 209889356
dataset_size: 211206252.884
- config_name: subset_86
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 221347606.024
num_examples: 1562
download_size: 219544717
dataset_size: 221347606.024
- config_name: subset_87
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 219279941.164
num_examples: 1546
download_size: 216445698
dataset_size: 219279941.164
- config_name: subset_88
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 218293314.24
num_examples: 1552
download_size: 217291133
dataset_size: 218293314.24
- config_name: subset_89
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 218973225.985
num_examples: 1535
download_size: 215207486
dataset_size: 218973225.985
- config_name: subset_9
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 140013198.633
num_examples: 1041
download_size: 136782991
dataset_size: 140013198.633
- config_name: subset_90
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 214324893.072
num_examples: 1528
download_size: 210703927
dataset_size: 214324893.072
- config_name: subset_91
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 213824504.0
num_examples: 1550
download_size: 212817143
dataset_size: 213824504.0
- config_name: subset_92
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 213175439.024
num_examples: 1528
download_size: 210761425
dataset_size: 213175439.024
- config_name: subset_93
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 215499234.443
num_examples: 1549
download_size: 212851716
dataset_size: 215499234.443
- config_name: subset_94
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 221111997.336
num_examples: 1571
download_size: 221926986
dataset_size: 221111997.336
- config_name: subset_95
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 215049548.216
num_examples: 1527
download_size: 212824744
dataset_size: 215049548.216
- config_name: subset_96
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 225940579.74
num_examples: 1546
download_size: 218771088
dataset_size: 225940579.74
- config_name: subset_97
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 224904577.416
num_examples: 1571
download_size: 218411995
dataset_size: 224904577.416
- config_name: subset_98
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 215296349.324
num_examples: 1531
download_size: 212970827
dataset_size: 215296349.324
- config_name: subset_99
features:
- name: enA.audio
dtype: audio
- name: viA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 222013456.684
num_examples: 1572
download_size: 224284828
dataset_size: 222013456.684
- config_name: subset_test
features:
- name: viA.audio
dtype: audio
- name: enA.audio
dtype: audio
- name: line_no
dtype: int64
- name: enA.id
dtype: string
- name: enA.url
dtype: string
- name: enA.duration_start
dtype: int64
- name: enA.duration_end
dtype: int64
- name: enA.laser_score
dtype: float64
- name: viA.id
dtype: string
- name: viA.url
dtype: string
- name: viA.duration_start
dtype: int64
- name: viA.duration_end
dtype: int64
- name: viA.laser_score
dtype: float64
splits:
- name: train
num_bytes: 925938.0
num_examples: 7
download_size: 931404
dataset_size: 925938.0
configs:
- config_name: subset_1
data_files:
- split: train
path: subset_1/train-*
- config_name: subset_10
data_files:
- split: train
path: subset_10/train-*
- config_name: subset_100
data_files:
- split: train
path: subset_100/train-*
- config_name: subset_101
data_files:
- split: train
path: subset_101/train-*
- config_name: subset_102
data_files:
- split: train
path: subset_102/train-*
- config_name: subset_103
data_files:
- split: train
path: subset_103/train-*
- config_name: subset_104
data_files:
- split: train
path: subset_104/train-*
- config_name: subset_105
data_files:
- split: train
path: subset_105/train-*
- config_name: subset_106
data_files:
- split: train
path: subset_106/train-*
- config_name: subset_107
data_files:
- split: train
path: subset_107/train-*
- config_name: subset_108
data_files:
- split: train
path: subset_108/train-*
- config_name: subset_109
data_files:
- split: train
path: subset_109/train-*
- config_name: subset_11
data_files:
- split: train
path: subset_11/train-*
- config_name: subset_110
data_files:
- split: train
path: subset_110/train-*
- config_name: subset_111
data_files:
- split: train
path: subset_111/train-*
- config_name: subset_112
data_files:
- split: train
path: subset_112/train-*
- config_name: subset_113
data_files:
- split: train
path: subset_113/train-*
- config_name: subset_114
data_files:
- split: train
path: subset_114/train-*
- config_name: subset_115
data_files:
- split: train
path: subset_115/train-*
- config_name: subset_116
data_files:
- split: train
path: subset_116/train-*
- config_name: subset_117
data_files:
- split: train
path: subset_117/train-*
- config_name: subset_118
data_files:
- split: train
path: subset_118/train-*
- config_name: subset_119
data_files:
- split: train
path: subset_119/train-*
- config_name: subset_12
data_files:
- split: train
path: subset_12/train-*
- config_name: subset_120
data_files:
- split: train
path: subset_120/train-*
- config_name: subset_121
data_files:
- split: train
path: subset_121/train-*
- config_name: subset_122
data_files:
- split: train
path: subset_122/train-*
- config_name: subset_123
data_files:
- split: train
path: subset_123/train-*
- config_name: subset_124
data_files:
- split: train
path: subset_124/train-*
- config_name: subset_125
data_files:
- split: train
path: subset_125/train-*
- config_name: subset_126
data_files:
- split: train
path: subset_126/train-*
- config_name: subset_127
data_files:
- split: train
path: subset_127/train-*
- config_name: subset_128
data_files:
- split: train
path: subset_128/train-*
- config_name: subset_129
data_files:
- split: train
path: subset_129/train-*
- config_name: subset_13
data_files:
- split: train
path: subset_13/train-*
- config_name: subset_130
data_files:
- split: train
path: subset_130/train-*
- config_name: subset_131
data_files:
- split: train
path: subset_131/train-*
- config_name: subset_132
data_files:
- split: train
path: subset_132/train-*
- config_name: subset_133
data_files:
- split: train
path: subset_133/train-*
- config_name: subset_134
data_files:
- split: train
path: subset_134/train-*
- config_name: subset_135
data_files:
- split: train
path: subset_135/train-*
- config_name: subset_136
data_files:
- split: train
path: subset_136/train-*
- config_name: subset_137
data_files:
- split: train
path: subset_137/train-*
- config_name: subset_138
data_files:
- split: train
path: subset_138/train-*
- config_name: subset_139
data_files:
- split: train
path: subset_139/train-*
- config_name: subset_14
data_files:
- split: train
path: subset_14/train-*
- config_name: subset_140
data_files:
- split: train
path: subset_140/train-*
- config_name: subset_141
data_files:
- split: train
path: subset_141/train-*
- config_name: subset_142
data_files:
- split: train
path: subset_142/train-*
- config_name: subset_143
data_files:
- split: train
path: subset_143/train-*
- config_name: subset_144
data_files:
- split: train
path: subset_144/train-*
- config_name: subset_145
data_files:
- split: train
path: subset_145/train-*
- config_name: subset_146
data_files:
- split: train
path: subset_146/train-*
- config_name: subset_147
data_files:
- split: train
path: subset_147/train-*
- config_name: subset_148
data_files:
- split: train
path: subset_148/train-*
- config_name: subset_149
data_files:
- split: train
path: subset_149/train-*
- config_name: subset_15
data_files:
- split: train
path: subset_15/train-*
- config_name: subset_16
data_files:
- split: train
path: subset_16/train-*
- config_name: subset_17
data_files:
- split: train
path: subset_17/train-*
- config_name: subset_18
data_files:
- split: train
path: subset_18/train-*
- config_name: subset_19
data_files:
- split: train
path: subset_19/train-*
- config_name: subset_2
data_files:
- split: train
path: subset_2/train-*
- config_name: subset_20
data_files:
- split: train
path: subset_20/train-*
- config_name: subset_21
data_files:
- split: train
path: subset_21/train-*
- config_name: subset_22
data_files:
- split: train
path: subset_22/train-*
- config_name: subset_23
data_files:
- split: train
path: subset_23/train-*
- config_name: subset_24
data_files:
- split: train
path: subset_24/train-*
- config_name: subset_25
data_files:
- split: train
path: subset_25/train-*
- config_name: subset_26
data_files:
- split: train
path: subset_26/train-*
- config_name: subset_27
data_files:
- split: train
path: subset_27/train-*
- config_name: subset_28
data_files:
- split: train
path: subset_28/train-*
- config_name: subset_29
data_files:
- split: train
path: subset_29/train-*
- config_name: subset_3
data_files:
- split: train
path: subset_3/train-*
- config_name: subset_30
data_files:
- split: train
path: subset_30/train-*
- config_name: subset_31
data_files:
- split: train
path: subset_31/train-*
- config_name: subset_32
data_files:
- split: train
path: subset_32/train-*
- config_name: subset_33
data_files:
- split: train
path: subset_33/train-*
- config_name: subset_34
data_files:
- split: train
path: subset_34/train-*
- config_name: subset_35
data_files:
- split: train
path: subset_35/train-*
- config_name: subset_36
data_files:
- split: train
path: subset_36/train-*
- config_name: subset_37
data_files:
- split: train
path: subset_37/train-*
- config_name: subset_38
data_files:
- split: train
path: subset_38/train-*
- config_name: subset_39
data_files:
- split: train
path: subset_39/train-*
- config_name: subset_4
data_files:
- split: train
path: subset_4/train-*
- config_name: subset_40
data_files:
- split: train
path: subset_40/train-*
- config_name: subset_41
data_files:
- split: train
path: subset_41/train-*
- config_name: subset_42
data_files:
- split: train
path: subset_42/train-*
- config_name: subset_43
data_files:
- split: train
path: subset_43/train-*
- config_name: subset_44
data_files:
- split: train
path: subset_44/train-*
- config_name: subset_45
data_files:
- split: train
path: subset_45/train-*
- config_name: subset_46
data_files:
- split: train
path: subset_46/train-*
- config_name: subset_47
data_files:
- split: train
path: subset_47/train-*
- config_name: subset_48
data_files:
- split: train
path: subset_48/train-*
- config_name: subset_49
data_files:
- split: train
path: subset_49/train-*
- config_name: subset_5
data_files:
- split: train
path: subset_5/train-*
- config_name: subset_50
data_files:
- split: train
path: subset_50/train-*
- config_name: subset_51
data_files:
- split: train
path: subset_51/train-*
- config_name: subset_52
data_files:
- split: train
path: subset_52/train-*
- config_name: subset_53
data_files:
- split: train
path: subset_53/train-*
- config_name: subset_54
data_files:
- split: train
path: subset_54/train-*
- config_name: subset_55
data_files:
- split: train
path: subset_55/train-*
- config_name: subset_56
data_files:
- split: train
path: subset_56/train-*
- config_name: subset_57
data_files:
- split: train
path: subset_57/train-*
- config_name: subset_58
data_files:
- split: train
path: subset_58/train-*
- config_name: subset_59
data_files:
- split: train
path: subset_59/train-*
- config_name: subset_6
data_files:
- split: train
path: subset_6/train-*
- config_name: subset_60
data_files:
- split: train
path: subset_60/train-*
- config_name: subset_61
data_files:
- split: train
path: subset_61/train-*
- config_name: subset_62
data_files:
- split: train
path: subset_62/train-*
- config_name: subset_63
data_files:
- split: train
path: subset_63/train-*
- config_name: subset_64
data_files:
- split: train
path: subset_64/train-*
- config_name: subset_65
data_files:
- split: train
path: subset_65/train-*
- config_name: subset_66
data_files:
- split: train
path: subset_66/train-*
- config_name: subset_67
data_files:
- split: train
path: subset_67/train-*
- config_name: subset_68
data_files:
- split: train
path: subset_68/train-*
- config_name: subset_69
data_files:
- split: train
path: subset_69/train-*
- config_name: subset_7
data_files:
- split: train
path: subset_7/train-*
- config_name: subset_70
data_files:
- split: train
path: subset_70/train-*
- config_name: subset_71
data_files:
- split: train
path: subset_71/train-*
- config_name: subset_72
data_files:
- split: train
path: subset_72/train-*
- config_name: subset_73
data_files:
- split: train
path: subset_73/train-*
- config_name: subset_74
data_files:
- split: train
path: subset_74/train-*
- config_name: subset_75
data_files:
- split: train
path: subset_75/train-*
- config_name: subset_76
data_files:
- split: train
path: subset_76/train-*
- config_name: subset_77
data_files:
- split: train
path: subset_77/train-*
- config_name: subset_78
data_files:
- split: train
path: subset_78/train-*
- config_name: subset_79
data_files:
- split: train
path: subset_79/train-*
- config_name: subset_8
data_files:
- split: train
path: subset_8/train-*
- config_name: subset_80
data_files:
- split: train
path: subset_80/train-*
- config_name: subset_81
data_files:
- split: train
path: subset_81/train-*
- config_name: subset_82
data_files:
- split: train
path: subset_82/train-*
- config_name: subset_83
data_files:
- split: train
path: subset_83/train-*
- config_name: subset_84
data_files:
- split: train
path: subset_84/train-*
- config_name: subset_85
data_files:
- split: train
path: subset_85/train-*
- config_name: subset_86
data_files:
- split: train
path: subset_86/train-*
- config_name: subset_87
data_files:
- split: train
path: subset_87/train-*
- config_name: subset_88
data_files:
- split: train
path: subset_88/train-*
- config_name: subset_89
data_files:
- split: train
path: subset_89/train-*
- config_name: subset_9
data_files:
- split: train
path: subset_9/train-*
- config_name: subset_90
data_files:
- split: train
path: subset_90/train-*
- config_name: subset_91
data_files:
- split: train
path: subset_91/train-*
- config_name: subset_92
data_files:
- split: train
path: subset_92/train-*
- config_name: subset_93
data_files:
- split: train
path: subset_93/train-*
- config_name: subset_94
data_files:
- split: train
path: subset_94/train-*
- config_name: subset_95
data_files:
- split: train
path: subset_95/train-*
- config_name: subset_96
data_files:
- split: train
path: subset_96/train-*
- config_name: subset_97
data_files:
- split: train
path: subset_97/train-*
- config_name: subset_98
data_files:
- split: train
path: subset_98/train-*
- config_name: subset_99
data_files:
- split: train
path: subset_99/train-*
- config_name: subset_test
data_files:
- split: train
path: subset_test/train-*
---
提供机构:
asahi417
原始信息汇总
数据集概述
数据集配置及特征
- 配置名称(仅列出部分;完整配置列表见上文 YAML 元数据):
- subset_1
- subset_10
- subset_100
- subset_101
- subset_102
- subset_103
- subset_104
- subset_105
- subset_106
- subset_107
- subset_108
- subset_109
- subset_11
- subset_110
- subset_111
- subset_112
- subset_113
- subset_114
- subset_115
- subset_116
- subset_117
- subset_118
- subset_119
- subset_12
- subset_120
- subset_121
- subset_122
- subset_123
- subset_124
- 数据集特征:
  - 音频特征:
    - enA.audio
    - viA.audio
  - 数值特征:
    - line_no (int64)
    - enA.duration_start (int64)
    - enA.duration_end (int64)
    - viA.duration_start (int64)
    - viA.duration_end (int64)
  - 字符串特征:
    - enA.id
    - enA.url
    - viA.id
    - viA.url
  - 浮点特征:
    - enA.laser_score (float64)
    - viA.laser_score (float64)
数据集分割及大小
- 分割名称: train
- 数据集大小:
- subset_1: 310875698.231 bytes
- subset_10: 149955109.948 bytes
- subset_100: 223956333.212 bytes
- subset_101: 231032122.276 bytes
- subset_102: 232900680.766 bytes
- subset_103: 227524749.978 bytes
- subset_104: 219203850.624 bytes
- subset_105: 229345952.545 bytes
- subset_106: 227860903.064 bytes
- subset_107: 230034699.8 bytes
- subset_108: 229984236.205 bytes
- subset_109: 230223518.904 bytes
- subset_11: 159427053.981 bytes
- subset_110: 221202904.385 bytes
- subset_111: 222022142.521 bytes
- subset_112: 223541761.058 bytes
- subset_113: 227046162.64 bytes
- subset_114: 227709702.89 bytes
- subset_115: 228926744.736 bytes
- subset_116: 227653832.943 bytes
- subset_117: 227743285.512 bytes
- subset_118: 227900796.96 bytes
- subset_119: 223083481.146 bytes
- subset_12: 149419294.92 bytes
- subset_120: 226304614.435 bytes
- subset_121: 230882729.604 bytes
- subset_122: 238447274.748 bytes
- subset_123: 232748237.677 bytes
- subset_124: 数据集大小未提供
- 下载大小:
- subset_1: 308530375 bytes
- subset_10: 146857826 bytes
- subset_100: 226057233 bytes
- subset_101: 227637023 bytes
- subset_102: 231018926 bytes
- subset_103: 225183888 bytes
- subset_104: 216784773 bytes
- subset_105: 223684351 bytes
- subset_106: 225460466 bytes
- subset_107: 229436008 bytes
- subset_108: 227003908 bytes
- subset_109: 229888287 bytes
- subset_11: 157508759 bytes
- subset_110: 216917344 bytes
- subset_111: 221692410 bytes
- subset_112: 222885517 bytes
- subset_113: 225591085 bytes
- subset_114: 226767725 bytes
- subset_115: 224568565 bytes
- subset_116: 232146377 bytes
- subset_117: 224092845 bytes
- subset_118: 230509185 bytes
- subset_119: 226456315 bytes
- subset_12: 145387701 bytes
- subset_120: 224233079 bytes
- subset_121: 229141571 bytes
- subset_122: 234558465 bytes
- subset_123: 226306521 bytes
- subset_124: 下载大小未提供
- 示例数量:
- subset_1: 1873 examples
- subset_10: 1092 examples
- subset_100: 1579 examples
- subset_101: 1602 examples
- subset_102: 1602 examples
- subset_103: 1566 examples
- subset_104: 1533 examples
- subset_105: 1579 examples
- subset_106: 1572 examples
- subset_107: 1580 examples
- subset_108: 1595 examples
- subset_109: 1592 examples
- subset_11: 1149 examples
- subset_110: 1545 examples
- subset_111: 1541 examples
- subset_112: 1574 examples
- subset_113: 1570 examples
- subset_114: 1546 examples
- subset_115: 1566 examples
- subset_116: 1561 examples
- subset_117: 1582 examples
- subset_118: 1560 examples
- subset_119: 1597 examples
- subset_12: 1116 examples
- subset_120: 1595 examples
- subset_121: 1609 examples
- subset_122: 1613 examples
- subset_123: 1591 examples
- subset_124: 示例数量未提供



