mugezhang/pawsx_eval_multirepr
收藏 | Hugging Face | 2026-04-03 更新 | 2026-04-12 收录
下载链接:
https://hf-mirror.com/datasets/mugezhang/pawsx_eval_multirepr
下载链接
链接失效反馈官方服务:
资源简介:
---
# Dataset card metadata.
# `dataset_info` holds one entry per config (en, es, fr, zh); every entry
# declares the same ten columns and the same train/validation/test example
# counts, and its `dataset_size` equals the sum of its splits' `num_bytes`.
# `configs` maps each config's splits to the file globs that store them.
dataset_info:
- config_name: en
  features:
  - name: id
    dtype: int32
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype:
      class_label:
        names:
          '0': '0'
          '1': '1'
  - name: sentence1_phonemes
    dtype: string
  - name: sentence1_ipa_stripped
    dtype: string
  - name: sentence1_romanized
    dtype: string
  - name: sentence2_phonemes
    dtype: string
  - name: sentence2_ipa_stripped
    dtype: string
  - name: sentence2_romanized
    dtype: string
  splits:
  - name: train
    num_bytes: 56981323
    num_examples: 49401
  - name: validation
    num_bytes: 2292126
    num_examples: 2000
  - name: test
    num_bytes: 2301886
    num_examples: 2000
  download_size: 38093203
  dataset_size: 61575335
- config_name: es
  features:
  - name: id
    dtype: int32
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype:
      class_label:
        names:
          '0': '0'
          '1': '1'
  - name: sentence1_phonemes
    dtype: string
  - name: sentence1_ipa_stripped
    dtype: string
  - name: sentence1_romanized
    dtype: string
  - name: sentence2_phonemes
    dtype: string
  - name: sentence2_ipa_stripped
    dtype: string
  - name: sentence2_romanized
    dtype: string
  splits:
  - name: train
    num_bytes: 55587964
    num_examples: 49401
  - name: validation
    num_bytes: 2232440
    num_examples: 2000
  - name: test
    num_bytes: 2254547
    num_examples: 2000
  download_size: 38690169
  dataset_size: 60074951
- config_name: fr
  features:
  - name: id
    dtype: int32
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype:
      class_label:
        names:
          '0': '0'
          '1': '1'
  - name: sentence1_phonemes
    dtype: string
  - name: sentence1_ipa_stripped
    dtype: string
  - name: sentence1_romanized
    dtype: string
  - name: sentence2_phonemes
    dtype: string
  - name: sentence2_ipa_stripped
    dtype: string
  - name: sentence2_romanized
    dtype: string
  splits:
  - name: train
    num_bytes: 56097701
    num_examples: 49401
  - name: validation
    num_bytes: 2253811
    num_examples: 2000
  - name: test
    num_bytes: 2263366
    num_examples: 2000
  download_size: 38510715
  dataset_size: 60614878
- config_name: zh
  features:
  - name: id
    dtype: int32
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype:
      class_label:
        names:
          '0': '0'
          '1': '1'
  - name: sentence1_phonemes
    dtype: string
  - name: sentence1_ipa_stripped
    dtype: string
  - name: sentence1_romanized
    dtype: string
  - name: sentence2_phonemes
    dtype: string
  - name: sentence2_ipa_stripped
    dtype: string
  - name: sentence2_romanized
    dtype: string
  splits:
  - name: train
    num_bytes: 60175899
    num_examples: 49401
  - name: validation
    num_bytes: 2712791
    num_examples: 2000
  - name: test
    num_bytes: 2715120
    num_examples: 2000
  download_size: 37853922
  dataset_size: 65603810
configs:
- config_name: en
  data_files:
  - split: train
    path: en/train-*
  - split: validation
    path: en/validation-*
  - split: test
    path: en/test-*
- config_name: es
  data_files:
  - split: train
    path: es/train-*
  - split: validation
    path: es/validation-*
  - split: test
    path: es/test-*
- config_name: fr
  data_files:
  - split: train
    path: fr/train-*
  - split: validation
    path: fr/validation-*
  - split: test
    path: fr/test-*
- config_name: zh
  data_files:
  - split: train
    path: zh/train-*
  - split: validation
    path: zh/validation-*
  - split: test
    path: zh/test-*
---
提供机构:
mugezhang



