Cognitive-Lab/GoogleIndicGenBench_xquad_in
收藏 · Hugging Face · 2024-06-03 更新 · 2024-06-12 收录
下载链接:
https://hf-mirror.com/datasets/Cognitive-Lab/GoogleIndicGenBench_xquad_in
下载链接
链接失效反馈
官方服务:
资源简介:
---
dataset_info:
- config_name: gu
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 263749
    num_examples: 103
  - name: test
    num_bytes: 2829431
    num_examples: 1190
  - name: dev
    num_bytes: 242684
    num_examples: 111
  download_size: 422378
  dataset_size: 3335864
- config_name: hi
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 254588
    num_examples: 103
  - name: test
    num_bytes: 2929434
    num_examples: 1190
  - name: dev
    num_bytes: 247672
    num_examples: 111
  download_size: 430286
  dataset_size: 3431694
- config_name: kn
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 279583
    num_examples: 103
  - name: test
    num_bytes: 3091347
    num_examples: 1190
  - name: dev
    num_bytes: 271974
    num_examples: 111
  download_size: 450576
  dataset_size: 3642904
- config_name: ml
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 303941
    num_examples: 103
  - name: test
    num_bytes: 3368319
    num_examples: 1190
  - name: dev
    num_bytes: 284925
    num_examples: 111
  download_size: 480526
  dataset_size: 3957185
- config_name: mr
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 258321
    num_examples: 103
  - name: test
    num_bytes: 2903226
    num_examples: 1190
  - name: dev
    num_bytes: 243598
    num_examples: 111
  download_size: 433926
  dataset_size: 3405145
- config_name: ta
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 323325
    num_examples: 103
  - name: test
    num_bytes: 3518507
    num_examples: 1190
  - name: dev
    num_bytes: 291858
    num_examples: 111
  download_size: 471680
  dataset_size: 4133690
- config_name: te
  features:
  - name: context
    dtype: string
  - name: title
    dtype: string
  - name: lang
    dtype: string
  - name: answers
    list:
    - name: answer_start
      dtype: int64
    - name: text
      dtype: string
  - name: id
    dtype: string
  - name: question
    dtype: string
  splits:
  - name: train
    num_bytes: 260819
    num_examples: 103
  - name: test
    num_bytes: 2958471
    num_examples: 1190
  - name: dev
    num_bytes: 244230
    num_examples: 110
  download_size: 439873
  dataset_size: 3463520
configs:
- config_name: gu
  data_files:
  - split: train
    path: gu/train-*
  - split: test
    path: gu/test-*
  - split: dev
    path: gu/dev-*
- config_name: hi
  data_files:
  - split: train
    path: hi/train-*
  - split: test
    path: hi/test-*
  - split: dev
    path: hi/dev-*
- config_name: kn
  data_files:
  - split: train
    path: kn/train-*
  - split: test
    path: kn/test-*
  - split: dev
    path: kn/dev-*
- config_name: ml
  data_files:
  - split: train
    path: ml/train-*
  - split: test
    path: ml/test-*
  - split: dev
    path: ml/dev-*
- config_name: mr
  data_files:
  - split: train
    path: mr/train-*
  - split: test
    path: mr/test-*
  - split: dev
    path: mr/dev-*
- config_name: ta
  data_files:
  - split: train
    path: ta/train-*
  - split: test
    path: ta/test-*
  - split: dev
    path: ta/dev-*
- config_name: te
  data_files:
  - split: train
    path: te/train-*
  - split: test
    path: te/test-*
  - split: dev
    path: te/dev-*
---
提供机构:
Cognitive-Lab
原始信息汇总
数据集概述
数据集配置及特征
- config_name: gu
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 263749 bytes
    - test: 1190 examples, 2829431 bytes
    - dev: 111 examples, 242684 bytes
  - 下载大小: 422378 bytes
  - 数据集大小: 3335864 bytes
- config_name: hi
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 254588 bytes
    - test: 1190 examples, 2929434 bytes
    - dev: 111 examples, 247672 bytes
  - 下载大小: 430286 bytes
  - 数据集大小: 3431694 bytes
- config_name: kn
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 279583 bytes
    - test: 1190 examples, 3091347 bytes
    - dev: 111 examples, 271974 bytes
  - 下载大小: 450576 bytes
  - 数据集大小: 3642904 bytes
- config_name: ml
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 303941 bytes
    - test: 1190 examples, 3368319 bytes
    - dev: 111 examples, 284925 bytes
  - 下载大小: 480526 bytes
  - 数据集大小: 3957185 bytes
- config_name: mr
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 258321 bytes
    - test: 1190 examples, 2903226 bytes
    - dev: 111 examples, 243598 bytes
  - 下载大小: 433926 bytes
  - 数据集大小: 3405145 bytes
- config_name: ta
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 323325 bytes
    - test: 1190 examples, 3518507 bytes
    - dev: 111 examples, 291858 bytes
  - 下载大小: 471680 bytes
  - 数据集大小: 4133690 bytes
- config_name: te
  - 特征:
    - context: string
    - title: string
    - lang: string
    - answers:
      - answer_start: int64
      - text: string
    - id: string
    - question: string
  - 分割:
    - train: 103 examples, 260819 bytes
    - test: 1190 examples, 2958471 bytes
    - dev: 110 examples, 244230 bytes
  - 下载大小: 439873 bytes
  - 数据集大小: 3463520 bytes
数据文件路径
- config_name: gu
  - train: gu/train-*
  - test: gu/test-*
  - dev: gu/dev-*
- config_name: hi
  - train: hi/train-*
  - test: hi/test-*
  - dev: hi/dev-*
- config_name: kn
  - train: kn/train-*
  - test: kn/test-*
  - dev: kn/dev-*
- config_name: ml
  - train: ml/train-*
  - test: ml/test-*
  - dev: ml/dev-*
- config_name: mr
  - train: mr/train-*
  - test: mr/test-*
  - dev: mr/dev-*
- config_name: ta
  - train: ta/train-*
  - test: ta/test-*
  - dev: ta/dev-*
- config_name: te
  - train: te/train-*
  - test: te/test-*
  - dev: te/dev-*



