nthakur/miracl-raft-instruct-1-pos-4-neg-mistral
收藏 · Hugging Face · 2024-04-03 更新 · 2024-06-11 收录
下载链接:
https://hf-mirror.com/datasets/nthakur/miracl-raft-instruct-1-pos-4-neg-mistral
下载链接
链接失效反馈 · 官方服务:
资源简介:
---
dataset_info:
- config_name: ar
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 23085256
num_examples: 2761
download_size: 9582259
dataset_size: 23085256
- config_name: bn
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 34795181
num_examples: 2945
download_size: 10692946
dataset_size: 34795181
- config_name: en
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 31636295
num_examples: 5707
download_size: 13902931
dataset_size: 31636295
- config_name: es
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 18430799
num_examples: 3581
download_size: 7934347
dataset_size: 18430799
- config_name: fa
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 23124051
num_examples: 3298
download_size: 9006826
dataset_size: 23124051
- config_name: fi
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 10275011
num_examples: 1972
download_size: 5156216
dataset_size: 10275011
- config_name: fr
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 10022166
num_examples: 2004
download_size: 4815465
dataset_size: 10022166
- config_name: hi
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 20483583
num_examples: 2041
download_size: 6573144
dataset_size: 20483583
- config_name: id
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 38136877
num_examples: 7244
download_size: 16101961
dataset_size: 38136877
- config_name: ja
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 34740939
num_examples: 5743
download_size: 15926749
dataset_size: 34740939
- config_name: ko
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 6677931
num_examples: 1314
download_size: 3237577
dataset_size: 6677931
- config_name: ru
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 35062570
num_examples: 3804
download_size: 14049413
dataset_size: 35062570
- config_name: sw
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 1031878
num_examples: 203
download_size: 527001
dataset_size: 1031878
- config_name: te
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 1986018
num_examples: 206
download_size: 722739
dataset_size: 1986018
- config_name: th
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 34991199
num_examples: 3058
download_size: 11282773
dataset_size: 34991199
- config_name: zh
features:
- name: output
dtype: string
- name: prompt
dtype: string
- name: query_id
dtype: string
- name: doc_ids
sequence: string
- name: positive_ids
sequence: string
- name: negative_ids
sequence: string
- name: reason
dtype: string
- name: answer
dtype: string
splits:
- name: train
num_bytes: 9474623
num_examples: 2214
download_size: 4861442
dataset_size: 9474623
configs:
- config_name: ar
data_files:
- split: train
path: ar/train-*
- config_name: bn
data_files:
- split: train
path: bn/train-*
- config_name: en
data_files:
- split: train
path: en/train-*
- config_name: es
data_files:
- split: train
path: es/train-*
- config_name: fa
data_files:
- split: train
path: fa/train-*
- config_name: fi
data_files:
- split: train
path: fi/train-*
- config_name: fr
data_files:
- split: train
path: fr/train-*
- config_name: hi
data_files:
- split: train
path: hi/train-*
- config_name: id
data_files:
- split: train
path: id/train-*
- config_name: ja
data_files:
- split: train
path: ja/train-*
- config_name: ko
data_files:
- split: train
path: ko/train-*
- config_name: ru
data_files:
- split: train
path: ru/train-*
- config_name: sw
data_files:
- split: train
path: sw/train-*
- config_name: te
data_files:
- split: train
path: te/train-*
- config_name: th
data_files:
- split: train
path: th/train-*
- config_name: zh
data_files:
- split: train
path: zh/train-*
---
# Dataset Card for "miracl-raft-instruct-1-pos-4-neg-mistral"
[More Information needed](https://github.com/huggingface/datasets/blob/main/CONTRIBUTING.md#how-to-contribute-to-the-dataset-cards)
提供机构:
nthakur
原始信息汇总
数据集概述
数据集名称
"miracl-raft-instruct-1-pos-4-neg-mistral"
数据集配置
配置名称:ar
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 23085256
- 示例数: 2761
- 配置总计(非单独分割)
- 下载大小:9582259
- 数据集大小:23085256
配置名称:bn
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 34795181
- 示例数: 2945
- 配置总计(非单独分割)
- 下载大小:10692946
- 数据集大小:34795181
配置名称:en
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 31636295
- 示例数: 5707
- 配置总计(非单独分割)
- 下载大小:13902931
- 数据集大小:31636295
配置名称:es
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 18430799
- 示例数: 3581
- 配置总计(非单独分割)
- 下载大小:7934347
- 数据集大小:18430799
配置名称:fa
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 23124051
- 示例数: 3298
- 配置总计(非单独分割)
- 下载大小:9006826
- 数据集大小:23124051
配置名称:fi
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 10275011
- 示例数: 1972
- 配置总计(非单独分割)
- 下载大小:5156216
- 数据集大小:10275011
配置名称:fr
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 10022166
- 示例数: 2004
- 配置总计(非单独分割)
- 下载大小:4815465
- 数据集大小:10022166
配置名称:hi
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 20483583
- 示例数: 2041
- 配置总计(非单独分割)
- 下载大小:6573144
- 数据集大小:20483583
配置名称:id
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 38136877
- 示例数: 7244
- 配置总计(非单独分割)
- 下载大小:16101961
- 数据集大小:38136877
配置名称:ja
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 34740939
- 示例数: 5743
- 配置总计(非单独分割)
- 下载大小:15926749
- 数据集大小:34740939
配置名称:ko
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 6677931
- 示例数: 1314
- 配置总计(非单独分割)
- 下载大小:3237577
- 数据集大小:6677931
配置名称:ru
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 35062570
- 示例数: 3804
- 配置总计(非单独分割)
- 下载大小:14049413
- 数据集大小:35062570
配置名称:sw
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 1031878
- 示例数: 203
- 配置总计(非单独分割)
- 下载大小:527001
- 数据集大小:1031878
配置名称:te
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 1986018
- 示例数: 206
- 配置总计(非单独分割)
- 下载大小:722739
- 数据集大小:1986018
配置名称:th
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 34991199
- 示例数: 3058
- 配置总计(非单独分割)
- 下载大小:11282773
- 数据集大小:34991199
配置名称:zh
- 特征:
- output: string
- prompt: string
- query_id: string
- doc_ids: sequence (string)
- positive_ids: sequence (string)
- negative_ids: sequence (string)
- reason: string
- answer: string
- 分割:
- train
- 字节数: 9474623
- 示例数: 2214
- 配置总计(非单独分割)
- 下载大小:4861442
- 数据集大小:9474623



