TeraflopAI/beir-minus-nanobeir-queries-random-nested-subsets
收藏 | Hugging Face | 2026-04-02 更新 | 2026-04-12 收录
下载链接:
https://hf-mirror.com/datasets/TeraflopAI/beir-minus-nanobeir-queries-random-nested-subsets
下载链接
链接失效反馈 | 官方服务:
资源简介:
---
# Per-config metadata. Each entry lists the feature columns (_id, title, text;
# all strings) and the byte/example counts of its single `train` split.
# Sizes are plain integers (bytes / row counts) exactly as published.
dataset_info:
- config_name: queries_100
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 6801
    num_examples: 100
  download_size: 6922
  dataset_size: 6801
- config_name: queries_1000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 68016
    num_examples: 1000
  download_size: 48773
  dataset_size: 68016
- config_name: queries_10000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 680160
    num_examples: 10000
  download_size: 470970
  dataset_size: 680160
- config_name: queries_100000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 6801606
    num_examples: 100000
  download_size: 4572189
  dataset_size: 6801606
- config_name: queries_20000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 1360321
    num_examples: 20000
  download_size: 947344
  dataset_size: 1360321
- config_name: queries_5000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 340080
    num_examples: 5000
  download_size: 231171
  dataset_size: 340080
- config_name: queries_50000
  features:
  - name: _id
    dtype: string
  - name: title
    dtype: string
  - name: text
    dtype: string
  splits:
  - name: train
    num_bytes: 3400803
    num_examples: 50000
  download_size: 2326651
  dataset_size: 3400803
# Maps each config name to the file glob that backs its `train` split.
# Paths are relative globs; the `*` is mid-scalar, so no quoting is needed.
configs:
- config_name: queries_100
  data_files:
  - split: train
    path: queries_100/train-*
- config_name: queries_1000
  data_files:
  - split: train
    path: queries_1000/train-*
- config_name: queries_10000
  data_files:
  - split: train
    path: queries_10000/train-*
- config_name: queries_100000
  data_files:
  - split: train
    path: queries_100000/train-*
- config_name: queries_20000
  data_files:
  - split: train
    path: queries_20000/train-*
- config_name: queries_5000
  data_files:
  - split: train
    path: queries_5000/train-*
- config_name: queries_50000
  data_files:
  - split: train
    path: queries_50000/train-*
---
提供机构:
TeraflopAI



