YoheiOhto/pharma-bench-mlm
收藏 | 来源:Hugging Face | 2026-01-11 更新 | 2026-03-29 收录
下载链接:
https://hf-mirror.com/datasets/YoheiOhto/pharma-bench-mlm
下载链接
链接失效反馈 | 官方服务:
资源简介:
---
# Dataset card metadata. `dataset_info` lists, per config, the feature schema,
# the per-split byte/example counts, and the download/dataset sizes; `configs`
# (further down) maps each config's splits to the data-file globs backing them.
#
# NOTE(review): a few configs carry fractional num_bytes / dataset_size values
# (ade_corpus_v2_classification, rxnorm_lama_chemical_has_synonym_v3,
# sider_lama_indication_v3, sider_lama_side_effect_v3) — presumably estimates
# produced when an existing split was subdivided; confirm before relying on
# them as exact byte counts.
dataset_info:
- config_name: ade_corpus_v2_classification
  features:
  - name: text
    dtype: string
  - name: label
    dtype:
      class_label:
        names:
          '0': Not-Related
          '1': Related
  splits:
  - name: train
    num_bytes: 2722843.4082326926
    num_examples: 18812
  - name: validation
    num_bytes: 680855.5917673074
    num_examples: 4704
  download_size: 1977276
  dataset_size: 3403699.0
- config_name: bc2gm
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 5030166
    num_examples: 12574
  - name: validation
    num_bytes: 1003097
    num_examples: 2519
  - name: test
    num_bytes: 2024802
    num_examples: 5038
  download_size: 2162996
  dataset_size: 8058065
- config_name: bc5cdr-chem
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 1695523
    num_examples: 4560
  - name: validation
    num_bytes: 1684497
    num_examples: 4581
  - name: test
    num_bytes: 1779657
    num_examples: 4797
  download_size: 1183674
  dataset_size: 5159677
- config_name: bc5cdr-disease
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 1695523
    num_examples: 4560
  - name: validation
    num_bytes: 1684497
    num_examples: 4581
  - name: test
    num_bytes: 1779657
    num_examples: 4797
  download_size: 1180845
  dataset_size: 5159677
- config_name: bioasq
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: string
  splits:
  - name: train
    num_bytes: 2056424
    num_examples: 670
  - name: validation
    num_bytes: 227036
    num_examples: 75
  - name: test
    num_bytes: 239626
    num_examples: 140
  download_size: 1190356
  dataset_size: 2523086
- config_name: biosses
  features:
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: float64
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 21475
    num_examples: 64
  - name: validation
    num_bytes: 5419
    num_examples: 16
  - name: test
    num_bytes: 6873
    num_examples: 20
  download_size: 32197
  dataset_size: 33767
- config_name: chemprot
  features:
  - name: id
    dtype: string
  - name: sentence
    dtype: string
  - name: label
    dtype: string
  splits:
  - name: train
    num_bytes: 4664879
    num_examples: 18035
  - name: validation
    num_bytes: 2980445
    num_examples: 11268
  - name: test
    num_bytes: 4419113
    num_examples: 15745
  download_size: 2354003
  dataset_size: 12064437
- config_name: ddi
  features:
  - name: id
    dtype: string
  - name: sentence
    dtype: string
  - name: label
    dtype: string
  splits:
  - name: train
    num_bytes: 9299537
    num_examples: 25296
  - name: validation
    num_bytes: 648277
    num_examples: 2496
  - name: test
    num_bytes: 1768131
    num_examples: 5716
  download_size: 1559977
  dataset_size: 11715945
- config_name: ebmnlp
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 16568481
    num_examples: 40935
  - name: validation
    num_bytes: 4181009
    num_examples: 10386
  - name: test
    num_bytes: 823318
    num_examples: 2076
  download_size: 4813621
  dataset_size: 21572808
- config_name: gad
  features:
  - name: id
    dtype: string
  - name: sentence
    dtype: string
  - name: label
    dtype: string
  splits:
  - name: train
    num_bytes: 811477
    num_examples: 4261
  - name: validation
    num_bytes: 99407
    num_examples: 535
  - name: test
    num_bytes: 107079
    num_examples: 534
  download_size: 485308
  dataset_size: 1017963
- config_name: hoc
  features:
  - name: sentence
    dtype: string
  - name: label
    sequence: int64
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 2101293
    num_examples: 1295
  - name: validation
    num_bytes: 316170
    num_examples: 186
  - name: test
    num_bytes: 613822
    num_examples: 371
  download_size: 1560923
  dataset_size: 3031285
- config_name: hotpot
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 91055424
    num_examples: 80220
  - name: validation
    num_bytes: 4047163
    num_examples: 2950
  - name: test
    num_bytes: 4013429
    num_examples: 2951
  download_size: 59536812
  dataset_size: 99116016
- config_name: jnlpba
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 6598421
    num_examples: 16807
  - name: validation
    num_bytes: 696780
    num_examples: 1739
  - name: test
    num_bytes: 1498445
    num_examples: 3856
  download_size: 1941518
  dataset_size: 8793646
- config_name: medmcqa
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: train
    num_bytes: 33443573
    num_examples: 182822
  - name: test
    num_bytes: 978657
    num_examples: 6150
  - name: validation
    num_bytes: 838502
    num_examples: 4183
  download_size: 22183135
  dataset_size: 35260732
- config_name: medmcqa_multi
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: train
    num_bytes: 12755718
    num_examples: 62057
  - name: test
    num_bytes: 359007
    num_examples: 2016
  - name: validation
    num_bytes: 301598
    num_examples: 1367
  download_size: 8315650
  dataset_size: 13416323
- config_name: medmcqa_single
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: train
    num_bytes: 20687855
    num_examples: 120765
  - name: test
    num_bytes: 619650
    num_examples: 4134
  - name: validation
    num_bytes: 536904
    num_examples: 2816
  download_size: 13639912
  dataset_size: 21844409
- config_name: medqa_usmle
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: int64
  - name: choices
    sequence: string
  splits:
  - name: train
    num_bytes: 9001679
    num_examples: 10178
  - name: validation
    num_bytes: 1123522
    num_examples: 1272
  - name: test
    num_bytes: 1151554
    num_examples: 1273
  download_size: 6124414
  dataset_size: 11276755
- config_name: mmlu
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: int64
  - name: choices
    sequence: string
  splits:
  - name: validation
    num_bytes: 29034
    num_examples: 36
  - name: test
    num_bytes: 228429
    num_examples: 272
  download_size: 144004
  dataset_size: 257463
- config_name: mmlu_anatomy
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 33109
    num_examples: 135
  - name: validation
    num_bytes: 3128
    num_examples: 14
  - name: dev
    num_bytes: 955
    num_examples: 5
  download_size: 26206
  dataset_size: 37192
- config_name: mmlu_clinical_knowledge
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 62742
    num_examples: 265
  - name: validation
    num_bytes: 6652
    num_examples: 29
  - name: dev
    num_bytes: 1198
    num_examples: 5
  download_size: 48415
  dataset_size: 70592
- config_name: mmlu_college_biology
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 48785
    num_examples: 144
  - name: validation
    num_bytes: 4807
    num_examples: 16
  - name: dev
    num_bytes: 1520
    num_examples: 5
  download_size: 39875
  dataset_size: 55112
- config_name: mmlu_college_medicine
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 82385
    num_examples: 173
  - name: validation
    num_bytes: 7897
    num_examples: 22
  - name: dev
    num_bytes: 1658
    num_examples: 5
  download_size: 52745
  dataset_size: 91940
- config_name: mmlu_medical_genetics
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 20852
    num_examples: 100
  - name: validation
    num_bytes: 2993
    num_examples: 11
  - name: dev
    num_bytes: 1077
    num_examples: 5
  download_size: 22714
  dataset_size: 24922
- config_name: mmlu_professional_medicine
  features:
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  splits:
  - name: test
    num_bytes: 217549
    num_examples: 272
  - name: validation
    num_bytes: 23835
    num_examples: 31
  - name: dev
    num_bytes: 3795
    num_examples: 5
  download_size: 144905
  dataset_size: 245179
- config_name: naturalqa
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 108546039
    num_examples: 114478
  - name: validation
    num_bytes: 6355137
    num_examples: 6418
  - name: test
    num_bytes: 6331151
    num_examples: 6418
  download_size: 69332911
  dataset_size: 121232327
- config_name: ncbi-disease
  features:
  - name: tokens
    sequence: string
  - name: labels
    sequence: string
  - name: id
    dtype: string
  splits:
  - name: train
    num_bytes: 1941909
    num_examples: 5424
  - name: validation
    num_bytes: 341962
    num_examples: 923
  - name: test
    num_bytes: 349320
    num_examples: 940
  download_size: 571920
  dataset_size: 2633191
- config_name: newsqa
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 235771764
    num_examples: 74160
  - name: validation
    num_bytes: 6613789
    num_examples: 2125
  - name: test
    num_bytes: 6681014
    num_examples: 2087
  download_size: 28623546
  dataset_size: 249066567
- config_name: openfda_drug_lama
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 1667501
    num_examples: 731
  download_size: 771333
  dataset_size: 1667501
# NOTE(review): this config declares its list-valued features with `list:`
# while the sibling configs use `sequence:` — confirm this is intentional.
- config_name: openfda_drug_lama_v2
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    list: string
  - name: masked_sentences
    list: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 1693817
    num_examples: 731
  download_size: 785697
  dataset_size: 1693817
- config_name: openfda_tf_evaluation
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: int64
  - name: section
    dtype: string
  - name: set_id
    dtype: string
  - name: source
    dtype: string
  splits:
  - name: test
    num_bytes: 17515322
    num_examples: 4554
  download_size: 2752720
  dataset_size: 17515322
- config_name: openfda_tf_tuning
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: int64
  - name: section
    dtype: string
  - name: set_id
    dtype: string
  - name: source
    dtype: string
  splits:
  - name: train
    num_bytes: 13516055
    num_examples: 3576
  - name: test
    num_bytes: 3999267
    num_examples: 978
  download_size: 2782983
  dataset_size: 17515322
- config_name: pubmedqa
  features:
  - name: id
    dtype: string
  - name: sentence1
    dtype: string
  - name: sentence2
    dtype: string
  - name: label
    dtype: string
  splits:
  - name: train
    num_bytes: 654325
    num_examples: 450
  - name: validation
    num_bytes: 72266
    num_examples: 50
  - name: test
    num_bytes: 737995
    num_examples: 500
  download_size: 833795
  dataset_size: 1464586
- config_name: rxnorm_lama_brand_has_active_ingredient
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 762
    num_examples: 4
  download_size: 3542
  dataset_size: 762
- config_name: rxnorm_lama_brand_of_generic
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 1499183
    num_examples: 6586
  download_size: 612573
  dataset_size: 1499183
- config_name: rxnorm_lama_chemical_has_synonym
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 626182
    num_examples: 3916
  download_size: 335600
  dataset_size: 626182
- config_name: rxnorm_lama_chemical_has_synonym_v2
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 6865704
    num_examples: 27230
  download_size: 2927194
  dataset_size: 6865704
- config_name: rxnorm_lama_chemical_has_synonym_v3
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 915086.0562982005
    num_examples: 5131
  download_size: 455362
  dataset_size: 915086.0562982005
- config_name: rxnorm_lama_generic_has_brand
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 572131
    num_examples: 1926
  download_size: 256437
  dataset_size: 572131
- config_name: searchqa
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 463607158
    num_examples: 117384
  - name: validation
    num_bytes: 33291447
    num_examples: 8490
  - name: test
    num_bytes: 33435038
    num_examples: 8490
  download_size: 310012520
  dataset_size: 530333643
- config_name: sider_lama_ade
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 1337287
    num_examples: 1411
  download_size: 249479
  dataset_size: 1337287
- config_name: sider_lama_indication
  features:
  - name: uuid
    dtype: string
  - name: sub_id
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 336288
    num_examples: 1161
  download_size: 122961
  dataset_size: 336288
- config_name: sider_lama_indication_v2
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 519935
    num_examples: 1281
  download_size: 161633
  dataset_size: 519935
- config_name: sider_lama_indication_v3
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 232071.6182669789
    num_examples: 1107
  download_size: 90158
  dataset_size: 232071.6182669789
- config_name: sider_lama_side_effect_v2
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 3163438
    num_examples: 1347
  download_size: 461151
  dataset_size: 3163438
- config_name: sider_lama_side_effect_v3
  features:
  - name: uuid
    dtype: string
  - name: sub_label
    dtype: string
  - name: obj_labels
    sequence: string
  - name: masked_sentences
    sequence: string
  - name: relation
    dtype: string
  splits:
  - name: test
    num_bytes: 1193176.236080178
    num_examples: 1343
  download_size: 208883
  dataset_size: 1193176.236080178
- config_name: squad
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 84969541
    num_examples: 95246
  - name: validation
    num_bytes: 5121715
    num_examples: 5236
  - name: test
    num_bytes: 5231224
    num_examples: 5271
  download_size: 21088024
  dataset_size: 95322480
- config_name: triviaqa
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: context
    dtype: string
  - name: answers
    struct:
    - name: answer_start
      sequence: int64
    - name: text
      sequence: string
  splits:
  - name: train
    num_bytes: 288069956
    num_examples: 67856
  - name: validation
    num_bytes: 16482534
    num_examples: 3892
  - name: test
    num_bytes: 16527521
    num_examples: 3893
  download_size: 187161163
  dataset_size: 321080011
- config_name: yakugaku_qa_filtered_5_options_multi_answer
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    sequence: int32
  - name: type
    dtype: string
  splits:
  - name: train
    num_bytes: 700539
    num_examples: 932
  - name: test
    num_bytes: 172890
    num_examples: 233
  download_size: 466975
  dataset_size: 873429
- config_name: yakugaku_qa_filtered_5_options_single_answer
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: label
    dtype: int64
  - name: type
    dtype: string
  splits:
  - name: train
    num_bytes: 643011
    num_examples: 1326
  - name: test
    num_bytes: 160019
    num_examples: 332
  download_size: 434130
  dataset_size: 803030
- config_name: yakugaku_qa_gpt5.2_mini_translated
  features:
  - name: id
    dtype: string
  - name: question
    dtype: string
  - name: choices
    sequence: string
  - name: answer_indices
    sequence: int32
  - name: num_choices
    dtype: int32
  - name: num_answers
    dtype: int32
  - name: question_type
    dtype: string
  - name: source
    dtype: string
  splits:
  - name: test
    num_bytes: 1896835
    num_examples: 3009
  download_size: 955332
  dataset_size: 1896835
# Maps every config to the data files for each of its splits; each path is a
# glob of the form <config_name>/<split>-*.
configs:
- config_name: ade_corpus_v2_classification
  data_files:
  - split: train
    path: ade_corpus_v2_classification/train-*
  - split: validation
    path: ade_corpus_v2_classification/validation-*
- config_name: bc2gm
  data_files:
  - split: train
    path: bc2gm/train-*
  - split: validation
    path: bc2gm/validation-*
  - split: test
    path: bc2gm/test-*
- config_name: bc5cdr-chem
  data_files:
  - split: train
    path: bc5cdr-chem/train-*
  - split: validation
    path: bc5cdr-chem/validation-*
  - split: test
    path: bc5cdr-chem/test-*
- config_name: bc5cdr-disease
  data_files:
  - split: train
    path: bc5cdr-disease/train-*
  - split: validation
    path: bc5cdr-disease/validation-*
  - split: test
    path: bc5cdr-disease/test-*
- config_name: bioasq
  data_files:
  - split: train
    path: bioasq/train-*
  - split: validation
    path: bioasq/validation-*
  - split: test
    path: bioasq/test-*
- config_name: biosses
  data_files:
  - split: train
    path: biosses/train-*
  - split: validation
    path: biosses/validation-*
  - split: test
    path: biosses/test-*
- config_name: chemprot
  data_files:
  - split: train
    path: chemprot/train-*
  - split: validation
    path: chemprot/validation-*
  - split: test
    path: chemprot/test-*
- config_name: ddi
  data_files:
  - split: train
    path: ddi/train-*
  - split: validation
    path: ddi/validation-*
  - split: test
    path: ddi/test-*
- config_name: ebmnlp
  data_files:
  - split: train
    path: ebmnlp/train-*
  - split: validation
    path: ebmnlp/validation-*
  - split: test
    path: ebmnlp/test-*
- config_name: gad
  data_files:
  - split: train
    path: gad/train-*
  - split: validation
    path: gad/validation-*
  - split: test
    path: gad/test-*
- config_name: hoc
  data_files:
  - split: train
    path: hoc/train-*
  - split: validation
    path: hoc/validation-*
  - split: test
    path: hoc/test-*
- config_name: hotpot
  data_files:
  - split: train
    path: hotpot/train-*
  - split: validation
    path: hotpot/validation-*
  - split: test
    path: hotpot/test-*
- config_name: jnlpba
  data_files:
  - split: train
    path: jnlpba/train-*
  - split: validation
    path: jnlpba/validation-*
  - split: test
    path: jnlpba/test-*
- config_name: medmcqa
  data_files:
  - split: train
    path: medmcqa/train-*
  - split: test
    path: medmcqa/test-*
  - split: validation
    path: medmcqa/validation-*
- config_name: medmcqa_multi
  data_files:
  - split: train
    path: medmcqa_multi/train-*
  - split: test
    path: medmcqa_multi/test-*
  - split: validation
    path: medmcqa_multi/validation-*
- config_name: medmcqa_single
  data_files:
  - split: train
    path: medmcqa_single/train-*
  - split: test
    path: medmcqa_single/test-*
  - split: validation
    path: medmcqa_single/validation-*
- config_name: medqa_usmle
  data_files:
  - split: train
    path: medqa_usmle/train-*
  - split: validation
    path: medqa_usmle/validation-*
  - split: test
    path: medqa_usmle/test-*
- config_name: mmlu
  data_files:
  - split: validation
    path: mmlu/validation-*
  - split: test
    path: mmlu/test-*
- config_name: mmlu_anatomy
  data_files:
  - split: test
    path: mmlu_anatomy/test-*
  - split: validation
    path: mmlu_anatomy/validation-*
  - split: dev
    path: mmlu_anatomy/dev-*
- config_name: mmlu_clinical_knowledge
  data_files:
  - split: test
    path: mmlu_clinical_knowledge/test-*
  - split: validation
    path: mmlu_clinical_knowledge/validation-*
  - split: dev
    path: mmlu_clinical_knowledge/dev-*
- config_name: mmlu_college_biology
  data_files:
  - split: test
    path: mmlu_college_biology/test-*
  - split: validation
    path: mmlu_college_biology/validation-*
  - split: dev
    path: mmlu_college_biology/dev-*
- config_name: mmlu_college_medicine
  data_files:
  - split: test
    path: mmlu_college_medicine/test-*
  - split: validation
    path: mmlu_college_medicine/validation-*
  - split: dev
    path: mmlu_college_medicine/dev-*
- config_name: mmlu_medical_genetics
  data_files:
  - split: test
    path: mmlu_medical_genetics/test-*
  - split: validation
    path: mmlu_medical_genetics/validation-*
  - split: dev
    path: mmlu_medical_genetics/dev-*
- config_name: mmlu_professional_medicine
  data_files:
  - split: test
    path: mmlu_professional_medicine/test-*
  - split: validation
    path: mmlu_professional_medicine/validation-*
  - split: dev
    path: mmlu_professional_medicine/dev-*
- config_name: naturalqa
  data_files:
  - split: train
    path: naturalqa/train-*
  - split: validation
    path: naturalqa/validation-*
  - split: test
    path: naturalqa/test-*
- config_name: ncbi-disease
  data_files:
  - split: train
    path: ncbi-disease/train-*
  - split: validation
    path: ncbi-disease/validation-*
  - split: test
    path: ncbi-disease/test-*
- config_name: newsqa
  data_files:
  - split: train
    path: newsqa/train-*
  - split: validation
    path: newsqa/validation-*
  - split: test
    path: newsqa/test-*
- config_name: openfda_drug_lama
  data_files:
  - split: test
    path: openfda_drug_lama/test-*
- config_name: openfda_drug_lama_v2
  data_files:
  - split: test
    path: openfda_drug_lama_v2/test-*
- config_name: openfda_tf_evaluation
  data_files:
  - split: test
    path: openfda_tf_evaluation/test-*
- config_name: openfda_tf_tuning
  data_files:
  - split: train
    path: openfda_tf_tuning/train-*
  - split: test
    path: openfda_tf_tuning/test-*
- config_name: pubmedqa
  data_files:
  - split: train
    path: pubmedqa/train-*
  - split: validation
    path: pubmedqa/validation-*
  - split: test
    path: pubmedqa/test-*
- config_name: rxnorm_lama_brand_has_active_ingredient
  data_files:
  - split: test
    path: rxnorm_lama_brand_has_active_ingredient/test-*
- config_name: rxnorm_lama_brand_of_generic
  data_files:
  - split: test
    path: rxnorm_lama_brand_of_generic/test-*
- config_name: rxnorm_lama_chemical_has_synonym
  data_files:
  - split: test
    path: rxnorm_lama_chemical_has_synonym/test-*
- config_name: rxnorm_lama_chemical_has_synonym_v2
  data_files:
  - split: test
    path: rxnorm_lama_chemical_has_synonym_v2/test-*
- config_name: rxnorm_lama_chemical_has_synonym_v3
  data_files:
  - split: test
    path: rxnorm_lama_chemical_has_synonym_v3/test-*
- config_name: rxnorm_lama_generic_has_brand
  data_files:
  - split: test
    path: rxnorm_lama_generic_has_brand/test-*
- config_name: searchqa
  data_files:
  - split: train
    path: searchqa/train-*
  - split: validation
    path: searchqa/validation-*
  - split: test
    path: searchqa/test-*
- config_name: sider_lama_ade
  data_files:
  - split: test
    path: sider_lama_ade/test-*
- config_name: sider_lama_indication
  data_files:
  - split: test
    path: sider_lama_indication/test-*
- config_name: sider_lama_indication_v2
  data_files:
  - split: test
    path: sider_lama_indication_v2/test-*
- config_name: sider_lama_indication_v3
  data_files:
  - split: test
    path: sider_lama_indication_v3/test-*
- config_name: sider_lama_side_effect_v2
  data_files:
  - split: test
    path: sider_lama_side_effect_v2/test-*
- config_name: sider_lama_side_effect_v3
  data_files:
  - split: test
    path: sider_lama_side_effect_v3/test-*
- config_name: squad
  data_files:
  - split: train
    path: squad/train-*
  - split: validation
    path: squad/validation-*
  - split: test
    path: squad/test-*
- config_name: triviaqa
  data_files:
  - split: train
    path: triviaqa/train-*
  - split: validation
    path: triviaqa/validation-*
  - split: test
    path: triviaqa/test-*
- config_name: yakugaku_qa_filtered_5_options_multi_answer
  data_files:
  - split: train
    path: yakugaku_qa_filtered_5_options_multi_answer/train-*
  - split: test
    path: yakugaku_qa_filtered_5_options_multi_answer/test-*
- config_name: yakugaku_qa_filtered_5_options_single_answer
  data_files:
  - split: train
    path: yakugaku_qa_filtered_5_options_single_answer/train-*
  - split: test
    path: yakugaku_qa_filtered_5_options_single_answer/test-*
- config_name: yakugaku_qa_gpt5.2_mini_translated
  data_files:
  - split: test
    path: yakugaku_qa_gpt5.2_mini_translated/test-*
---
提供机构:
YoheiOhto



