Innovator-Evaluation/sciassess
收藏Hugging Face2026-04-22 更新2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/Innovator-Evaluation/sciassess
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: cot
features:
- name: task
dtype: string
- name: cot
dtype: bool
- name: prompt
dtype: string
- name: ideal
dtype: string
- name: choices
list: string
- name: messages_json
dtype: string
- name: doi
dtype: string
- name: pages
list: int64
- name: option
dtype: string
- name: file_name
dtype: string
- name: index
dtype: string
- name: compare_fields
dtype: string
splits:
- name: BIO_biology_chart_qa
num_bytes: 1851795
num_examples: 199
- name: BIO_chemical_entities_recognition
num_bytes: 1850701
num_examples: 500
- name: BIO_compound_disease_recognition
num_bytes: 3103726
num_examples: 775
- name: BIO_disease_entities_recognition
num_bytes: 1886245
num_examples: 500
- name: BIO_gene_disease_function
num_bytes: 169605
num_examples: 24
- name: BIO_mmlu_pro_biology
num_bytes: 2713790
num_examples: 717
- name: CHEM_electrolyte_table_qa
num_bytes: 5965897
num_examples: 199
- name: CHEM_mmlu_pro_chemistry
num_bytes: 2488880
num_examples: 1132
- name: CHEM_oled_property_extraction
num_bytes: 386786
num_examples: 13
- name: CHEM_polymer_chart_qa
num_bytes: 170779
num_examples: 15
- name: CHEM_polymer_composition_qa
num_bytes: 6427609
num_examples: 208
- name: CHEM_polymer_property_extraction
num_bytes: 3588446
num_examples: 109
- name: CHEM_reactant_qa
num_bytes: 6006996
num_examples: 195
- name: CHEM_reaction_mechanism_qa
num_bytes: 686121
num_examples: 22
- name: CHEM_solubility_extraction
num_bytes: 3356720
num_examples: 100
- name: MAT_alloy_chart_qa
num_bytes: 112015
num_examples: 15
- name: MAT_composition_extraction
num_bytes: 8076398
num_examples: 244
- name: MAT_material_qa
num_bytes: 386211
num_examples: 263
- name: MAT_sample_differentiation
num_bytes: 7279692
num_examples: 237
- name: MAT_temperature_qa
num_bytes: 6425352
num_examples: 207
- name: MAT_treatment_sequence
num_bytes: 6272403
num_examples: 202
- name: MED_affinity_extraction
num_bytes: 832464
num_examples: 40
- name: MED_drug_chart_qa
num_bytes: 164098
num_examples: 15
- name: MED_markush2mol
num_bytes: 44736
num_examples: 37
- name: MED_mmlu_pro_health
num_bytes: 2124114
num_examples: 818
- name: MED_mol_in_document
num_bytes: 1355981
num_examples: 50
- name: MED_tag2mol
num_bytes: 1407759
num_examples: 50
download_size: 33322510
dataset_size: 75135319
- config_name: default
features:
- name: task
dtype: string
- name: cot
dtype: bool
- name: prompt
dtype: string
- name: ideal
dtype: string
- name: choices
list: string
- name: messages_json
dtype: string
- name: doi
dtype: string
- name: pages
list: int64
- name: option
dtype: string
- name: file_name
dtype: string
- name: index
dtype: string
- name: compare_fields
dtype: string
splits:
- name: BIO_biology_chart_qa
num_bytes: 1809806
num_examples: 199
- name: BIO_chemical_entities_recognition
num_bytes: 1655201
num_examples: 500
- name: BIO_compound_disease_recognition
num_bytes: 2715351
num_examples: 775
- name: BIO_disease_entities_recognition
num_bytes: 1695745
num_examples: 500
- name: BIO_gene_disease_function
num_bytes: 161757
num_examples: 24
- name: BIO_mmlu_pro_biology
num_bytes: 2515181
num_examples: 717
- name: CHEM_electrolyte_table_qa
num_bytes: 5927092
num_examples: 199
- name: CHEM_mmlu_pro_chemistry
num_bytes: 2175316
num_examples: 1132
- name: CHEM_oled_property_extraction
num_bytes: 379558
num_examples: 13
- name: CHEM_polymer_chart_qa
num_bytes: 167614
num_examples: 15
- name: CHEM_polymer_composition_qa
num_bytes: 6383721
num_examples: 208
- name: CHEM_polymer_property_extraction
num_bytes: 3527842
num_examples: 109
- name: CHEM_reactant_qa
num_bytes: 5943263
num_examples: 195
- name: CHEM_reaction_mechanism_qa
num_bytes: 684075
num_examples: 22
- name: CHEM_solubility_extraction
num_bytes: 3301120
num_examples: 100
- name: MAT_alloy_chart_qa
num_bytes: 110046
num_examples: 15
- name: MAT_composition_extraction
num_bytes: 7940490
num_examples: 244
- name: MAT_material_qa
num_bytes: 313360
num_examples: 263
- name: MAT_sample_differentiation
num_bytes: 7233477
num_examples: 237
- name: MAT_temperature_qa
num_bytes: 6384987
num_examples: 207
- name: MAT_treatment_sequence
num_bytes: 6219277
num_examples: 202
- name: MED_affinity_extraction
num_bytes: 810224
num_examples: 40
- name: MED_drug_chart_qa
num_bytes: 160933
num_examples: 15
- name: MED_markush2mol
num_bytes: 27383
num_examples: 37
- name: MED_mmlu_pro_health
num_bytes: 1897528
num_examples: 818
- name: MED_mol_in_document
num_bytes: 1340331
num_examples: 50
- name: MED_tag2mol
num_bytes: 1392309
num_examples: 50
download_size: 33027404
dataset_size: 72872987
- config_name: unified
features:
- name: task
dtype: string
- name: cot
dtype: bool
- name: prompt
dtype: string
- name: ideal
dtype: string
- name: choices
list: string
- name: messages_json
dtype: string
- name: doi
dtype: string
- name: pages
list: int64
- name: option
dtype: string
- name: file_name
dtype: string
- name: index
dtype: string
- name: compare_fields
dtype: string
splits:
- name: train
num_bytes: 148008288
num_examples: 13772
download_size: 65106749
dataset_size: 148008288
configs:
- config_name: cot
data_files:
- split: BIO_biology_chart_qa
path: cot/BIO_biology_chart_qa-*
- split: BIO_chemical_entities_recognition
path: cot/BIO_chemical_entities_recognition-*
- split: BIO_compound_disease_recognition
path: cot/BIO_compound_disease_recognition-*
- split: BIO_disease_entities_recognition
path: cot/BIO_disease_entities_recognition-*
- split: BIO_gene_disease_function
path: cot/BIO_gene_disease_function-*
- split: BIO_mmlu_pro_biology
path: cot/BIO_mmlu_pro_biology-*
- split: CHEM_electrolyte_table_qa
path: cot/CHEM_electrolyte_table_qa-*
- split: CHEM_mmlu_pro_chemistry
path: cot/CHEM_mmlu_pro_chemistry-*
- split: CHEM_oled_property_extraction
path: cot/CHEM_oled_property_extraction-*
- split: CHEM_polymer_chart_qa
path: cot/CHEM_polymer_chart_qa-*
- split: CHEM_polymer_composition_qa
path: cot/CHEM_polymer_composition_qa-*
- split: CHEM_polymer_property_extraction
path: cot/CHEM_polymer_property_extraction-*
- split: CHEM_reactant_qa
path: cot/CHEM_reactant_qa-*
- split: CHEM_reaction_mechanism_qa
path: cot/CHEM_reaction_mechanism_qa-*
- split: CHEM_solubility_extraction
path: cot/CHEM_solubility_extraction-*
- split: MAT_alloy_chart_qa
path: cot/MAT_alloy_chart_qa-*
- split: MAT_composition_extraction
path: cot/MAT_composition_extraction-*
- split: MAT_material_qa
path: cot/MAT_material_qa-*
- split: MAT_sample_differentiation
path: cot/MAT_sample_differentiation-*
- split: MAT_temperature_qa
path: cot/MAT_temperature_qa-*
- split: MAT_treatment_sequence
path: cot/MAT_treatment_sequence-*
- split: MED_affinity_extraction
path: cot/MED_affinity_extraction-*
- split: MED_drug_chart_qa
path: cot/MED_drug_chart_qa-*
- split: MED_markush2mol
path: cot/MED_markush2mol-*
- split: MED_mmlu_pro_health
path: cot/MED_mmlu_pro_health-*
- split: MED_mol_in_document
path: cot/MED_mol_in_document-*
- split: MED_tag2mol
path: cot/MED_tag2mol-*
- config_name: default
data_files:
- split: BIO_biology_chart_qa
path: data/BIO_biology_chart_qa-*
- split: BIO_chemical_entities_recognition
path: data/BIO_chemical_entities_recognition-*
- split: BIO_compound_disease_recognition
path: data/BIO_compound_disease_recognition-*
- split: BIO_disease_entities_recognition
path: data/BIO_disease_entities_recognition-*
- split: BIO_gene_disease_function
path: data/BIO_gene_disease_function-*
- split: BIO_mmlu_pro_biology
path: data/BIO_mmlu_pro_biology-*
- split: CHEM_electrolyte_table_qa
path: data/CHEM_electrolyte_table_qa-*
- split: CHEM_mmlu_pro_chemistry
path: data/CHEM_mmlu_pro_chemistry-*
- split: CHEM_oled_property_extraction
path: data/CHEM_oled_property_extraction-*
- split: CHEM_polymer_chart_qa
path: data/CHEM_polymer_chart_qa-*
- split: CHEM_polymer_composition_qa
path: data/CHEM_polymer_composition_qa-*
- split: CHEM_polymer_property_extraction
path: data/CHEM_polymer_property_extraction-*
- split: CHEM_reactant_qa
path: data/CHEM_reactant_qa-*
- split: CHEM_reaction_mechanism_qa
path: data/CHEM_reaction_mechanism_qa-*
- split: CHEM_solubility_extraction
path: data/CHEM_solubility_extraction-*
- split: MAT_alloy_chart_qa
path: data/MAT_alloy_chart_qa-*
- split: MAT_composition_extraction
path: data/MAT_composition_extraction-*
- split: MAT_material_qa
path: data/MAT_material_qa-*
- split: MAT_sample_differentiation
path: data/MAT_sample_differentiation-*
- split: MAT_temperature_qa
path: data/MAT_temperature_qa-*
- split: MAT_treatment_sequence
path: data/MAT_treatment_sequence-*
- split: MED_affinity_extraction
path: data/MED_affinity_extraction-*
- split: MED_drug_chart_qa
path: data/MED_drug_chart_qa-*
- split: MED_markush2mol
path: data/MED_markush2mol-*
- split: MED_mmlu_pro_health
path: data/MED_mmlu_pro_health-*
- split: MED_mol_in_document
path: data/MED_mol_in_document-*
- split: MED_tag2mol
path: data/MED_tag2mol-*
- config_name: unified
data_files:
- split: train
path: unified/train-*
---
提供机构:
Innovator-Evaluation



