OALL/details_ConvexAI__Luminex-34B-v0.1
数据集概述
数据集基本信息
- 名称: Evaluation run of ConvexAI/Luminex-34B-v0.1
- 来源: 自动创建于模型 ConvexAI/Luminex-34B-v0.1 的评估运行过程中。
- 组成: 包含 136 个配置,每个配置对应一个评估任务。
- 创建方式: 从 1 次运行中创建,每次运行对应一个特定的分割,分割名称使用运行的时间戳。
- 额外配置: 包含一个名为 "results" 的配置,存储所有运行的聚合结果。
数据加载示例
```python
from datasets import load_dataset

data = load_dataset(
    "OALL/details_ConvexAI__Luminex-34B-v0.1",
    "lighteval_xstory_cloze_ar_0",
    split="train",
)
```
最新结果
- 时间戳: 2024-06-09T19:07:11.018642
- 结果: 包含多个任务的评估结果,具体结果如下:
python { "all": { "acc_norm": 0.47087734770401, "acc_norm_stderr": 0.03798774954289448, "acc": 0.5744540039708802, "acc_stderr": 0.01272367041916633 }, "community|acva:Algeria|0": { "acc_norm": 0.517948717948718, "acc_norm_stderr": 0.03587477098773825 }, "community|acva:Ancient_Egypt|0": { "acc_norm": 0.6634920634920635, "acc_norm_stderr": 0.02666555933592602 }, "community|acva:Arab_Empire|0": { "acc_norm": 0.4, "acc_norm_stderr": 0.0301511344577763 }, "community|acva:Arabic_Architecture|0": { "acc_norm": 0.6410256410256411, "acc_norm_stderr": 0.03444042881521375 }, "community|acva:Arabic_Art|0": { "acc_norm": 0.47692307692307695, "acc_norm_stderr": 0.03585965308947411 }, "community|acva:Arabic_Astronomy|0": { "acc_norm": 0.5128205128205128, "acc_norm_stderr": 0.03588610523192216 }, "community|acva:Arabic_Calligraphy|0": { "acc_norm": 0.7019607843137254, "acc_norm_stderr": 0.02869962835498248 }, "community|acva:Arabic_Ceremony|0": { "acc_norm": 0.572972972972973, "acc_norm_stderr": 0.03646580777990099 }, "community|acva:Arabic_Clothing|0": { "acc_norm": 0.6051282051282051, "acc_norm_stderr": 0.03509545602262039 }, "community|acva:Arabic_Culture|0": { "acc_norm": 0.7076923076923077, "acc_norm_stderr": 0.032654383937495104 }, "community|acva:Arabic_Food|0": { "acc_norm": 0.6820512820512821, "acc_norm_stderr": 0.03343383454355787 }, "community|acva:Arabic_Funeral|0": { "acc_norm": 0.5368421052631579, "acc_norm_stderr": 0.05143087276324537 }, "community|acva:Arabic_Geography|0": { "acc_norm": 0.5241379310344828, "acc_norm_stderr": 0.041618085035015295 }, "community|acva:Arabic_History|0": { "acc_norm": 0.4564102564102564, "acc_norm_stderr": 0.035761230969912135 }, "community|acva:Arabic_Language_Origin|0": { "acc_norm": 0.7263157894736842, "acc_norm_stderr": 0.04598579376319263 }, "community|acva:Arabic_Literature|0": { "acc_norm": 0.5724137931034483, "acc_norm_stderr": 0.04122737111370331 }, "community|acva:Arabic_Math|0": { "acc_norm": 0.35384615384615387, 
"acc_norm_stderr": 0.03433004254147036 }, "community|acva:Arabic_Medicine|0": { "acc_norm": 0.6, "acc_norm_stderr": 0.040824829046386284 }, "community|acva:Arabic_Music|0": { "acc_norm": 0.48201438848920863, "acc_norm_stderr": 0.042535280989201354 }, "community|acva:Arabic_Ornament|0": { "acc_norm": 0.6256410256410256, "acc_norm_stderr": 0.03474608430626235 }, "community|acva:Arabic_Philosophy|0": { "acc_norm": 0.7310344827586207, "acc_norm_stderr": 0.03695183311650232 }, "community|acva:Arabic_Physics_and_Chemistry|0": { "acc_norm": 0.7487179487179487, "acc_norm_stderr": 0.031141461571214366 }, "community|acva:Arabic_Wedding|0": { "acc_norm": 0.7128205128205128, "acc_norm_stderr": 0.03248373338539885 }, "community|acva:Bahrain|0": { "acc_norm": 0.6444444444444445, "acc_norm_stderr": 0.07216392363431012 }, "community|acva:Comoros|0": { "acc_norm": 0.5777777777777777, "acc_norm_stderr": 0.07446027270295806 }, "community|acva:Egypt_modern|0": { "acc_norm": 0.6210526315789474, "acc_norm_stderr": 0.050036822652392066 }, "community|acva:InfluenceFromAncientEgypt|0": { "acc_norm": 0.6923076923076923, "acc_norm_stderr": 0.03313653039774172 }, "community|acva:InfluenceFromByzantium|0": { "acc_norm": 0.7862068965517242, "acc_norm_stderr": 0.03416520447747548 }, "community|acva:InfluenceFromChina|0": { "acc_norm": 0.4205128205128205, "acc_norm_stderr": 0.03544138389303483 }, "community|acva:InfluenceFromGreece|0": { "acc_norm": 0.7333333333333333, "acc_norm_stderr": 0.031749304364126714 }, "community|acva:InfluenceFromIslam|0": { "acc_norm": 0.7034482758620689, "acc_norm_stderr": 0.03806142687309992 }, "community|acva:InfluenceFromPersia|0": { "acc_norm": 0.8457142857142858, "acc_norm_stderr": 0.027384200564099657 }, "community|acva:InfluenceFromRome|0": { "acc_norm": 0.6307692307692307, "acc_norm_stderr": 0.03464841141863756 }, "community|acva:Iraq|0": { "acc_norm": 0.611764705882353, "acc_norm_stderr": 0.05317409082203827 }, "community|acva:Islam_Education|0": { 
"acc_norm": 0.5692307692307692, "acc_norm_stderr": 0.03555213252058761 }, "community|acva:Islam_branches_and_schools|0": { "acc_norm": 0.4114285714285714, "acc_norm_stderr": 0.03730544181135405 }, "community|acva:Islamic_law_system|0": { "acc_norm": 0.6153846153846154, "acc_norm_stderr": 0.03492896993742303 }, "community|acva:Jordan|0": { "acc_norm": 0.5333333333333333, "acc_norm_stderr": 0.0752101433090355 }, "community|acva:Kuwait|0": { "acc_norm": 0.6666666666666666, "acc_norm_stderr": 0.07106690545187012 }, "community|acva:Lebanon|0": { "acc_norm": 0.6666666666666666, "acc_norm_stderr": 0.07106690545187014 }, "community|acva:Libya|0": { "acc_norm": 0.5555555555555556, "acc_norm_stderr": 0.07491109582924914 }, "community|acva:Mauritania|0": { "acc_norm": 0.4444444444444444, "acc_norm_stderr": 0.07491109582924915 }, "community|acva:Mesopotamia_civilization|0": { "acc_norm": 0.6129032258064516, "acc_norm_stderr": 0.03925051588729524 }, "community|acva:Morocco|0": { "acc_norm": 0.6, "acc_norm_stderr": 0.07385489458759965 }, "community|acva:Oman|0": { "acc_norm": 0.8444444444444444, "acc_norm_stderr": 0.05463890236888295 }, "community|acva:Palestine|0": { "acc_norm": 0.47058823529411764, "acc_norm_stderr": 0.0544600058689736 }, "community|acva:Qatar|0": { "acc_norm": 0.7333333333333333, "acc_norm_stderr": 0.06666666666666668 }, "community|acva:Saudi_Arabia|0": { "acc_norm": 0.6, "acc_norm_stderr": 0.0351726229056329 }, "community|acva:Somalia|0": { "acc_norm": 0.6, "acc_norm_stderr": 0.07385489458759965 }, "community|acva:Sudan|0": { "acc_norm": 0.6444444444444445, "acc_norm_stderr": 0.0721639



