From 77ce2797494d76d39945e2fa6208b33fffaf94d4 Mon Sep 17 00:00:00 2001 From: github-actions <41898282+github-actions[bot]@users.noreply.github.com> Date: Mon, 13 Jan 2025 11:18:36 +0000 Subject: [PATCH] auto: update csv outputs to version 2025.01.13 --- csv/huggingface_v2.csv | 232 +++++++++++++++++++++-------------------- csv/merged.csv | 24 ++--- 2 files changed, 130 insertions(+), 126 deletions(-) diff --git a/csv/huggingface_v2.csv b/csv/huggingface_v2.csv index 7afca9a..74ba1bd 100644 --- a/csv/huggingface_v2.csv +++ b/csv/huggingface_v2.csv @@ -18,7 +18,7 @@ id,model_name,model_sha,model_precision,model_type,model_weight_type,model_archi 01-ai/Yi-6B-Chat_bfloat16_01f7fabb6cfb26efeb764da4a0a19cad2c754232_True,01-ai/Yi-6B-Chat,01f7fabb6cfb26efeb764da4a0a19cad2c754232,bfloat16,chatmodels,Original,LlamaForCausalLM,14.0043569538772,TRUE,IFEval,0.339521358883319,33.9521358883319,BBH,0.413260192075487,17.0001665674238,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.294463087248322,5.92841163310962,MUSR,0.368791666666667,3.565625,MMLU-PRO,0.30610039893617,22.9000443262411,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-22,2024-06-12,0,01-ai/Yi-6B-Chat,apache-2.0,64,6.061,0.555332836121801 01-ai/Yi-9B_bfloat16_b4a466d95091696285409f1dcca3028543cb39da_False,01-ai/Yi-9B,b4a466d95091696285409f1dcca3028543cb39da,bfloat16,pretrained,Original,LlamaForCausalLM,17.7741030172929,FALSE,IFEval,0.270877937206612,27.0877937206612,BBH,0.493960751253081,27.6269561120779,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.317953020134228,9.06040268456376,MUSR,0.40540625,8.90911458333333,MMLU-PRO,0.357380319148936,28.5978132387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-01,2024-06-12,0,01-ai/Yi-9B,apache-2.0,186,8.829,0.765331980708509 01-ai/Yi-9B-200K_bfloat16_8c93accd5589dbb74ee938e103613508c4a9b88d_False,01-ai/Yi-9B-200K,8c93accd5589dbb74ee938e103613508c4a9b88d,bfloat16,pretrained,Original,LlamaForCausalLM,17.7421399029321,FALSE,IFEval,0.232709211558664,23.2709211558664,BBH,0.479330260202364,26.4924950971475,MATH Level 5,0.0672205438066465,6.72205438066465,GPQA,0.315436241610738,8.7248322147651,MUSR,0.42940625,12.1091145833333,MMLU-PRO,0.36220079787234,29.1334219858156,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-15,2024-06-12,0,01-ai/Yi-9B-200K,apache-2.0,75,8.829,0.774491171896652 -01-ai/Yi-Coder-9B-Chat_bfloat16_356a1f8d4e4a606d0b879e54191ca809918576b8_True,01-ai/Yi-Coder-9B-Chat,356a1f8d4e4a606d0b879e54191ca809918576b8,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,16.8726962635044,TRUE,IFEval,0.481704100675098,48.1704100675098,BBH,0.481420003391117,25.9431529449139,MATH Level 5,0.0332326283987915,3.32326283987915,GPQA,0.24748322147651,0,MUSR,0.399177083333333,7.96380208333333,MMLU-PRO,0.242519946808511,15.8355496453901,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-21,2024-09-12,1,01-ai/Yi-Coder-9B,apache-2.0,194,8.829,0.909766114796084 +01-ai/Yi-Coder-9B-Chat_bfloat16_356a1f8d4e4a606d0b879e54191ca809918576b8_True,01-ai/Yi-Coder-9B-Chat,356a1f8d4e4a606d0b879e54191ca809918576b8,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,16.8726962635044,TRUE,IFEval,0.481704100675098,48.1704100675098,BBH,0.481420003391117,25.9431529449139,MATH Level 5,0.0332326283987915,3.32326283987915,GPQA,0.24748322147651,0,MUSR,0.399177083333333,7.96380208333333,MMLU-PRO,0.242519946808511,15.8355496453901,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-21,2024-09-12,1,01-ai/Yi-Coder-9B,apache-2.0,195,8.829,0.909766114796084 152334H/miqu-1-70b-sf_float16_1dca4cce36f01f2104ee2e6b97bac6ff7bb300c1_False,152334H/miqu-1-70b-sf,1dca4cce36f01f2104ee2e6b97bac6ff7bb300c1,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,29.0596433757835,FALSE,IFEval,0.518174000540787,51.8174000540787,BBH,0.610236168509969,43.807147003692,MATH Level 5,0.122356495468278,12.2356495468278,GPQA,0.350671140939597,13.4228187919463,MUSR,0.458208333333333,17.209375,MMLU-PRO,0.422789228723404,35.865469858156,FALSE,FALSE,FALSE,FALSE,FALSE,2024-01-30,2024-06-26,0,152334H/miqu-1-70b-sf,"",220,68.977,6.09898597691416 1TuanPham/T-VisStar-7B-v0.1_float16_b111b59971c14b46c888b96723ff7f3c7b6fd92f_True,1TuanPham/T-VisStar-7B-v0.1,b111b59971c14b46c888b96723ff7f3c7b6fd92f,float16,chatmodels,Original,MistralForCausalLM,19.0441036763536,TRUE,IFEval,0.360704043050218,36.0704043050218,BBH,0.505220311335247,30.243834478826,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.285234899328859,4.6979865771812,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.321060505319149,24.5622783687943,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-19,2024-09-22,0,1TuanPham/T-VisStar-7B-v0.1,apache-2.0,2,7.294,1.2695126379214 1TuanPham/T-VisStar-v0.1_float16_c9779bd9630a533f7e42fd8effcca69623d48c9c_True,1TuanPham/T-VisStar-v0.1,c9779bd9630a533f7e42fd8effcca69623d48c9c,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.0441036763536,TRUE,IFEval,0.360704043050218,36.0704043050218,BBH,0.505220311335247,30.243834478826,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.285234899328859,4.6979865771812,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.321060505319149,24.5622783687943,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-19,2024-09-20,0,1TuanPham/T-VisStar-v0.1,apache-2.0,2,7.294,0.624384413568203 @@ -36,7 +36,7 @@ AELLM/gemma-2-lyco-infinity-9b_bfloat16_2941a682fcbcfea3f1485c9e0691cc1d9edc742e AGI-0/Artificium-llama3.1-8B-001_float16_6bf3dcca3b75a06a4e04e5f944e709cccf4673fd_True,AGI-0/Artificium-llama3.1-8B-001,6bf3dcca3b75a06a4e04e5f944e709cccf4673fd,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.0638219529364,TRUE,IFEval,0.524768724761411,52.4768724761411,BBH,0.425621502259236,19.3488980732397,MATH Level 5,0.110271903323263,11.0271903323263,GPQA,0.265939597315436,2.12527964205817,MUSR,0.379458333333333,5.165625,MMLU-PRO,0.318151595744681,24.2390661938534,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-08,0,Removed,"",0,8.03,1.86032650369272 AGI-0/smartllama3.1-8B-001_float16_974d5ee685f1be003a1d8d08e907fe672d225035_False,AGI-0/smartllama3.1-8B-001,974d5ee685f1be003a1d8d08e907fe672d225035,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.2357303253963,FALSE,IFEval,0.351786592906821,35.1786592906821,BBH,0.467017875108682,24.8577369132814,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.306208053691275,7.49440715883669,MUSR,0.438645833333333,14.3973958333333,MMLU-PRO,0.348653590425532,27.628176713948,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-25,0,Removed,"",0,8.03,0.718834247509005 AI-MO/NuminaMath-7B-CoT_bfloat16_ff7e3044218efe64128bd9c21f9ec66c3de04324_True,AI-MO/NuminaMath-7B-CoT,ff7e3044218efe64128bd9c21f9ec66c3de04324,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.0973091817693,TRUE,IFEval,0.268854417390302,26.8854417390302,BBH,0.431419349586001,19.1523642820903,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.265939597315436,2.12527964205817,MUSR,0.33034375,0.826302083333333,MMLU-PRO,0.286818484042553,20.7576093380615,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-15,2024-09-10,1,deepseek-ai/deepseek-math-7b-base,apache-2.0,19,6.91,0.745988957719221 -AI-MO/NuminaMath-7B-TIR_bfloat16_c6e394cc0579423c9cde6df6cc192c07dae73388_False,AI-MO/NuminaMath-7B-TIR,c6e394cc0579423c9cde6df6cc192c07dae73388,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.8157231814413,FALSE,IFEval,0.275624232591745,27.5624232591746,BBH,0.414369133758979,16.8735472579587,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.258389261744966,1.11856823266219,MUSR,0.350927083333333,4.19921875,MMLU-PRO,0.273271276595745,19.2523640661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-04,2024-07-11,1,deepseek-ai/deepseek-math-7b-base,apache-2.0,325,6.91,1.07410978749413 +AI-MO/NuminaMath-7B-TIR_bfloat16_c6e394cc0579423c9cde6df6cc192c07dae73388_False,AI-MO/NuminaMath-7B-TIR,c6e394cc0579423c9cde6df6cc192c07dae73388,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.8157231814413,FALSE,IFEval,0.275624232591745,27.5624232591746,BBH,0.414369133758979,16.8735472579587,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.258389261744966,1.11856823266219,MUSR,0.350927083333333,4.19921875,MMLU-PRO,0.273271276595745,19.2523640661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-04,2024-07-11,1,deepseek-ai/deepseek-math-7b-base,apache-2.0,326,6.91,1.07410978749413 AI-Sweden-Models/Llama-3-8B-instruct_bfloat16_4e1c955228bdb4d69c1c4560e8d5872312a8f033_True,AI-Sweden-Models/Llama-3-8B-instruct,4e1c955228bdb4d69c1c4560e8d5872312a8f033,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.7772044149452,TRUE,IFEval,0.240128414828211,24.0128414828211,BBH,0.41734601545153,18.3880956150275,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.265939597315436,2.12527964205817,MUSR,0.47709375,19.93671875,MMLU-PRO,0.259724069148936,17.7471187943262,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-01,2024-06-27,2,meta-llama/Meta-Llama-3-8B,llama3,10,8.03,1.16611088086752 AI-Sweden-Models/gpt-sw3-40b_float16_1af27994df1287a7fac1b10d60e40ca43a22a385_False,AI-Sweden-Models/gpt-sw3-40b,1af27994df1287a7fac1b10d60e40ca43a22a385,float16,pretrained,Original,GPT2LMHeadModel,4.73443320029372,FALSE,IFEval,0.147029880716499,14.7029880716499,BBH,0.326774470295765,6.89493405079658,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.23489932885906,0,MUSR,0.363239583333333,2.83828125,MMLU-PRO,0.127576462765957,3.06405141843972,TRUE,FALSE,FALSE,FALSE,FALSE,2023-02-22,2024-06-26,0,AI-Sweden-Models/gpt-sw3-40b,other,10,39.927,2.95981936505708 Aashraf995/Creative-7B-nerd_bfloat16_fc24bca48549ef8e39cbee5a438e5a16e25e4afa_False,Aashraf995/Creative-7B-nerd,fc24bca48549ef8e39cbee5a438e5a16e25e4afa,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,29.4620797264411,FALSE,IFEval,0.472187130148007,47.2187130148007,BBH,0.56067855656402,37.0801538173552,MATH Level 5,0.285498489425982,28.5498489425982,GPQA,0.326342281879195,10.1789709172259,MUSR,0.451541666666667,14.9427083333333,MMLU-PRO,0.44921875,38.8020833333333,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-13,2024-12-13,1,Aashraf995/Creative-7B-nerd (Merge),apache-2.0,2,7.616,0.648867000524312 @@ -109,10 +109,10 @@ BoltMonkey/NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated_bfloat16_969e4 BoltMonkey/NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated_float16_969e4c9b41e733a367f5ea18ed50a6171b5e2357_False,BoltMonkey/NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated,969e4c9b41e733a367f5ea18ed50a6171b5e2357,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,21.3455105902695,FALSE,IFEval,0.459023169634348,45.9023169634348,BBH,0.518544191244718,30.7937847526593,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.274328859060403,3.24384787472036,MUSR,0.408260416666667,9.53255208333334,MMLU-PRO,0.363115026595745,29.2350029550827,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-01,2024-10-01,1,BoltMonkey/NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated (Merge),llama3.1,2,8.03,0.774318574067633 BoltMonkey/SuperNeuralDreadDevil-8b_bfloat16_804d5864127e603abec179a159b43f446246fafc_True,BoltMonkey/SuperNeuralDreadDevil-8b,804d5864127e603abec179a159b43f446246fafc,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,21.8477261012612,TRUE,IFEval,0.485801007992128,48.5801007992128,BBH,0.515107801571382,30.6067137896696,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.285234899328859,4.6979865771812,MUSR,0.415947916666667,10.4268229166667,MMLU-PRO,0.349401595744681,27.7112884160757,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-13,2024-10-13,1,BoltMonkey/SuperNeuralDreadDevil-8b (Merge),"",1,8.03,2.40533122936953 BrainWave-ML/llama3.2-3B-maths-orpo_float16_d149d83d8e8f3883421d800848fec85766181923_False,BrainWave-ML/llama3.2-3B-maths-orpo,d149d83d8e8f3883421d800848fec85766181923,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,5.07608283209792,FALSE,IFEval,0.204907423414318,20.4907423414319,BBH,0.291177810298844,2.34704095752041,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.35753125,4.52473958333333,MMLU-PRO,0.116771941489362,1.86354905437352,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-24,2024-10-24,2,meta-llama/Llama-3.2-3B-Instruct,apache-2.0,2,3,0.707219058323977 -BramVanroy/GEITje-7B-ultra_bfloat16_d4552cdc6f015754646464d8411aa4f6bcdba8e8_True,BramVanroy/GEITje-7B-ultra,d4552cdc6f015754646464d8411aa4f6bcdba8e8,bfloat16,chatmodels,Original,MistralForCausalLM,10.909605767857,TRUE,IFEval,0.372344268762439,37.2344268762439,BBH,0.377616129973055,12.8799130100359,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.26258389261745,1.67785234899329,MUSR,0.328979166666667,1.52239583333333,MMLU-PRO,0.201130319148936,11.2367021276596,TRUE,FALSE,FALSE,FALSE,FALSE,2024-01-27,2024-10-28,3,mistralai/Mistral-7B-v0.1,cc-by-nc-4.0,37,7.242,0.619523220998688 +BramVanroy/GEITje-7B-ultra_bfloat16_d4552cdc6f015754646464d8411aa4f6bcdba8e8_True,BramVanroy/GEITje-7B-ultra,d4552cdc6f015754646464d8411aa4f6bcdba8e8,bfloat16,chatmodels,Original,MistralForCausalLM,10.909605767857,TRUE,IFEval,0.372344268762439,37.2344268762439,BBH,0.377616129973055,12.8799130100359,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.26258389261745,1.67785234899329,MUSR,0.328979166666667,1.52239583333333,MMLU-PRO,0.201130319148936,11.2367021276596,TRUE,FALSE,FALSE,FALSE,FALSE,2024-01-27,2024-10-28,3,mistralai/Mistral-7B-v0.1,cc-by-nc-4.0,38,7.242,0.619523220998688 BramVanroy/fietje-2_bfloat16_3abe75d01094b713368e3d911ffb78a2d66ead22_False,BramVanroy/fietje-2,3abe75d01094b713368e3d911ffb78a2d66ead22,bfloat16,continuouslypretrained,Original,PhiForCausalLM,9.02700742645131,FALSE,IFEval,0.209803321852684,20.9803321852684,BBH,0.403566951783862,15.6036761925679,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.254194630872483,0.559284116331097,MUSR,0.3695625,5.16197916666667,MMLU-PRO,0.198553856382979,10.9504284869976,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-09,2024-10-28,1,microsoft/phi-2,mit,7,2.78,0.312538644411375 -BramVanroy/fietje-2-chat_bfloat16_364e785d90438b787b94e33741a930c9932353c0_True,BramVanroy/fietje-2-chat,364e785d90438b787b94e33741a930c9932353c0,bfloat16,chatmodels,Original,PhiForCausalLM,10.3888691075389,TRUE,IFEval,0.291735927339459,29.1735927339459,BBH,0.4149753717402,17.7189658483235,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.23993288590604,0,MUSR,0.352760416666667,3.19505208333333,MMLU-PRO,0.205452127659574,11.7169030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-10-28,3,microsoft/phi-2,mit,1,2.775,0.399032708170906 -BramVanroy/fietje-2-instruct_bfloat16_b7b44797cd52eda1182667217e8371dbdfee4976_True,BramVanroy/fietje-2-instruct,b7b44797cd52eda1182667217e8371dbdfee4976,bfloat16,chatmodels,Original,PhiForCausalLM,10.1961916875489,TRUE,IFEval,0.278996396228673,27.8996396228673,BBH,0.413607141730298,17.5724798088476,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.233221476510067,0,MUSR,0.336916666666667,2.91458333333333,MMLU-PRO,0.210355718085106,12.2617464539007,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-27,2024-10-28,2,microsoft/phi-2,mit,2,2.775,0.324395092917699 +BramVanroy/fietje-2-chat_bfloat16_364e785d90438b787b94e33741a930c9932353c0_True,BramVanroy/fietje-2-chat,364e785d90438b787b94e33741a930c9932353c0,bfloat16,chatmodels,Original,PhiForCausalLM,10.3888691075389,TRUE,IFEval,0.291735927339459,29.1735927339459,BBH,0.4149753717402,17.7189658483235,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.23993288590604,0,MUSR,0.352760416666667,3.19505208333333,MMLU-PRO,0.205452127659574,11.7169030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-10-28,3,microsoft/phi-2,mit,2,2.775,0.399032708170906 +BramVanroy/fietje-2-instruct_bfloat16_b7b44797cd52eda1182667217e8371dbdfee4976_True,BramVanroy/fietje-2-instruct,b7b44797cd52eda1182667217e8371dbdfee4976,bfloat16,chatmodels,Original,PhiForCausalLM,10.1961916875489,TRUE,IFEval,0.278996396228673,27.8996396228673,BBH,0.413607141730298,17.5724798088476,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.233221476510067,0,MUSR,0.336916666666667,2.91458333333333,MMLU-PRO,0.210355718085106,12.2617464539007,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-27,2024-10-28,2,microsoft/phi-2,mit,3,2.775,0.324395092917699 CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct_float16_5be46c768d800447b82de41fdc9df2f8c43ba3c0_True,CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct,5be46c768d800447b82de41fdc9df2f8c43ba3c0,float16,chatmodels,Original,LlamaForCausalLM,20.5008910053068,TRUE,IFEval,0.719882134957468,71.9882134957469,BBH,0.442671908082079,21.4973103328035,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.270973154362416,2.79642058165548,MUSR,0.364916666666667,3.98125,MMLU-PRO,0.282247340425532,20.2497044917258,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-12-20,1,CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct (Merge),llama3.2,8,3.213,0.567953731894678 CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412_float16_ac6f1c0b756412163e17cb05d9e2f7ced274dc12_False,CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412,ac6f1c0b756412163e17cb05d9e2f7ced274dc12,float16,chatmodels,Original,LlamaForCausalLM,20.2388147588296,FALSE,IFEval,0.478182333984938,47.8182333984938,BBH,0.435772464982467,20.175679614215,MATH Level 5,0.172205438066465,17.2205438066465,GPQA,0.292785234899329,5.70469798657718,MUSR,0.387208333333333,6.80104166666667,MMLU-PRO,0.313414228723404,23.7126920803782,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-03,2024-12-19,1,CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412 (Merge),llama3.2,0,3.213,0.643589333680084 Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B_bfloat16_b46c066ea8387264858dc3461f382e7b42fd9c48_True,Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B,b46c066ea8387264858dc3461f382e7b42fd9c48,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,25.9119269260344,TRUE,IFEval,0.712263460950279,71.2263460950279,BBH,0.526240614549372,32.4862776238149,MATH Level 5,0.110271903323263,11.0271903323263,GPQA,0.286912751677852,4.92170022371365,MUSR,0.368666666666667,5.55,MMLU-PRO,0.372340425531915,30.2600472813239,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-26,2024-07-02,1,Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B (Merge),llama3,13,8.03,0.988384908126601 @@ -131,7 +131,7 @@ CohereForAI/aya-expanse-8b_float16_b9848575c8731981dfcf2e1f3bfbcb917a2e585d_True CohereForAI/c4ai-command-r-plus_float16_fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca_True,CohereForAI/c4ai-command-r-plus,fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca,float16,chatmodels,Original,CohereForCausalLM,30.961246846254,TRUE,IFEval,0.766418658049531,76.6418658049531,BBH,0.581542357407793,39.9199542314318,MATH Level 5,0.081570996978852,8.1570996978852,GPQA,0.305369127516779,7.38255033557047,MUSR,0.48071875,20.4231770833333,MMLU-PRO,0.399185505319149,33.2428339243499,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-03,2024-06-13,0,CohereForAI/c4ai-command-r-plus,cc-by-nc-4.0,1700,103.811,28.6315317116708 CohereForAI/c4ai-command-r-plus-08-2024_float16_2d8cf3ab0af78b9e43546486b096f86adf3ba4d0_True,CohereForAI/c4ai-command-r-plus-08-2024,2d8cf3ab0af78b9e43546486b096f86adf3ba4d0,float16,chatmodels,Original,CohereForCausalLM,33.5845340114894,TRUE,IFEval,0.753953953288386,75.3953953288386,BBH,0.599599991302719,42.836865407707,MATH Level 5,0.120090634441088,12.0090634441088,GPQA,0.350671140939597,13.4228187919463,MUSR,0.482947916666667,19.83515625,MMLU-PRO,0.442071143617021,38.0079048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-21,2024-09-19,0,CohereForAI/c4ai-command-r-plus-08-2024,cc-by-nc-4.0,216,103.811,22.3188766676731 CohereForAI/c4ai-command-r-v01_float16_16881ccde1c68bbc7041280e6a66637bc46bfe88_True,CohereForAI/c4ai-command-r-v01,16881ccde1c68bbc7041280e6a66637bc46bfe88,float16,chatmodels,Original,CohereForCausalLM,25.3499784613365,TRUE,IFEval,0.674819478982433,67.4819478982433,BBH,0.540641551276786,34.5566592570583,MATH Level 5,0,0,GPQA,0.307046979865772,7.60626398210291,MUSR,0.451697916666667,16.12890625,MMLU-PRO,0.336934840425532,26.3260933806147,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-11,2024-06-13,0,CohereForAI/c4ai-command-r-v01,cc-by-nc-4.0,1073,34.981,13.3954372669898 -CohereForAI/c4ai-command-r7b-12-2024_bfloat16_a9650f3bda8b0e00825ee36592e086b4ee621102_True,CohereForAI/c4ai-command-r7b-12-2024,a9650f3bda8b0e00825ee36592e086b4ee621102,bfloat16,chatmodels,Original,Cohere2ForCausalLM,31.0762402648343,TRUE,IFEval,0.771314556487897,77.1314556487897,BBH,0.550264215185564,36.0245641700103,MATH Level 5,0.266616314199396,26.6616314199396,GPQA,0.308724832214765,7.82997762863535,MUSR,0.412510416666667,10.23046875,MMLU-PRO,0.357214095744681,28.5793439716312,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-20,0,CohereForAI/c4ai-command-r7b-12-2024,cc-by-nc-4.0,329,8.028,2.45480693599537 +CohereForAI/c4ai-command-r7b-12-2024_bfloat16_a9650f3bda8b0e00825ee36592e086b4ee621102_True,CohereForAI/c4ai-command-r7b-12-2024,a9650f3bda8b0e00825ee36592e086b4ee621102,bfloat16,chatmodels,Original,Cohere2ForCausalLM,31.0762402648343,TRUE,IFEval,0.771314556487897,77.1314556487897,BBH,0.550264215185564,36.0245641700103,MATH Level 5,0.266616314199396,26.6616314199396,GPQA,0.308724832214765,7.82997762863535,MUSR,0.412510416666667,10.23046875,MMLU-PRO,0.357214095744681,28.5793439716312,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-20,0,CohereForAI/c4ai-command-r7b-12-2024,cc-by-nc-4.0,331,8.028,2.45480693599537 Columbia-NLP/LION-Gemma-2b-dpo-v1.0_float16_a5f780075831374f8850324448acf94976dea504_True,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,a5f780075831374f8850324448acf94976dea504,float16,chatmodels,Original,GemmaForCausalLM,11.4839947622434,TRUE,IFEval,0.327831265486686,32.7831265486686,BBH,0.391995636132075,14.5859760938158,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.249161073825503,0,MUSR,0.412010416666667,9.83463541666667,MMLU-PRO,0.16655585106383,7.39509456264775,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-04,0,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,"",0,2.506,0.97964847425047 Columbia-NLP/LION-Gemma-2b-dpo-v1.0_bfloat16_a5f780075831374f8850324448acf94976dea504_True,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,a5f780075831374f8850324448acf94976dea504,bfloat16,chatmodels,Original,GemmaForCausalLM,11.1487995452652,TRUE,IFEval,0.310245703621945,31.0245703621945,BBH,0.388103091595545,14.2430456477269,MATH Level 5,0.0468277945619336,4.68277945619336,GPQA,0.253355704697987,0.447427293064876,MUSR,0.408072916666667,9.10911458333334,MMLU-PRO,0.166472739361702,7.38585992907801,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-04,0,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,"",0,2.506,0.99456912017475 Columbia-NLP/LION-Gemma-2b-odpo-v1.0_bfloat16_090d9f59c3b47ab8dd099ddd278c058aa6d2d529_True,Columbia-NLP/LION-Gemma-2b-odpo-v1.0,090d9f59c3b47ab8dd099ddd278c058aa6d2d529,bfloat16,chatmodels,Original,GemmaForCausalLM,11.4567947643227,TRUE,IFEval,0.306648581319787,30.6648581319787,BBH,0.389583621070688,14.0239216654163,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.24244966442953,0,MUSR,0.427916666666667,12.05625,MMLU-PRO,0.169215425531915,7.69060283687943,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-13,0,Columbia-NLP/LION-Gemma-2b-odpo-v1.0,"",4,2.506,0.962068098338517 @@ -145,7 +145,7 @@ CombinHorizon/YiSM-blossom5.1-34B-SLERP_bfloat16_ebd8d6507623008567a0548cd0ff9e2 CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES_bfloat16_3284c32f13733d1cd17c723ed754f2c01b65a15c_True,CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES,3284c32f13733d1cd17c723ed754f2c01b65a15c,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,35.7509991621967,TRUE,IFEval,0.820623722833194,82.0623722833194,BBH,0.692924708291253,56.044781840899,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.420729166666667,12.0911458333333,MMLU-PRO,0.572057845744681,52.450871749409,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-07,2024-12-07,1,CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES (Merge),apache-2.0,1,32.764,13.0004215620151 CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES_bfloat16_d92237b4b4deccb92a72b5209c79978f09fe3f08_True,CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES,d92237b4b4deccb92a72b5209c79978f09fe3f08,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,32.3398261648922,TRUE,IFEval,0.817576253230318,81.7576253230318,BBH,0.633589155642108,47.7673460059098,MATH Level 5,0,0,GPQA,0.314597315436242,8.61297539149888,MUSR,0.42603125,12.45390625,MMLU-PRO,0.491023936170213,43.4471040189125,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-07,2024-12-07,1,CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES (Merge),apache-2.0,2,14.77,1.66712961175144 CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES_bfloat16_d976a5d6768d54c5e59a88fe63238a055c30c06a_True,CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES,d976a5d6768d54c5e59a88fe63238a055c30c06a,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.0078306720072,TRUE,IFEval,0.832813601244697,83.2813601244697,BBH,0.695517442713859,56.8274069777257,MATH Level 5,0,0,GPQA,0.36744966442953,15.6599552572707,MUSR,0.431395833333333,14.2244791666667,MMLU-PRO,0.568484042553192,52.0537825059102,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-07,2024-12-20,1,CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES (Merge),apache-2.0,3,32.764,3.68331757286267 -ContactDoctor/Bio-Medical-Llama-3-8B_float16_5436cda92c65b0ef520d278d864305c0f429824b_False,ContactDoctor/Bio-Medical-Llama-3-8B,5436cda92c65b0ef520d278d864305c0f429824b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0055694875385,FALSE,IFEval,0.442236598890943,44.2236598890943,BBH,0.486311802622738,26.1958112960282,MATH Level 5,0.0725075528700906,7.25075528700906,GPQA,0.333892617449664,11.1856823266219,MUSR,0.351395833333333,1.7578125,MMLU-PRO,0.364777260638298,29.4196956264775,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-09,2024-12-24,1,meta-llama/Meta-Llama-3-8B-Instruct,other,38,4.015,0.617558255108524 +ContactDoctor/Bio-Medical-Llama-3-8B_float16_5436cda92c65b0ef520d278d864305c0f429824b_False,ContactDoctor/Bio-Medical-Llama-3-8B,5436cda92c65b0ef520d278d864305c0f429824b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0055694875385,FALSE,IFEval,0.442236598890943,44.2236598890943,BBH,0.486311802622738,26.1958112960282,MATH Level 5,0.0725075528700906,7.25075528700906,GPQA,0.333892617449664,11.1856823266219,MUSR,0.351395833333333,1.7578125,MMLU-PRO,0.364777260638298,29.4196956264775,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-09,2024-12-24,1,meta-llama/Meta-Llama-3-8B-Instruct,other,39,4.015,0.617558255108524 CoolSpring/Qwen2-0.5B-Abyme_bfloat16_a48b7c04b854e5c60fe3464f96904bfc53c8640c_True,CoolSpring/Qwen2-0.5B-Abyme,a48b7c04b854e5c60fe3464f96904bfc53c8640c,bfloat16,chatmodels,Original,Qwen2ForCausalLM,4.79858438213377,TRUE,IFEval,0.191518504235429,19.1518504235429,BBH,0.286183429648183,2.27648357059719,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.253355704697987,0.447427293064876,MUSR,0.35421875,1.47734375,MMLU-PRO,0.133311170212766,3.70124113475177,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-18,2024-09-04,1,Qwen/Qwen2-0.5B,apache-2.0,0,0.494,1.17779730854258 CoolSpring/Qwen2-0.5B-Abyme-merge2_bfloat16_02c4c601453f7ecbfab5c95bf5afa889350026ba_True,CoolSpring/Qwen2-0.5B-Abyme-merge2,02c4c601453f7ecbfab5c95bf5afa889350026ba,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,6.11884829377557,TRUE,IFEval,0.202184647845494,20.2184647845494,BBH,0.299427230091387,3.70904139433551,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.26006711409396,1.34228187919463,MUSR,0.368729166666667,3.89114583333333,MMLU-PRO,0.148936170212766,5.43735224586288,TRUE,TRUE,FALSE,FALSE,FALSE,2024-07-27,2024-07-27,1,CoolSpring/Qwen2-0.5B-Abyme-merge2 (Merge),apache-2.0,0,0.63,0.609695444210368 CoolSpring/Qwen2-0.5B-Abyme-merge3_bfloat16_86fed893893cc2a6240f0ea09ce2eeda1a5178cc_True,CoolSpring/Qwen2-0.5B-Abyme-merge3,86fed893893cc2a6240f0ea09ce2eeda1a5178cc,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,6.70690303165168,TRUE,IFEval,0.238604680026773,23.8604680026773,BBH,0.300314045259337,4.30114916286149,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.264261744966443,1.90156599552573,MUSR,0.35009375,2.12838541666667,MMLU-PRO,0.150016622340426,5.5574024822695,TRUE,TRUE,FALSE,FALSE,FALSE,2024-07-27,2024-07-27,1,CoolSpring/Qwen2-0.5B-Abyme-merge3 (Merge),apache-2.0,0,0.63,0.610171331712806 @@ -158,7 +158,7 @@ CultriX/Qwen2.5-14B-Broca_bfloat16_51204ee25a629abfd6d5e77a850b5e7a36c78462_Fals CultriX/Qwen2.5-14B-Brocav3_bfloat16_6f3fe686a79dcbcd5835ca100e194c49f493167b_False,CultriX/Qwen2.5-14B-Brocav3,6f3fe686a79dcbcd5835ca100e194c49f493167b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.7642540094264,FALSE,IFEval,0.695177684100409,69.5177684100409,BBH,0.645235347618276,49.0491117834814,MATH Level 5,0.322507552870091,32.2507552870091,GPQA,0.359060402684564,14.5413870246085,MUSR,0.475635416666667,19.2544270833333,MMLU-PRO,0.531748670212766,47.9720744680851,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav3 (Merge),"",2,14.766,1.8167389899472 CultriX/Qwen2.5-14B-Brocav6_bfloat16_bd981505b6950df69216b260c3c0d86124fded7b_False,CultriX/Qwen2.5-14B-Brocav6,bd981505b6950df69216b260c3c0d86124fded7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.3175682007454,FALSE,IFEval,0.699523929839493,69.9523929839493,BBH,0.638883526662656,47.819224806074,MATH Level 5,0.29607250755287,29.607250755287,GPQA,0.36744966442953,15.6599552572707,MUSR,0.474208333333333,18.8760416666667,MMLU-PRO,0.531914893617021,47.9905437352246,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav6 (Merge),"",2,14.766,1.7914011355599 CultriX/Qwen2.5-14B-Brocav7_float16_06acee7f6e9796081ced6201001784907c77f96f_False,CultriX/Qwen2.5-14B-Brocav7,06acee7f6e9796081ced6201001784907c77f96f,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,38.5222137472979,FALSE,IFEval,0.67237152976325,67.237152976325,BBH,0.644402698132718,48.9053607833169,MATH Level 5,0.318731117824773,31.8731117824773,GPQA,0.36744966442953,15.6599552572707,MUSR,0.479604166666667,20.1505208333333,MMLU-PRO,0.525764627659575,47.3071808510638,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav7 (Merge),"",1,14.766,1.70134942259186 -CultriX/Qwen2.5-14B-Emerged_bfloat16_8bf0e31b23ee22858bbde2cee44dde88963f5084_False,CultriX/Qwen2.5-14B-Emerged,8bf0e31b23ee22858bbde2cee44dde88963f5084,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.6626166580798,FALSE,IFEval,0.700023714854364,70.0023714854364,BBH,0.626003368070331,45.9324193686847,MATH Level 5,0.307401812688822,30.7401812688822,GPQA,0.357382550335571,14.3176733780761,MUSR,0.46909375,18.4700520833333,MMLU-PRO,0.518617021276596,46.5130023640662,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,CultriX/Qwen2.5-14B-Emerged (Merge),"",0,14.766,1.80736016762088 +CultriX/Qwen2.5-14B-Emerged_bfloat16_8bf0e31b23ee22858bbde2cee44dde88963f5084_False,CultriX/Qwen2.5-14B-Emerged,8bf0e31b23ee22858bbde2cee44dde88963f5084,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.6626166580798,FALSE,IFEval,0.700023714854364,70.0023714854364,BBH,0.626003368070331,45.9324193686847,MATH Level 5,0.307401812688822,30.7401812688822,GPQA,0.357382550335571,14.3176733780761,MUSR,0.46909375,18.4700520833333,MMLU-PRO,0.518617021276596,46.5130023640662,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,CultriX/Qwen2.5-14B-Emerged (Merge),"",1,14.766,1.80736016762088 CultriX/Qwen2.5-14B-Emergedv3_bfloat16_f4df1b9c2bf37bbfd6b2e8f2ff244c6029a5d546_False,CultriX/Qwen2.5-14B-Emergedv3,f4df1b9c2bf37bbfd6b2e8f2ff244c6029a5d546,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,34.8420924559616,FALSE,IFEval,0.638849364131615,63.8849364131615,BBH,0.619072841105603,44.7316082426086,MATH Level 5,0.206948640483384,20.6948640483384,GPQA,0.360738255033557,14.7651006711409,MUSR,0.4728125,18.6015625,MMLU-PRO,0.517370345744681,46.3744828605201,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,CultriX/Qwen2.5-14B-Emergedv3 (Merge),"",1,14.766,1.91892827649725 CultriX/Qwen2.5-14B-FinalMerge_bfloat16_8fd624d0d8989a312d344772814da3575423897a_False,CultriX/Qwen2.5-14B-FinalMerge,8fd624d0d8989a312d344772814da3575423897a,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,28.0570148706014,FALSE,IFEval,0.489097816017057,48.9097816017057,BBH,0.571494531001145,38.1624794834235,MATH Level 5,0.130664652567976,13.0664652567976,GPQA,0.354865771812081,13.9821029082774,MUSR,0.43790625,14.5049479166667,MMLU-PRO,0.457446808510638,39.7163120567376,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-22,2024-12-23,1,CultriX/Qwen2.5-14B-FinalMerge (Merge),"",1,14.766,1.94394149594043 CultriX/Qwen2.5-14B-MegaMerge-pt2_bfloat16_20397f6cafc09c2cb74f105867cd99b3c68c71dc_False,CultriX/Qwen2.5-14B-MegaMerge-pt2,20397f6cafc09c2cb74f105867cd99b3c68c71dc,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.6943142526711,FALSE,IFEval,0.568307645935008,56.8307645935008,BBH,0.657770333051015,50.9079030473653,MATH Level 5,0.273413897280967,27.3413897280967,GPQA,0.379194630872483,17.2259507829978,MUSR,0.472875,18.7427083333333,MMLU-PRO,0.542054521276596,49.1171690307329,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-24,2024-10-25,1,CultriX/Qwen2.5-14B-MegaMerge-pt2 (Merge),apache-2.0,2,14.766,2.25043378483341 @@ -266,6 +266,7 @@ DreadPoor/Aurora_faustus-8B-LORABLATED_bfloat16_97746081f7c681dcf7fad10c57de9a34 DreadPoor/Aurora_faustus-8B-LORABLATED_ALT_float16_3ca36587d26bfd936aa1358adc1eabf377aa1e98_True,DreadPoor/Aurora_faustus-8B-LORABLATED_ALT,3ca36587d26bfd936aa1358adc1eabf377aa1e98,float16,basemergesandmoerges,Original,LlamaForCausalLM,28.9341526463057,TRUE,IFEval,0.737792390856261,73.7792390856261,BBH,0.538767072119121,34.2115201181568,MATH Level 5,0.154078549848943,15.4078549848943,GPQA,0.298657718120805,6.48769574944072,MUSR,0.422520833333333,13.7817708333333,MMLU-PRO,0.369431515957447,29.936835106383,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-29,0,Removed,"",0,8.03,0.795116097836909 DreadPoor/BaeZel-8B-LINEAR_bfloat16_1deac3287de191794c50543d69d523f43654a803_True,DreadPoor/BaeZel-8B-LINEAR,1deac3287de191794c50543d69d523f43654a803,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,30.2964594445972,TRUE,IFEval,0.737792390856261,73.7792390856261,BBH,0.546380055432138,35.535376069864,MATH Level 5,0.178247734138973,17.8247734138973,GPQA,0.321308724832215,9.50782997762864,MUSR,0.422708333333333,13.3385416666667,MMLU-PRO,0.386136968085106,31.7929964539007,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-08,2024-11-08,1,DreadPoor/BaeZel-8B-LINEAR (Merge),apache-2.0,1,8.03,0.665068820106972 DreadPoor/BaeZel-8B-Model_Stock_bfloat16_cb6aa300413e77d5e3ce97373ba3df0a0f1f374c_True,DreadPoor/BaeZel-8B-Model_Stock,cb6aa300413e77d5e3ce97373ba3df0a0f1f374c,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,29.9709105793553,TRUE,IFEval,0.771314556487897,77.1314556487897,BBH,0.540768055021693,34.6436329400534,MATH Level 5,0.160876132930514,16.0876132930514,GPQA,0.313758389261745,8.50111856823266,MUSR,0.419916666666667,11.45625,MMLU-PRO,0.388048537234043,32.0053930260047,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-28,2024-12-29,1,DreadPoor/BaeZel-8B-Model_Stock (Merge),apache-2.0,1,8.03,0.662303005645527 +DreadPoor/BaeZel_V3-8B-Model_Stock_bfloat16_65014ed04553da3c0e126e7b1d29705120cdd3e6_True,DreadPoor/BaeZel_V3-8B-Model_Stock,65014ed04553da3c0e126e7b1d29705120cdd3e6,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,30.5555492913144,TRUE,IFEval,0.783179740865348,78.3179740865348,BBH,0.539231076759135,34.4086587964804,MATH Level 5,0.1797583081571,17.97583081571,GPQA,0.320469798657718,9.39597315436242,MUSR,0.4174375,11.1463541666667,MMLU-PRO,0.388796542553192,32.0885047281324,TRUE,TRUE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,DreadPoor/BaeZel_V3-8B-Model_Stock (Merge),apache-2.0,1,8.03,0.662295385777838 DreadPoor/Casuar-9B-Model_Stock_bfloat16_d69d1242cef7da8da9be79796649529a4e42adf0_True,DreadPoor/Casuar-9B-Model_Stock,d69d1242cef7da8da9be79796649529a4e42adf0,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,30.2323823814163,TRUE,IFEval,0.776485281275904,77.6485281275904,BBH,0.610668187730687,43.9272676831237,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.344798657718121,12.6398210290828,MUSR,0.416541666666667,11.2010416666667,MMLU-PRO,0.415641622340426,35.0712913711584,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-20,2024-12-21,1,DreadPoor/Casuar-9B-Model_Stock (Merge),apache-2.0,2,9.242,1.65042822526681 DreadPoor/Condensed_Milk-8B-Model_Stock_bfloat16_6e5b73099b9d5a794c9c744c4c5c158b1feb8916_True,DreadPoor/Condensed_Milk-8B-Model_Stock,6e5b73099b9d5a794c9c744c4c5c158b1feb8916,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,30.0705832175764,TRUE,IFEval,0.753629259254334,75.3629259254334,BBH,0.543486412212191,35.120620252448,MATH Level 5,0.173716012084592,17.3716012084592,GPQA,0.321308724832215,9.50782997762864,MUSR,0.416010416666667,11.1013020833333,MMLU-PRO,0.387632978723404,31.959219858156,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-27,0,Removed,"",0,8.03,0.654664190642245 DreadPoor/CoolerCoder-8B-LINEAR_bfloat16_db14b0fa821b0b6b07802111fd19ba722344a32b_True,DreadPoor/CoolerCoder-8B-LINEAR,db14b0fa821b0b6b07802111fd19ba722344a32b,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,19.1480108797525,TRUE,IFEval,0.451928660398853,45.1928660398853,BBH,0.476150483549654,26.365382993394,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.290268456375839,5.36912751677852,MUSR,0.396354166666667,7.77760416666667,MMLU-PRO,0.315907579787234,23.9897310874705,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-20,0,Removed,"",0,8.03,1.44402112216066 @@ -299,8 +300,8 @@ DreadPoor/WIP_Damascus-8B-TIES_bfloat16_c7720a0b0a8d24e62bf71b0e955b1aca8e62f1cb DreadPoor/felix_dies-mistral-7B-model_stock_bfloat16_bb317aa7565625327e18c5158aebd4710aa1d925_False,DreadPoor/felix_dies-mistral-7B-model_stock,bb317aa7565625327e18c5158aebd4710aa1d925,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,18.1018281017421,FALSE,IFEval,0.300778600779266,30.0778600779266,BBH,0.490091807352742,28.8907980509645,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.291946308724832,5.59284116331097,MUSR,0.451822916666667,15.4778645833333,MMLU-PRO,0.310920877659575,23.4356530732861,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-30,0,Removed,"",0,7.242,0.661571667363575 DreadPoor/remember_to_breathe-8b-Model-Stock_bfloat16_fa88f1b06cf9ca7bd0d859c6a4b2240485363ae0_True,DreadPoor/remember_to_breathe-8b-Model-Stock,fa88f1b06cf9ca7bd0d859c6a4b2240485363ae0,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,28.1684073595337,TRUE,IFEval,0.710415032114789,71.0415032114789,BBH,0.541165443559992,34.6789907623163,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.301174496644295,6.82326621923937,MUSR,0.414458333333333,11.440625,MMLU-PRO,0.37608045212766,30.6756057919622,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-06,0,Removed,"",0,8.03,0.663540162076869 EVA-UNIT-01/EVA-Qwen2.5-14B-v0.2_bfloat16__False,EVA-UNIT-01/EVA-Qwen2.5-14B-v0.2,"",bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,33.7748419372041,FALSE,IFEval,0.403842914577765,40.3842914577765,BBH,0.609023754004659,43.6078492579707,MATH Level 5,0.338368580060423,33.8368580060423,GPQA,0.394295302013423,19.2393736017897,MUSR,0.479447916666667,19.6309895833333,MMLU-PRO,0.513547207446809,45.9496897163121,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-06,2024-12-26,1,Qwen/Qwen2.5-14B,apache-2.0,13,14.77,2.3326730254844 -EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2_bfloat16_2590214b30391392b9a84e7cbe40fff3a92c6814_True,EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2,2590214b30391392b9a84e7cbe40fff3a92c6814,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,43.5418377172999,TRUE,IFEval,0.687883704127271,68.7883704127271,BBH,0.708801222804876,59.0667326828602,MATH Level 5,0.390483383685801,39.0483383685801,GPQA,0.408557046979866,21.1409395973154,MUSR,0.471979166666667,19.7307291666667,MMLU-PRO,0.581283244680851,53.4759160756501,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-27,1,Qwen/Qwen2.5-72B,other,11,72.706,22.95509846631 -EleutherAI/gpt-j-6b_bfloat16_47e169305d2e8376be1d31e765533382721b2cc1_False,EleutherAI/gpt-j-6b,47e169305d2e8376be1d31e765533382721b2cc1,bfloat16,pretrained,Original,GPTJForCausalLM,6.55782365211081,FALSE,IFEval,0.252218557870894,25.2218557870894,BBH,0.319104443103728,4.91281806832369,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.245805369127517,0,MUSR,0.36575,5.25208333333333,MMLU-PRO,0.124085771276596,2.67619680851064,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-19,0,EleutherAI/gpt-j-6b,apache-2.0,1467,6,0.767432156385538 +EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2_bfloat16_2590214b30391392b9a84e7cbe40fff3a92c6814_True,EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2,2590214b30391392b9a84e7cbe40fff3a92c6814,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,43.5418377172999,TRUE,IFEval,0.687883704127271,68.7883704127271,BBH,0.708801222804876,59.0667326828602,MATH Level 5,0.390483383685801,39.0483383685801,GPQA,0.408557046979866,21.1409395973154,MUSR,0.471979166666667,19.7307291666667,MMLU-PRO,0.581283244680851,53.4759160756501,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-27,1,Qwen/Qwen2.5-72B,other,12,72.706,22.95509846631 +EleutherAI/gpt-j-6b_bfloat16_47e169305d2e8376be1d31e765533382721b2cc1_False,EleutherAI/gpt-j-6b,47e169305d2e8376be1d31e765533382721b2cc1,bfloat16,pretrained,Original,GPTJForCausalLM,6.55782365211081,FALSE,IFEval,0.252218557870894,25.2218557870894,BBH,0.319104443103728,4.91281806832369,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.245805369127517,0,MUSR,0.36575,5.25208333333333,MMLU-PRO,0.124085771276596,2.67619680851064,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-19,0,EleutherAI/gpt-j-6b,apache-2.0,1468,6,0.767432156385538 EleutherAI/gpt-neo-1.3B_bfloat16_dbe59a7f4a88d01d1ba9798d78dbe3fe038792c8_False,EleutherAI/gpt-neo-1.3B,dbe59a7f4a88d01d1ba9798d78dbe3fe038792c8,bfloat16,pretrained,Original,GPTNeoForCausalLM,5.34073838155464,FALSE,IFEval,0.207905025332784,20.7905025332784,BBH,0.303923158693564,3.02456918093099,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.255872483221477,0.782997762863532,MUSR,0.38165625,4.87369791666667,MMLU-PRO,0.116356382978723,1.81737588652482,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,EleutherAI/gpt-neo-1.3B,mit,271,1.366,0.359424061519048 EleutherAI/gpt-neo-125m_bfloat16_21def0189f5705e2521767faed922f1f15e7d7db_False,EleutherAI/gpt-neo-125m,21def0189f5705e2521767faed922f1f15e7d7db,bfloat16,pretrained,Original,GPTNeoForCausalLM,4.3821456739786,FALSE,IFEval,0.190544422133273,19.0544422133273,BBH,0.311515688579152,3.4367389514267,MATH Level 5,0.00453172205438066,0.453172205438066,GPQA,0.253355704697987,0.447427293064876,MUSR,0.359333333333333,2.61666666666667,MMLU-PRO,0.102559840425532,0.28442671394799,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-10,0,EleutherAI/gpt-neo-125m,mit,192,0.15,0.202902486593259 EleutherAI/gpt-neo-2.7B_bfloat16_e24fa291132763e59f4a5422741b424fb5d59056_False,EleutherAI/gpt-neo-2.7B,e24fa291132763e59f4a5422741b424fb5d59056,bfloat16,pretrained,Original,GPTNeoForCausalLM,6.3555191000811,FALSE,IFEval,0.258962885144749,25.8962885144749,BBH,0.313951603331525,4.17860266708101,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.265939597315436,2.12527964205817,MUSR,0.355364583333333,3.52057291666667,MMLU-PRO,0.116273271276596,1.80814125295508,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,EleutherAI/gpt-neo-2.7B,mit,455,2.718,0.508381401623291 @@ -316,7 +317,7 @@ Enno-Ai/EnnoAi-Pro-Llama-3-8B-v0.3_bfloat16_cf29b8b484a909132e3a1f85ce891d28347c Enno-Ai/EnnoAi-Pro-Llama-3.1-8B-v0.9_bfloat16_c740871122fd471a1a225cf2b4368e333752d74c_True,Enno-Ai/EnnoAi-Pro-Llama-3.1-8B-v0.9,c740871122fd471a1a225cf2b4368e333752d74c,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.9456940802696,TRUE,IFEval,0.468914701879901,46.8914701879901,BBH,0.416027208361901,17.4982963743828,MATH Level 5,0,0,GPQA,0.265939597315436,2.12527964205817,MUSR,0.383177083333333,5.43046875,MMLU-PRO,0.259557845744681,17.7286495271868,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-22,2024-09-06,0,Enno-Ai/EnnoAi-Pro-Llama-3.1-8B-v0.9,apache-2.0,0,8.03,0.932571245200544 EnnoAi/EnnoAi-Pro-Llama-3.1-8B-v1.0_bfloat16_c740871122fd471a1a225cf2b4368e333752d74c_True,EnnoAi/EnnoAi-Pro-Llama-3.1-8B-v1.0,c740871122fd471a1a225cf2b4368e333752d74c,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.9710896602936,TRUE,IFEval,0.470438436681339,47.0438436681339,BBH,0.416027208361901,17.4982963743828,MATH Level 5,0,0,GPQA,0.265939597315436,2.12527964205817,MUSR,0.383177083333333,5.43046875,MMLU-PRO,0.259557845744681,17.7286495271868,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-22,2024-09-06,0,EnnoAi/EnnoAi-Pro-Llama-3.1-8B-v1.0,apache-2.0,0,8.03,0.94564159228199 Epiculous/Azure_Dusk-v0.2_bfloat16_ebddf1b2efbe7f9cae066d263b0991ded89c88e8_True,Epiculous/Azure_Dusk-v0.2,ebddf1b2efbe7f9cae066d263b0991ded89c88e8,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,14.0508272195609,TRUE,IFEval,0.346715603487635,34.6715603487635,BBH,0.41197218735536,17.3964143923793,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.260906040268456,1.45413870246085,MUSR,0.383458333333333,6.365625,MMLU-PRO,0.303440824468085,22.6045360520095,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-09,2024-09-14,0,Epiculous/Azure_Dusk-v0.2,apache-2.0,7,12.248,1.99141139139846 -Epiculous/Crimson_Dawn-v0.2_bfloat16_4cceb1e25026afef241ad5325097e88eccd8f37a_True,Epiculous/Crimson_Dawn-v0.2,4cceb1e25026afef241ad5325097e88eccd8f37a,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,14.8845408807215,TRUE,IFEval,0.310345438990767,31.0345438990767,BBH,0.448237964896454,21.6882485139553,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.276006711409396,3.4675615212528,MUSR,0.415177083333333,10.8971354166667,MMLU-PRO,0.272107712765957,19.1230791962175,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-02,2024-09-05,0,Epiculous/Crimson_Dawn-v0.2,apache-2.0,10,12.248,3.49238397097534 +Epiculous/Crimson_Dawn-v0.2_bfloat16_4cceb1e25026afef241ad5325097e88eccd8f37a_True,Epiculous/Crimson_Dawn-v0.2,4cceb1e25026afef241ad5325097e88eccd8f37a,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,14.8845408807215,TRUE,IFEval,0.310345438990767,31.0345438990767,BBH,0.448237964896454,21.6882485139553,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.276006711409396,3.4675615212528,MUSR,0.415177083333333,10.8971354166667,MMLU-PRO,0.272107712765957,19.1230791962175,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-02,2024-09-05,0,Epiculous/Crimson_Dawn-v0.2,apache-2.0,11,12.248,3.49238397097534 Epiculous/NovaSpark_bfloat16_a46340895859e470c3e69661f0b894677cf4c5cb_True,Epiculous/NovaSpark,a46340895859e470c3e69661f0b894677cf4c5cb,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.2285617567326,TRUE,IFEval,0.640847396020337,64.0847396020337,BBH,0.50639586637683,29.526910688444,MATH Level 5,0.150302114803625,15.0302114803625,GPQA,0.297818791946309,6.3758389261745,MUSR,0.388197916666667,6.92473958333333,MMLU-PRO,0.364860372340426,29.4289302600473,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-13,2024-10-20,1,Epiculous/NovaSpark (Merge),apache-2.0,7,8.03,0.818185024708442 Epiculous/Violet_Twilight-v0.2_bfloat16_30c8bad3c1f565150afbf2fc90cacf4f45d096f6_True,Epiculous/Violet_Twilight-v0.2,30c8bad3c1f565150afbf2fc90cacf4f45d096f6,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,18.5527734874264,TRUE,IFEval,0.45317756885065,45.317756885065,BBH,0.461455247684589,23.9405372559019,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.265939597315436,2.12527964205817,MUSR,0.4299375,13.6088541666667,MMLU-PRO,0.31108710106383,23.4541223404255,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-12,2024-09-16,0,Epiculous/Violet_Twilight-v0.2,apache-2.0,22,12.248,1.77043599040323 EpistemeAI/Alpaca-Llama3.1-8B_float16_3152dfa17322dff7c6af6dbf3daceaf5db51e230_False,EpistemeAI/Alpaca-Llama3.1-8B,3152dfa17322dff7c6af6dbf3daceaf5db51e230,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.9221057683322,FALSE,IFEval,0.159869147196106,15.9869147196106,BBH,0.475526085397429,25.9352265551177,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.290268456375839,5.36912751677852,MUSR,0.340260416666667,6.59921875,MMLU-PRO,0.324634308510638,24.9593676122931,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-11,2024-08-13,2,meta-llama/Meta-Llama-3.1-8B,apache-2.0,0,8,0.920852587327145 @@ -382,6 +383,7 @@ FlofloB/40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit_flo FlofloB/83k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit_float16_4c4d3660d0288295f89880a3a86f4eb9ecc9d344_True,FlofloB/83k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit,4c4d3660d0288295f89880a3a86f4eb9ecc9d344,float16,continuouslypretrained,Original,Qwen2ForCausalLM,7.92393644843285,TRUE,IFEval,0.286939764269915,28.6939764269915,BBH,0.334653407016045,8.13227333094577,MATH Level 5,0,0,GPQA,0.273489932885906,3.13199105145414,MUSR,0.328947916666667,1.41848958333333,MMLU-PRO,0.155501994680851,6.16688829787234,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-26,2024-11-26,3,Qwen/Qwen2.5-0.5B,apache-2.0,2,0.5,0.492186391170671 FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected_float16_381cdec29375aeaf0fb1bcc8ab2218443fc1cadd_False,FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected,381cdec29375aeaf0fb1bcc8ab2218443fc1cadd,float16,pretrained,Original,LlamaForCausalLM,3.36614510698747,FALSE,IFEval,0.134515308270943,13.4515308270943,BBH,0.2927186496606,2.3223515642593,MATH Level 5,0,0,GPQA,0.250838926174497,0.111856823266221,MUSR,0.36603125,2.85390625,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,HuggingFaceTB/SmolLM2-135M,apache-2.0,1,0.135,0.341144816261861 FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected_float16_ecac44607d60c294b460a8786f6253d561f3de85_False,FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected,ecac44607d60c294b460a8786f6253d561f3de85,float16,pretrained,Original,LlamaForCausalLM,4.27403784467981,FALSE,IFEval,0.158420768006667,15.8420768006667,BBH,0.292517172055552,2.0734660328778,MATH Level 5,0,0,GPQA,0.254194630872483,0.559284116331097,MUSR,0.382,5.41666666666667,MMLU-PRO,0.11577460106383,1.75273345153664,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-09,2025-01-09,2,HuggingFaceTB/SmolLM2-135M,apache-2.0,1,0.135,0.335764947536955 +FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected_float16_66e4931a5409bb8739522ff5df3b4f3373738fad_False,FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected,66e4931a5409bb8739522ff5df3b4f3373738fad,float16,pretrained,Original,LlamaForCausalLM,4.53172520867728,FALSE,IFEval,0.160593890876208,16.0593890876208,BBH,0.29834447696551,2.16515642593,MATH Level 5,0,0,GPQA,0.260906040268456,1.45413870246085,MUSR,0.384635416666667,5.71276041666667,MMLU-PRO,0.116190159574468,1.79890661938534,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-09,2025-01-09,3,HuggingFaceTB/SmolLM2-135M,apache-2.0,0,0.135,0.337787917026515 FlofloB/smollm2_pretrained_200k_fineweb_float16_c3086ab3555e766f0b3903b8b9a1a290e3e25f3d_False,FlofloB/smollm2_pretrained_200k_fineweb,c3086ab3555e766f0b3903b8b9a1a290e3e25f3d,float16,pretrained,Original,LlamaForCausalLM,3.94265871187253,FALSE,IFEval,0.152700390519377,15.2700390519377,BBH,0.299468427221449,2.87252300062131,MATH Level 5,0,0,GPQA,0.24748322147651,0,MUSR,0.3699375,3.7421875,MMLU-PRO,0.115940824468085,1.77120271867612,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,HuggingFaceTB/SmolLM2-135M,apache-2.0,1,0.135,0.329732062205357 FlofloB/test_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit_float16_cfd97ca5927a2e09ec30001a576d82dd8b635e09_True,FlofloB/test_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit,cfd97ca5927a2e09ec30001a576d82dd8b635e09,float16,continuouslypretrained,Original,MistralForCausalLM,24.4605262218316,TRUE,IFEval,0.521546164177715,52.1546164177715,BBH,0.524082918977825,32.8824331703226,MATH Level 5,0.108761329305136,10.8761329305136,GPQA,0.311241610738255,8.165548098434,MUSR,0.424416666666667,12.4520833333333,MMLU-PRO,0.372091090425532,30.2323433806147,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-21,1,unsloth/phi-3-mini-4k-instruct-bnb-4bit,apache-2.0,1,16,1.00880120220156 FuJhen/ft-openhermes-25-mistral-7b-irca-dpo-pairs_bfloat16_24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33_True,FuJhen/ft-openhermes-25-mistral-7b-irca-dpo-pairs,24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33,bfloat16,chatmodels,Adapter,?,19.6155249432558,TRUE,IFEval,0.542004104664512,54.2004104664513,BBH,0.477303238955481,26.5968609704319,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.278523489932886,3.80313199105145,MUSR,0.417375,11.2052083333333,MMLU-PRO,0.295628324468085,21.7364804964539,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-12,2024-09-12,1,FuJhen/ft-openhermes-25-mistral-7b-irca-dpo-pairs (Merge),apache-2.0,0,14.483,1.00204821775228 @@ -440,15 +442,15 @@ HuggingFaceTB/SmolLM-360M_bfloat16_318cc630b73730bfd712e5873063156ffb8936b5_Fals HuggingFaceTB/SmolLM-360M-Instruct_bfloat16_8e951de8c220295ea4f85d078c4e320df7137535_True,HuggingFaceTB/SmolLM-360M-Instruct,8e951de8c220295ea4f85d078c4e320df7137535,bfloat16,chatmodels,Original,LlamaForCausalLM,4.70678415207999,TRUE,IFEval,0.195165494221998,19.5165494221998,BBH,0.288511143632177,2.08037429085374,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.347177083333333,2.89713541666667,MMLU-PRO,0.116605718085106,1.84507978723404,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-15,2024-08-20,1,HuggingFaceTB/SmolLM-360M,apache-2.0,77,0.362,0.366501024298985 HuggingFaceTB/SmolLM2-1.7B_bfloat16_4fa12cab4f5f53670b05125fb9d2873af587d231_False,HuggingFaceTB/SmolLM2-1.7B,4fa12cab4f5f53670b05125fb9d2873af587d231,bfloat16,pretrained,Original,LlamaForCausalLM,9.49550422402913,FALSE,IFEval,0.244000363480011,24.4000363480011,BBH,0.345259437716626,9.30178845955168,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.279362416107383,3.91498881431767,MUSR,0.348541666666667,4.60104166666667,MMLU-PRO,0.21376329787234,12.64036643026,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-30,2024-11-06,0,HuggingFaceTB/SmolLM2-1.7B,apache-2.0,88,1.71,0.325025991140308 HuggingFaceTB/SmolLM2-1.7B-Instruct_bfloat16_d1bb90bcfbe0f211109880f4da18da66f229c4f6_True,HuggingFaceTB/SmolLM2-1.7B-Instruct,d1bb90bcfbe0f211109880f4da18da66f229c4f6,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7453390971056,TRUE,IFEval,0.536783512192095,53.6783512192095,BBH,0.359861753141516,10.9179892262081,MATH Level 5,0.0415407854984894,4.15407854984894,GPQA,0.279362416107383,3.91498881431767,MUSR,0.342125,4.09895833333334,MMLU-PRO,0.205369015957447,11.7076684397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-1.7B-Instruct (Merge),apache-2.0,465,1.711,0.63234061656892 -HuggingFaceTB/SmolLM2-135M_bfloat16_28e66ca6931668447a3bac213f23d990ad3b0e2b_False,HuggingFaceTB/SmolLM2-135M,28e66ca6931668447a3bac213f23d990ad3b0e2b,bfloat16,pretrained,Original,LlamaForCausalLM,5.55767745404167,FALSE,IFEval,0.183300309844546,18.3300309844546,BBH,0.304423424687714,3.70807758683998,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.248322147651007,0,MUSR,0.411177083333333,10.03046875,MMLU-PRO,0.109458111702128,1.05090130023641,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,0,HuggingFaceTB/SmolLM2-135M,apache-2.0,44,0.135,0.333904566630153 -HuggingFaceTB/SmolLM2-135M-Instruct_bfloat16_5a33ba103645800d7b3790c4448546c1b73efc71_True,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,bfloat16,chatmodels,Original,LlamaForCausalLM,6.46736472035882,TRUE,IFEval,0.288313896018121,28.8313896018121,BBH,0.312432132806668,4.72080766080528,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.235738255033557,0,MUSR,0.36621875,3.67734375,MMLU-PRO,0.111452792553191,1.27253250591016,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,85,0.135,0.338375628206877 -HuggingFaceTB/SmolLM2-135M-Instruct_float16_5a33ba103645800d7b3790c4448546c1b73efc71_False,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.99259897065637,FALSE,IFEval,0.0592516744460254,5.92516744460254,BBH,0.313475029473359,4.79627574466244,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.234060402684564,0,MUSR,0.387145833333333,6.05989583333334,MMLU-PRO,0.109208776595745,1.02319739952719,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-14,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,85,0.135,0.348753843693507 +HuggingFaceTB/SmolLM2-135M_bfloat16_28e66ca6931668447a3bac213f23d990ad3b0e2b_False,HuggingFaceTB/SmolLM2-135M,28e66ca6931668447a3bac213f23d990ad3b0e2b,bfloat16,pretrained,Original,LlamaForCausalLM,5.55767745404167,FALSE,IFEval,0.183300309844546,18.3300309844546,BBH,0.304423424687714,3.70807758683998,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.248322147651007,0,MUSR,0.411177083333333,10.03046875,MMLU-PRO,0.109458111702128,1.05090130023641,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,0,HuggingFaceTB/SmolLM2-135M,apache-2.0,45,0.135,0.333904566630153 +HuggingFaceTB/SmolLM2-135M-Instruct_bfloat16_5a33ba103645800d7b3790c4448546c1b73efc71_True,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,bfloat16,chatmodels,Original,LlamaForCausalLM,6.46736472035882,TRUE,IFEval,0.288313896018121,28.8313896018121,BBH,0.312432132806668,4.72080766080528,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.235738255033557,0,MUSR,0.36621875,3.67734375,MMLU-PRO,0.111452792553191,1.27253250591016,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,86,0.135,0.338375628206877 +HuggingFaceTB/SmolLM2-135M-Instruct_float16_5a33ba103645800d7b3790c4448546c1b73efc71_False,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.99259897065637,FALSE,IFEval,0.0592516744460254,5.92516744460254,BBH,0.313475029473359,4.79627574466244,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.234060402684564,0,MUSR,0.387145833333333,6.05989583333334,MMLU-PRO,0.109208776595745,1.02319739952719,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-14,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,86,0.135,0.348753843693507 HuggingFaceTB/SmolLM2-360M_bfloat16_3ce05f63c246c44616da500b47b01f082f4d3bcc_False,HuggingFaceTB/SmolLM2-360M,3ce05f63c246c44616da500b47b01f082f4d3bcc,bfloat16,pretrained,Original,LlamaForCausalLM,6.10022494870461,FALSE,IFEval,0.211452279950531,21.1452279950531,BBH,0.323347804430236,5.54360315536951,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.245805369127517,0,MUSR,0.395427083333333,7.72838541666667,MMLU-PRO,0.116938164893617,1.882018321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,0,HuggingFaceTB/SmolLM2-360M,apache-2.0,29,0.36,0.386657809372346 HuggingFaceTB/SmolLM2-360M-Instruct_float16_4873f67095301d304753fae05bc09ec766634e50_False,HuggingFaceTB/SmolLM2-360M-Instruct,4873f67095301d304753fae05bc09ec766634e50,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,3.10001953986204,FALSE,IFEval,0.0830319108853398,8.30319108853398,BBH,0.305270340184432,3.29904732932332,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.26510067114094,2.01342281879195,MUSR,0.34228125,2.75182291666667,MMLU-PRO,0.112616356382979,1.40181737588652,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-14,0,HuggingFaceTB/SmolLM2-360M-Instruct,apache-2.0,68,0.362,0.392381869271762 HuggingFaceTB/SmolLM2-360M-Instruct_bfloat16_4873f67095301d304753fae05bc09ec766634e50_True,HuggingFaceTB/SmolLM2-360M-Instruct,4873f67095301d304753fae05bc09ec766634e50,bfloat16,chatmodels,Original,LlamaForCausalLM,8.00109713938091,TRUE,IFEval,0.38415958545548,38.415958545548,BBH,0.314350505388885,4.17386363636364,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.25503355704698,0.671140939597318,MUSR,0.346125,2.765625,MMLU-PRO,0.111702127659574,1.30023640661938,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,0,HuggingFaceTB/SmolLM2-360M-Instruct,apache-2.0,68,0.36,0.375819270764297 -HumanLLMs/Humanish-LLama3-8B-Instruct_bfloat16_42f73ada2b7fb16f18a75404d72b7911bf1e65ce_True,HumanLLMs/Humanish-LLama3-8B-Instruct,42f73ada2b7fb16f18a75404d72b7911bf1e65ce,bfloat16,chatmodels,Original,LlamaForCausalLM,22.5649106964196,TRUE,IFEval,0.649790334091322,64.9790334091322,BBH,0.496770966278965,28.012476599572,MATH Level 5,0.0959214501510574,9.59214501510574,GPQA,0.255872483221477,0.782997762863532,MUSR,0.35815625,2.00286458333333,MMLU-PRO,0.370179521276596,30.0199468085106,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-04,2024-10-05,1,meta-llama/Meta-Llama-3-8B-Instruct,llama3,5,8.03,0.748278140670569 +HumanLLMs/Humanish-LLama3-8B-Instruct_bfloat16_42f73ada2b7fb16f18a75404d72b7911bf1e65ce_True,HumanLLMs/Humanish-LLama3-8B-Instruct,42f73ada2b7fb16f18a75404d72b7911bf1e65ce,bfloat16,chatmodels,Original,LlamaForCausalLM,22.5649106964196,TRUE,IFEval,0.649790334091322,64.9790334091322,BBH,0.496770966278965,28.012476599572,MATH Level 5,0.0959214501510574,9.59214501510574,GPQA,0.255872483221477,0.782997762863532,MUSR,0.35815625,2.00286458333333,MMLU-PRO,0.370179521276596,30.0199468085106,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-04,2024-10-05,1,meta-llama/Meta-Llama-3-8B-Instruct,llama3,6,8.03,0.748278140670569 HumanLLMs/Humanish-Mistral-Nemo-Instruct-2407_bfloat16_45b80bdce8d447ef494af06751904afcc607eb37_True,HumanLLMs/Humanish-Mistral-Nemo-Instruct-2407,45b80bdce8d447ef494af06751904afcc607eb37,bfloat16,chatmodels,Original,MistralForCausalLM,23.0068996717315,TRUE,IFEval,0.545126929879387,54.5126929879387,BBH,0.526178077253261,32.7096134212256,MATH Level 5,0.0838368580060423,8.38368580060423,GPQA,0.287751677852349,5.03355704697987,MUSR,0.396760416666667,9.39505208333333,MMLU-PRO,0.352061170212766,28.0067966903073,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-10-06,2,mistralai/Mistral-Nemo-Base-2407,apache-2.0,6,12.248,1.6202833064409 -HumanLLMs/Humanish-Qwen2.5-7B-Instruct_bfloat16_7d2c71d926832d6e257ad2776011494dbac2d151_True,HumanLLMs/Humanish-Qwen2.5-7B-Instruct,7d2c71d926832d6e257ad2776011494dbac2d151,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.6653740968198,TRUE,IFEval,0.728425023382403,72.8425023382403,BBH,0.536368145780707,34.4789975866187,MATH Level 5,0,0,GPQA,0.298657718120805,6.48769574944072,MUSR,0.3980625,8.42447916666667,MMLU-PRO,0.439827127659575,37.7585697399527,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-05,2024-10-05,2,Qwen/Qwen2.5-7B,apache-2.0,5,7.616,1.19339271863324 +HumanLLMs/Humanish-Qwen2.5-7B-Instruct_bfloat16_7d2c71d926832d6e257ad2776011494dbac2d151_True,HumanLLMs/Humanish-Qwen2.5-7B-Instruct,7d2c71d926832d6e257ad2776011494dbac2d151,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.6653740968198,TRUE,IFEval,0.728425023382403,72.8425023382403,BBH,0.536368145780707,34.4789975866187,MATH Level 5,0,0,GPQA,0.298657718120805,6.48769574944072,MUSR,0.3980625,8.42447916666667,MMLU-PRO,0.439827127659575,37.7585697399527,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-05,2024-10-05,2,Qwen/Qwen2.5-7B,apache-2.0,6,7.616,1.19339271863324 IDEA-CCNL/Ziya-LLaMA-13B-v1_float16_64d931f346e1a49ea3bbca07a83137075bab1c66_False,IDEA-CCNL/Ziya-LLaMA-13B-v1,64d931f346e1a49ea3bbca07a83137075bab1c66,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,3.90642483860041,FALSE,IFEval,0.169686432000426,16.9686432000426,BBH,0.287702924454095,1.46361704609892,MATH Level 5,0,0,GPQA,0.249161073825503,0,MUSR,0.375052083333333,3.88151041666667,MMLU-PRO,0.110123005319149,1.12477836879433,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-16,2024-06-12,0,IDEA-CCNL/Ziya-LLaMA-13B-v1,gpl-3.0,273,13,1.10825743033459 INSAIT-Institute/BgGPT-Gemma-2-27B-IT-v1.0_float16_2ce5574f5d0daf61b39cffd80023dd73782b87e3_True,INSAIT-Institute/BgGPT-Gemma-2-27B-IT-v1.0,2ce5574f5d0daf61b39cffd80023dd73782b87e3,float16,continuouslypretrained,Original,Gemma2ForCausalLM,1.67806280680869,TRUE,IFEval,0,0,BBH,0.291177810298844,2.34704095752041,MATH Level 5,0,0,GPQA,0.26006711409396,1.34228187919463,MUSR,0.35753125,4.52473958333333,MMLU-PRO,0.116688829787234,1.85431442080378,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-15,2024-12-15,1,INSAIT-Institute/BgGPT-Gemma-2-27B-IT-v1.0 (Merge),gemma,14,27.227,10.3631218286217 IlyaGusev/gemma-2-2b-it-abliterated_float16__True,IlyaGusev/gemma-2-2b-it-abliterated,"",float16,chatmodels,Original,Gemma2ForCausalLM,15.711285136931,TRUE,IFEval,0.533086654521115,53.3086654521115,BBH,0.411860132621199,16.7963345046618,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.26510067114094,2.01342281879195,MUSR,0.3781875,4.90677083333334,MMLU-PRO,0.253823138297872,17.0914598108747,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-31,2025-01-07,0,IlyaGusev/gemma-2-2b-it-abliterated,gemma,44,2.614,2.5991223070719 @@ -719,7 +721,7 @@ Lyte/Llama-3.2-1B-Instruct-COT-RL-Expriement1-EP04_bfloat16_59d93307c6f2cb7a29c5 Lyte/Llama-3.2-3B-Overthinker_float16_0e7af37fb3381365905fc2df24811c0e6d2ba5b2_True,Lyte/Llama-3.2-3B-Overthinker,0e7af37fb3381365905fc2df24811c0e6d2ba5b2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.0778462402,TRUE,IFEval,0.640797528335926,64.0797528335926,BBH,0.432009309795252,20.0955822264572,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.259228187919463,1.23042505592841,MUSR,0.34190625,3.90494791666667,MMLU-PRO,0.298537234042553,22.0596926713948,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-17,2024-10-18,2,meta-llama/Llama-3.2-3B-Instruct,apache-2.0,19,3.213,0.733639697394509 M4-ai/TinyMistral-248M-v3_bfloat16_fa23fe617768c671f0bbbff1edf4556cfe844167_False,M4-ai/TinyMistral-248M-v3,fa23fe617768c671f0bbbff1edf4556cfe844167,bfloat16,pretrained,Original,MistralForCausalLM,4.13010760928209,FALSE,IFEval,0.163866319144315,16.3866319144315,BBH,0.288454993899557,1.77755393038632,MATH Level 5,0,0,GPQA,0.240771812080537,0,MUSR,0.379333333333333,5.15,MMLU-PRO,0.113198138297872,1.4664598108747,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-05,2024-10-18,0,M4-ai/TinyMistral-248M-v3,apache-2.0,5,0.248,0.234183611420779 MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis_float16_7a9d848188a674302d64a865786d4508be19571a_False,MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis,7a9d848188a674302d64a865786d4508be19571a,float16,fine-tunedondomain-specificdatasets,Adapter,?,3.81803368483764,FALSE,IFEval,0.0866290331874981,8.66290331874981,BBH,0.305728612437881,3.23777427104784,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.251677852348993,0.223713646532442,MUSR,0.40171875,8.61484375,MMLU-PRO,0.115442154255319,1.71579491725768,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-19,0,Removed,"",0,0.63,1.05155623119269 -MLP-KTLim/llama-3-Korean-Bllossom-8B_bfloat16_8a738f9f622ffc2b0a4a6b81dabbca80406248bf_True,MLP-KTLim/llama-3-Korean-Bllossom-8B,8a738f9f622ffc2b0a4a6b81dabbca80406248bf,bfloat16,chatmodels,Original,LlamaForCausalLM,20.333975762059,TRUE,IFEval,0.5112800702137,51.12800702137,BBH,0.490045564701877,26.9275279730551,MATH Level 5,0.0981873111782478,9.81873111782478,GPQA,0.26258389261745,1.67785234899329,MUSR,0.367458333333333,3.63229166666667,MMLU-PRO,0.359375,28.8194444444444,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-25,2024-07-09,1,MLP-KTLim/llama-3-Korean-Bllossom-8B (Merge),llama3,290,8.03,0.774720564334845 +MLP-KTLim/llama-3-Korean-Bllossom-8B_bfloat16_8a738f9f622ffc2b0a4a6b81dabbca80406248bf_True,MLP-KTLim/llama-3-Korean-Bllossom-8B,8a738f9f622ffc2b0a4a6b81dabbca80406248bf,bfloat16,chatmodels,Original,LlamaForCausalLM,20.333975762059,TRUE,IFEval,0.5112800702137,51.12800702137,BBH,0.490045564701877,26.9275279730551,MATH Level 5,0.0981873111782478,9.81873111782478,GPQA,0.26258389261745,1.67785234899329,MUSR,0.367458333333333,3.63229166666667,MMLU-PRO,0.359375,28.8194444444444,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-25,2024-07-09,1,MLP-KTLim/llama-3-Korean-Bllossom-8B (Merge),llama3,291,8.03,0.774720564334845 MTSAIR/Cotype-Nano_bfloat16_91817ff717dd16d216304fa9d749e08fce2aa38d_True,MTSAIR/Cotype-Nano,91817ff717dd16d216304fa9d749e08fce2aa38d,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,13.2588792361465,TRUE,IFEval,0.374792217981622,37.4792217981622,BBH,0.386494096960149,14.4468700232412,MATH Level 5,0.0641993957703928,6.41993957703928,GPQA,0.27013422818792,2.68456375838927,MUSR,0.328916666666667,2.11458333333333,MMLU-PRO,0.247672872340426,16.4080969267139,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-22,2024-12-01,0,MTSAIR/Cotype-Nano,other,46,1.544,0.49328801555598 MTSAIR/MultiVerse_70B_bfloat16_063430cdc4d972a0884e3e3e3d45ea4afbdf71a2_False,MTSAIR/MultiVerse_70B,063430cdc4d972a0884e3e3e3d45ea4afbdf71a2,bfloat16,chatmodels,Original,LlamaForCausalLM,32.0051903084749,FALSE,IFEval,0.524918327814643,52.4918327814643,BBH,0.618313428493118,46.135898982415,MATH Level 5,0.178247734138973,17.8247734138973,GPQA,0.354026845637584,13.8702460850112,MUSR,0.473989583333333,18.8153645833333,MMLU-PRO,0.486037234042553,42.8930260047281,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-25,2024-06-29,0,MTSAIR/MultiVerse_70B,other,39,72.289,13.6018173834864 Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.1_bfloat16_1ed587f54f70334f495efb9c027acb03e96fe24f_True,Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.1,1ed587f54f70334f495efb9c027acb03e96fe24f,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,15.9289113532727,TRUE,IFEval,0.436141659685191,43.6141659685191,BBH,0.461510274452737,23.9901243984113,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.26258389261745,1.67785234899329,MUSR,0.327739583333333,0,MMLU-PRO,0.286319813829787,20.702201536643,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-06,2024-09-17,1,meta-llama/Meta-Llama-3-8B,llama3,4,8.03,0.8335691386634 @@ -785,7 +787,7 @@ MaziyarPanahi/calme-3.1-instruct-78b_bfloat16_7ccd7f1a55ae79af7969f721bb7055511c MaziyarPanahi/calme-3.1-llamaloi-3b_bfloat16_62547548c06bb22f0b82c2bda7ac466507314a4b_True,MaziyarPanahi/calme-3.1-llamaloi-3b,62547548c06bb22f0b82c2bda7ac466507314a4b,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.0052338092847,TRUE,IFEval,0.73751756450662,73.751756450662,BBH,0.458734000499888,23.7691655758483,MATH Level 5,0.167673716012085,16.7673716012085,GPQA,0.281040268456376,4.13870246085012,MUSR,0.351520833333333,1.10677083333333,MMLU-PRO,0.320478723404255,24.4976359338062,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,meta-llama/Llama-3.2-3B,llama3.2,1,3.213,1.19291766447292 MaziyarPanahi/calme-3.2-baguette-3b_bfloat16_bba8e602432bd467b64cabf9cb62326893060e60_True,MaziyarPanahi/calme-3.2-baguette-3b,bba8e602432bd467b64cabf9cb62326893060e60,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1406481081638,TRUE,IFEval,0.633828242396841,63.3828242396841,BBH,0.470862269902714,25.8657466507311,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.294463087248322,5.92841163310962,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.333776595744681,25.9751773049645,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,1,3.085,0.776012497501503 MaziyarPanahi/calme-3.2-instruct-3b_bfloat16_12347f5991157e752de6ba9f773a1bbc22445e3a_True,MaziyarPanahi/calme-3.2-instruct-3b,12347f5991157e752de6ba9f773a1bbc22445e3a,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.6566062728784,TRUE,IFEval,0.553319636342682,55.3319636342682,BBH,0.486564111037674,27.9767982423931,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.283557046979866,4.47427293064877,MUSR,0.404697916666667,8.78723958333333,MMLU-PRO,0.365275930851064,29.475103427896,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,0,3.086,0.743433169169365 -MaziyarPanahi/calme-3.2-instruct-78b_bfloat16_731f4daf584f822f1393731ccff1d58c7f06b99e_True,MaziyarPanahi/calme-3.2-instruct-78b,731f4daf584f822f1393731ccff1d58c7f06b99e,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,52.0184433947031,TRUE,IFEval,0.806260721552148,80.6260721552148,BBH,0.731861627209267,62.6094432829016,MATH Level 5,0.399546827794562,39.9546827794562,GPQA,0.402684563758389,20.3579418344519,MUSR,0.602364583333333,38.52890625,MMLU-PRO,0.730302526595745,70.0336140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-28,1,Removed,other,50,77.965,33.0055653548694 +MaziyarPanahi/calme-3.2-instruct-78b_bfloat16_731f4daf584f822f1393731ccff1d58c7f06b99e_True,MaziyarPanahi/calme-3.2-instruct-78b,731f4daf584f822f1393731ccff1d58c7f06b99e,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,52.0184433947031,TRUE,IFEval,0.806260721552148,80.6260721552148,BBH,0.731861627209267,62.6094432829016,MATH Level 5,0.399546827794562,39.9546827794562,GPQA,0.402684563758389,20.3579418344519,MUSR,0.602364583333333,38.52890625,MMLU-PRO,0.730302526595745,70.0336140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-28,1,Removed,other,51,77.965,33.0055653548694 MaziyarPanahi/calme-3.3-baguette-3b_bfloat16_66f9438922503e5616b6b4488e96fd9342d5efb0_True,MaziyarPanahi/calme-3.3-baguette-3b,66f9438922503e5616b6b4488e96fd9342d5efb0,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,21.0626896485596,TRUE,IFEval,0.635951497581971,63.5951497581971,BBH,0.467821729595752,25.5965941060964,MATH Level 5,0,0,GPQA,0.280201342281879,4.0268456375839,MUSR,0.392822916666667,7.13619791666667,MMLU-PRO,0.334192154255319,26.0213504728132,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,1,3.086,0.746922918806257 MaziyarPanahi/calme-3.3-instruct-3b_bfloat16_ea7d7fb442c981ecd44c5a9060ac6b062927f231_True,MaziyarPanahi/calme-3.3-instruct-3b,ea7d7fb442c981ecd44c5a9060ac6b062927f231,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,21.5477931531294,TRUE,IFEval,0.642321263137364,64.2321263137364,BBH,0.469334094276887,25.6821378185791,MATH Level 5,0,0,GPQA,0.282718120805369,4.36241610738255,MUSR,0.407427083333333,9.39505208333333,MMLU-PRO,0.330535239361702,25.6150265957447,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,3,3.086,0.752548515201209 Minami-su/Amara-o1-7B-Qwen_bfloat16_835395d4e693cd8cfb5143f12fae53673164846f_True,Minami-su/Amara-o1-7B-Qwen,835395d4e693cd8cfb5143f12fae53673164846f,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,25.8535285767209,TRUE,IFEval,0.738991431623647,73.8991431623648,BBH,0.519942007788045,32.7968298710958,MATH Level 5,0,0,GPQA,0.293624161073826,5.8165548098434,MUSR,0.400666666666667,8.35,MMLU-PRO,0.408327792553192,34.2586436170213,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,0,Minami-su/Amara-o1-7B-Qwen,apache-2.0,1,7.616,0.637559535560653 @@ -816,7 +818,7 @@ NCSOFT/Llama-VARCO-8B-Instruct_bfloat16_fe2d9358a2d35451c04e4589b47e361cfacd350d NLPark/AnFeng_v3.1-Avocet_float16_5170739731033323e6e66a0f68d34790042a3b2a_False,NLPark/AnFeng_v3.1-Avocet,5170739731033323e6e66a0f68d34790042a3b2a,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,28.2776632974634,FALSE,IFEval,0.509631112115853,50.9631112115853,BBH,0.582852329074409,40.3090336514533,MATH Level 5,0.152567975830816,15.2567975830816,GPQA,0.324664429530201,9.95525727069351,MUSR,0.447572916666667,14.9799479166667,MMLU-PRO,0.443816489361702,38.2018321513002,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-03,2024-08-07,0,NLPark/AnFeng_v3.1-Avocet,cc-by-nc-nd-4.0,0,34.393,3.17200803334586 NLPark/B-and-W_Flycatcher-3AD1E_bfloat16_21044e39f6854f5a6df84c5074d449b7eb96b522_True,NLPark/B-and-W_Flycatcher-3AD1E,21044e39f6854f5a6df84c5074d449b7eb96b522,bfloat16,chatmodels,Original,LlamaForCausalLM,29.2840499717512,TRUE,IFEval,0.490846509483725,49.0846509483725,BBH,0.606511752853436,43.7424580109235,MATH Level 5,0.166918429003021,16.6918429003021,GPQA,0.330536912751678,10.738255033557,MUSR,0.442270833333333,13.8838541666667,MMLU-PRO,0.47406914893617,41.5632387706856,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-28,2024-09-28,0,NLPark/B-and-W_Flycatcher-3AD1E,apache-2.0,0,14.77,1.55132229692418 NLPark/Shi-Ci-Robin-Test_3AD80_bfloat16_995887837a259817570489183cbe8b1abffd23b1_True,NLPark/Shi-Ci-Robin-Test_3AD80,995887837a259817570489183cbe8b1abffd23b1,bfloat16,chatmodels,Original,LlamaForCausalLM,38.5165993626602,TRUE,IFEval,0.722654778210703,72.2654778210703,BBH,0.670480515757033,52.2656617511021,MATH Level 5,0.272658610271903,27.2658610271903,GPQA,0.35989932885906,14.6532438478747,MUSR,0.46959375,18.8658854166667,MMLU-PRO,0.512051196808511,45.7834663120567,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-25,2024-10-25,1,NLPark/Shi-Ci-Robin-Test_3AD80 (Merge),llama3.1,0,70.554,12.446754480357 -NTQAI/Nxcode-CQ-7B-orpo_bfloat16_74f3b3c06de36b261af9ef857279d6e33f893336_True,NTQAI/Nxcode-CQ-7B-orpo,74f3b3c06de36b261af9ef857279d6e33f893336,bfloat16,chatmodels,Original,Qwen2ForCausalLM,12.2982509985398,TRUE,IFEval,0.400721197533655,40.0721197533655,BBH,0.414302324917822,17.5800048700814,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.254194630872483,0.559284116331097,MUSR,0.39396875,7.04609375,MMLU-PRO,0.161153590425532,6.79484338061466,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-24,2024-08-10,0,NTQAI/Nxcode-CQ-7B-orpo,other,111,7.25,0.842174913393591 +NTQAI/Nxcode-CQ-7B-orpo_bfloat16_74f3b3c06de36b261af9ef857279d6e33f893336_True,NTQAI/Nxcode-CQ-7B-orpo,74f3b3c06de36b261af9ef857279d6e33f893336,bfloat16,chatmodels,Original,Qwen2ForCausalLM,12.2982509985398,TRUE,IFEval,0.400721197533655,40.0721197533655,BBH,0.414302324917822,17.5800048700814,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.254194630872483,0.559284116331097,MUSR,0.39396875,7.04609375,MMLU-PRO,0.161153590425532,6.79484338061466,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-24,2024-08-10,0,NTQAI/Nxcode-CQ-7B-orpo,other,112,7.25,0.842174913393591 NYTK/PULI-GPTrio_float16_16a56dd22d184e4b7b49d90461fa8d4810639463_False,NYTK/PULI-GPTrio,16a56dd22d184e4b7b49d90461fa8d4810639463,float16,pretrained,Original,GPTNeoXForCausalLM,5.77078732696787,FALSE,IFEval,0.217971648559156,21.7971648559156,BBH,0.306002909062375,3.0152211415705,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.265939597315436,2.12527964205817,MUSR,0.381875,5.334375,MMLU-PRO,0.113696808510638,1.52186761229314,TRUE,FALSE,FALSE,FALSE,FALSE,2023-06-08,2024-08-24,0,NYTK/PULI-GPTrio,cc-by-nc-4.0,10,7.673,0.722046995347682 NYTK/PULI-LlumiX-32K_float16_a589894397a36b61c578d0dd4778ee6e5fe471ff_False,NYTK/PULI-LlumiX-32K,a589894397a36b61c578d0dd4778ee6e5fe471ff,float16,continuouslypretrained,Original,LlamaForCausalLM,6.40581630535552,FALSE,IFEval,0.169961258350067,16.9961258350067,BBH,0.318935822429494,5.10704712990773,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.253355704697987,0.447427293064876,MUSR,0.396416666666667,7.71875,MMLU-PRO,0.168051861702128,7.56131796690307,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-12,2024-08-24,0,NYTK/PULI-LlumiX-32K,llama2,9,6.738,0.822569739962814 Naveenpoliasetty/llama3-8B-V2_float16_e0458381d02bc411b9e576796d185f23dcc11f71_False,Naveenpoliasetty/llama3-8B-V2,e0458381d02bc411b9e576796d185f23dcc11f71,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.8458629712676,FALSE,IFEval,0.412261687877055,41.2261687877055,BBH,0.518865758006506,30.8732094250396,MATH Level 5,0.0800604229607251,8.00604229607251,GPQA,0.290268456375839,5.36912751677852,MUSR,0.408135416666667,9.18359375,MMLU-PRO,0.373753324468085,30.4170360520095,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-18,2024-06-26,1,Naveenpoliasetty/llama3-8B-V2 (Merge),"",1,8.03,0.75201223968556 @@ -829,7 +831,7 @@ Nekochu/Luminia-8B-RP_float16_619be17206729d86b898b9d1b3369a7135c1a9b9_False,Nek NeverSleep/Lumimaid-v0.2-12B_bfloat16_b04f4e8f9a0c64fbb271d1135b208c90c3aa0ad0_False,NeverSleep/Lumimaid-v0.2-12B,b04f4e8f9a0c64fbb271d1135b208c90c3aa0ad0,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,17.7948471656574,FALSE,IFEval,0.109934972539528,10.9934972539528,BBH,0.539561052585082,34.4098894348544,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.314597315436242,8.61297539149888,MUSR,0.482114583333333,21.29765625,MMLU-PRO,0.351146941489362,27.9052157210402,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-25,2024-07-31,0,NeverSleep/Lumimaid-v0.2-12B,cc-by-nc-4.0,82,12.248,1.56419336368199 NeverSleep/Lumimaid-v0.2-8B_bfloat16_4563201f29ef18c62d16e9f6fffd3931a63ccb51_False,NeverSleep/Lumimaid-v0.2-8B,4563201f29ef18c62d16e9f6fffd3931a63ccb51,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.3868203470804,FALSE,IFEval,0.503810999259742,50.3810999259742,BBH,0.523776760122662,31.9633737811802,MATH Level 5,0.141993957703928,14.1993957703927,GPQA,0.311241610738255,8.165548098434,MUSR,0.430302083333333,12.32109375,MMLU-PRO,0.363613696808511,29.2904107565012,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-24,2024-08-09,0,NeverSleep/Lumimaid-v0.2-8B,cc-by-nc-4.0,67,8.03,0.73969553455627 Nexusflow/NexusRaven-V2-13B_bfloat16_cdab7132db4a4fd64513123374ea1451d85a7ace_False,Nexusflow/NexusRaven-V2-13B,cdab7132db4a4fd64513123374ea1451d85a7ace,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.31183115135613,FALSE,IFEval,0.179078179231107,17.9078179231107,BBH,0.394886046405073,15.3364483952296,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.26006711409396,1.34228187919463,MUSR,0.3736875,3.7109375,MMLU-PRO,0.187167553191489,9.68528368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-04,2024-06-12,1,codellama/CodeLlama-13b-Instruct-hf,other,466,13,1.08980491321583 -Nitral-AI/Captain-Eris_Violet-V0.420-12B_bfloat16_b1a87ce62601e19fff206a16590d28f009965799_False,Nitral-AI/Captain-Eris_Violet-V0.420-12B,b1a87ce62601e19fff206a16590d28f009965799,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,23.4755631156729,FALSE,IFEval,0.433918669131239,43.3918669131239,BBH,0.547809941761137,35.3269407502337,MATH Level 5,0.0981873111782477,9.81873111782477,GPQA,0.311241610738255,8.165548098434,MUSR,0.4330625,13.8994791666667,MMLU-PRO,0.372257313829787,30.2508126477541,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-16,2025-01-04,1,Nitral-AI/Captain-Eris_Violet-V0.420-12B (Merge),other,19,12.248,2.01942194101833 +Nitral-AI/Captain-Eris_Violet-V0.420-12B_bfloat16_b1a87ce62601e19fff206a16590d28f009965799_False,Nitral-AI/Captain-Eris_Violet-V0.420-12B,b1a87ce62601e19fff206a16590d28f009965799,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,23.4755631156729,FALSE,IFEval,0.433918669131239,43.3918669131239,BBH,0.547809941761137,35.3269407502337,MATH Level 5,0.0981873111782477,9.81873111782477,GPQA,0.311241610738255,8.165548098434,MUSR,0.4330625,13.8994791666667,MMLU-PRO,0.372257313829787,30.2508126477541,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-16,2025-01-04,1,Nitral-AI/Captain-Eris_Violet-V0.420-12B (Merge),other,20,12.248,2.01942194101833 Nitral-AI/Captain_BMO-12B_bfloat16_ba2950f1c9831c6aacd6141851e7b9724be6759a_False,Nitral-AI/Captain_BMO-12B,ba2950f1c9831c6aacd6141851e7b9724be6759a,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,23.0971914892988,FALSE,IFEval,0.475059508770063,47.5059508770063,BBH,0.528596065042497,32.4406978474883,MATH Level 5,0.132930513595166,13.2930513595166,GPQA,0.319630872483222,9.2841163310962,MUSR,0.374802083333333,7.51692708333334,MMLU-PRO,0.35688164893617,28.5424054373522,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-01,2025-01-04,0,Nitral-AI/Captain_BMO-12B,other,18,12.248,2.28723110704441 Nitral-AI/Hathor_Stable-v0.2-L3-8B_bfloat16_1c9f391c3e349f8ba51b5696290ee6db6a2b63fd_True,Nitral-AI/Hathor_Stable-v0.2-L3-8B,1c9f391c3e349f8ba51b5696290ee6db6a2b63fd,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.8424280376059,TRUE,IFEval,0.717484053422696,71.7484053422696,BBH,0.528581917830168,32.826028565586,MATH Level 5,0.100453172205438,10.0453172205438,GPQA,0.286912751677852,4.92170022371365,MUSR,0.3780625,5.5578125,MMLU-PRO,0.369597739361702,29.9553043735225,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-09,2024-07-02,0,Nitral-AI/Hathor_Stable-v0.2-L3-8B,other,59,8.03,0.808422964725621 Nohobby/MS-Schisandra-22B-v0.1_bfloat16_df698b7b740fb3b5193d61cd51e5e3a42c3b1e1c_False,Nohobby/MS-Schisandra-22B-v0.1,df698b7b740fb3b5193d61cd51e5e3a42c3b1e1c,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,29.6962364114623,FALSE,IFEval,0.633128986644326,63.3128986644326,BBH,0.578994971489652,40.0113996162222,MATH Level 5,0.197885196374622,19.7885196374622,GPQA,0.332214765100671,10.9619686800895,MUSR,0.39284375,9.70546875,MMLU-PRO,0.409574468085106,34.3971631205674,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-26,2024-10-30,1,Nohobby/MS-Schisandra-22B-v0.1 (Merge),other,5,22.247,1.6005536479262 @@ -847,12 +849,12 @@ NotASI/FineTome-Llama3.2-3B-1002_float16_7c8497a24a381e3bfd77bc92e5685442768790d NotASI/FineTome-v1.5-Llama3.2-1B-1007_float16_5e329d987e9f74dd2703a4fefa56ab8c72b5702b_True,NotASI/FineTome-v1.5-Llama3.2-1B-1007,5e329d987e9f74dd2703a4fefa56ab8c72b5702b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.94045538932633,TRUE,IFEval,0.392377779846363,39.2377779846363,BBH,0.324056711214857,5.80172467354176,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.25,0,MUSR,0.347458333333333,2.49895833333333,MMLU-PRO,0.142702792553192,4.74475472813239,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-07,2024-10-07,1,NotASI/FineTome-v1.5-Llama3.2-1B-1007 (Merge),llama3.2,1,1.236,0.474231520771542 NotASI/FineTome-v1.5-Llama3.2-3B-1007_float16_6c6e71fbcff6c00d04a3fd69084af20bf2a943c8_True,NotASI/FineTome-v1.5-Llama3.2-3B-1007,6c6e71fbcff6c00d04a3fd69084af20bf2a943c8,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,16.9626388108139,TRUE,IFEval,0.550771951754678,55.0771951754678,BBH,0.431237293532158,19.4572192788493,MATH Level 5,0.0551359516616314,5.51359516616314,GPQA,0.261744966442953,1.56599552572707,MUSR,0.364541666666667,4.06770833333333,MMLU-PRO,0.244847074468085,16.0941193853428,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-07,2024-10-07,1,NotASI/FineTome-v1.5-Llama3.2-3B-1007 (Merge),llama3.2,1,3.213,0.725378525425475 NousResearch/Hermes-2-Pro-Llama-3-8B_float16_bc265d1781299ed2045214289c927c207439a729_True,NousResearch/Hermes-2-Pro-Llama-3-8B,bc265d1781299ed2045214289c927c207439a729,float16,chatmodels,Original,LlamaForCausalLM,21.7049203338117,TRUE,IFEval,0.536183991808402,53.6183991808402,BBH,0.507112624310082,30.667993420825,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.292785234899329,5.70469798657718,MUSR,0.426239583333333,11.2466145833333,MMLU-PRO,0.305186170212766,22.798463356974,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-30,2024-06-13,1,NousResearch/Meta-Llama-3-8B,llama3,414,8.031,0.749983206264044 -NousResearch/Hermes-2-Pro-Mistral-7B_bfloat16_09317b1d8da639b5d9af77c06aa17cde0f0f91c0_True,NousResearch/Hermes-2-Pro-Mistral-7B,09317b1d8da639b5d9af77c06aa17cde0f0f91c0,bfloat16,chatmodels,Original,MistralForCausalLM,21.7021075222127,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.499543533049808,29.427578860536,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.273489932885906,3.13199105145414,MUSR,0.43759375,14.1325520833333,MMLU-PRO,0.294630984042553,21.625664893617,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-11,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,487,7.242,0.472797519360034 +NousResearch/Hermes-2-Pro-Mistral-7B_bfloat16_09317b1d8da639b5d9af77c06aa17cde0f0f91c0_True,NousResearch/Hermes-2-Pro-Mistral-7B,09317b1d8da639b5d9af77c06aa17cde0f0f91c0,bfloat16,chatmodels,Original,MistralForCausalLM,21.7021075222127,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.499543533049808,29.427578860536,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.273489932885906,3.13199105145414,MUSR,0.43759375,14.1325520833333,MMLU-PRO,0.294630984042553,21.625664893617,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-11,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,488,7.242,0.472797519360034 NousResearch/Hermes-2-Theta-Llama-3-8B_bfloat16_885173e97ab8572b444f7db1290d5d0386e26816_True,NousResearch/Hermes-2-Theta-Llama-3-8B,885173e97ab8572b444f7db1290d5d0386e26816,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.7757883439893,TRUE,IFEval,0.651788365980044,65.1788365980044,BBH,0.520667226091187,32.0460738480758,MATH Level 5,0.0959214501510574,9.59214501510574,GPQA,0.303691275167785,7.15883668903803,MUSR,0.394895833333333,8.36197916666667,MMLU-PRO,0.336851728723404,26.3168587470449,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-05,2024-07-11,2,NousResearch/Meta-Llama-3-8B,apache-2.0,196,8.03,0.743922417596867 NousResearch/Hermes-3-Llama-3.1-70B_bfloat16_093242c69a91f8d9d5b8094c380b88772f9bd7f8_True,NousResearch/Hermes-3-Llama-3.1-70B,093242c69a91f8d9d5b8094c380b88772f9bd7f8,bfloat16,chatmodels,Original,LlamaForCausalLM,37.4825450944456,TRUE,IFEval,0.76614383169989,76.614383169989,BBH,0.675578064138748,53.7654086913006,MATH Level 5,0.148036253776435,14.8036253776435,GPQA,0.361577181208054,14.8769574944072,MUSR,0.494895833333333,23.4286458333333,MMLU-PRO,0.47265625,41.40625,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-29,2024-08-28,1,meta-llama/Meta-Llama-3.1-70B,llama3,102,70.554,11.2078909209213 NousResearch/Hermes-3-Llama-3.1-8B_bfloat16_aabb745a717e133b74dcae23195d2635cf5f38cc_True,NousResearch/Hermes-3-Llama-3.1-8B,aabb745a717e133b74dcae23195d2635cf5f38cc,bfloat16,chatmodels,Original,LlamaForCausalLM,23.49087671148,TRUE,IFEval,0.617017291896612,61.7017291896612,BBH,0.517745254014125,30.724096614148,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.297818791946309,6.3758389261745,MUSR,0.4369375,13.6171875,MMLU-PRO,0.31391289893617,23.7680998817967,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-28,2024-08-28,1,meta-llama/Meta-Llama-3.1-8B,llama3,276,8.03,0.905807900142943 -NousResearch/Hermes-3-Llama-3.2-3B_bfloat16_f6a109fe836b13b6905f8c16a7388f2f557c3974_True,NousResearch/Hermes-3-Llama-3.2-3B,f6a109fe836b13b6905f8c16a7388f2f557c3974,bfloat16,chatmodels,Original,LlamaForCausalLM,15.116238224353,TRUE,IFEval,0.38248624760081,38.248624760081,BBH,0.435199015067149,20.1871880374546,MATH Level 5,0.0317220543806647,3.17220543806647,GPQA,0.275167785234899,3.35570469798658,MUSR,0.403020833333333,8.57760416666667,MMLU-PRO,0.254404920212766,17.1561022458629,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-20,1,Removed,llama3,119,3.213,1.10155586552599 -NousResearch/Nous-Hermes-2-Mistral-7B-DPO_bfloat16_ebec0a691037d38955727d6949798429a63929dd_True,NousResearch/Nous-Hermes-2-Mistral-7B-DPO,ebec0a691037d38955727d6949798429a63929dd,bfloat16,chatmodels,Original,MistralForCausalLM,21.0376463902847,TRUE,IFEval,0.57625101397625,57.625101397625,BBH,0.485265366546524,27.7925456583661,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.292785234899329,5.70469798657718,MUSR,0.399979166666667,8.33072916666667,MMLU-PRO,0.301529255319149,22.3921394799054,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-18,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,172,7.242,0.474598918698818 +NousResearch/Hermes-3-Llama-3.2-3B_bfloat16_f6a109fe836b13b6905f8c16a7388f2f557c3974_True,NousResearch/Hermes-3-Llama-3.2-3B,f6a109fe836b13b6905f8c16a7388f2f557c3974,bfloat16,chatmodels,Original,LlamaForCausalLM,15.116238224353,TRUE,IFEval,0.38248624760081,38.248624760081,BBH,0.435199015067149,20.1871880374546,MATH Level 5,0.0317220543806647,3.17220543806647,GPQA,0.275167785234899,3.35570469798658,MUSR,0.403020833333333,8.57760416666667,MMLU-PRO,0.254404920212766,17.1561022458629,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-20,1,Removed,llama3,121,3.213,1.10155586552599 +NousResearch/Nous-Hermes-2-Mistral-7B-DPO_bfloat16_ebec0a691037d38955727d6949798429a63929dd_True,NousResearch/Nous-Hermes-2-Mistral-7B-DPO,ebec0a691037d38955727d6949798429a63929dd,bfloat16,chatmodels,Original,MistralForCausalLM,21.0376463902847,TRUE,IFEval,0.57625101397625,57.625101397625,BBH,0.485265366546524,27.7925456583661,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.292785234899329,5.70469798657718,MUSR,0.399979166666667,8.33072916666667,MMLU-PRO,0.301529255319149,22.3921394799054,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-18,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,173,7.242,0.474598918698818 NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO_bfloat16_286ae6737d048ad1d965c2e830864df02db50f2f_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,286ae6737d048ad1d965c2e830864df02db50f2f,bfloat16,chatmodels,Original,MixtralForCausalLM,27.290249854483,TRUE,IFEval,0.58968980083955,58.968980083955,BBH,0.553885138403382,37.1077837913399,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.321308724832215,9.50782997762864,MUSR,0.459541666666667,16.6760416666667,MMLU-PRO,0.366605718085106,29.6228575650118,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-11,2024-07-27,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,420,46.703,12.8651437241499 NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT_bfloat16_4c06af2684730f75a6874b95e8bf6058105d9612_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT,4c06af2684730f75a6874b95e8bf6058105d9612,bfloat16,chatmodels,Original,MixtralForCausalLM,21.8410108914617,TRUE,IFEval,0.573078321076965,57.3078321076965,BBH,0.505786845402664,30.5943127788644,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.302013422818792,6.93512304250559,MUSR,0.421375,11.1385416666667,MMLU-PRO,0.306599069148936,22.9554521276596,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-26,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,55,46.703,10.3879398461721 NousResearch/Nous-Hermes-2-SOLAR-10.7B_bfloat16_14c1fbe2f71acdcd58247b30d5439bd572d52386_True,NousResearch/Nous-Hermes-2-SOLAR-10.7B,14c1fbe2f71acdcd58247b30d5439bd572d52386,bfloat16,chatmodels,Original,LlamaForCausalLM,23.3621906922798,TRUE,IFEval,0.527866062048697,52.7866062048698,BBH,0.541429484114017,34.9908945844652,MATH Level 5,0.054380664652568,5.4380664652568,GPQA,0.293624161073826,5.8165548098434,MUSR,0.43728125,13.8268229166667,MMLU-PRO,0.345827792553192,27.3141991725768,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-01,2024-06-12,1,upstage/SOLAR-10.7B-v1.0,apache-2.0,203,10.732,0.643444138017228 @@ -904,7 +906,7 @@ OpenScholar/Llama-3.1_OpenScholar-8B_bfloat16_e26aeb22af568bd8d01ffde86ebbd13c3c Orenguteng/Llama-3.1-8B-Lexi-Uncensored_bfloat16_56ac439ab4c7826871493ffbe2d49f2100a98e97_True,Orenguteng/Llama-3.1-8B-Lexi-Uncensored,56ac439ab4c7826871493ffbe2d49f2100a98e97,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,26.8604132222972,TRUE,IFEval,0.77768432204329,77.768432204329,BBH,0.505726165264264,29.2425432417686,MATH Level 5,0.13821752265861,13.821752265861,GPQA,0.271812080536913,2.9082774049217,MUSR,0.387114583333333,6.42265625,MMLU-PRO,0.378989361702128,30.9988179669031,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-07-29,0,Orenguteng/Llama-3.1-8B-Lexi-Uncensored,llama3.1,42,8.03,0.856735067560064 Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2_bfloat16_2340f8fbcd2452125a798686ca90b882a08fb0d9_True,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,2340f8fbcd2452125a798686ca90b882a08fb0d9,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,27.9251209060615,TRUE,IFEval,0.779158189160317,77.9158189160317,BBH,0.508400801878393,29.6870327456312,MATH Level 5,0.169184290030212,16.9184290030212,GPQA,0.282718120805369,4.36241610738255,MUSR,0.384291666666667,7.76979166666667,MMLU-PRO,0.378075132978723,30.8972369976359,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-09,2024-08-28,0,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,llama3.1,150,8.03,0.869686314484719 Orion-zhen/Qwen2.5-7B-Instruct-Uncensored_bfloat16_33c24657b4394fc430ad90b5d413e5985ce8e292_True,Orion-zhen/Qwen2.5-7B-Instruct-Uncensored,33c24657b4394fc430ad90b5d413e5985ce8e292,bfloat16,chatmodels,Original,Qwen2ForCausalLM,27.9897115235622,TRUE,IFEval,0.720431787656751,72.0431787656751,BBH,0.54739186521573,35.8324528622882,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.302852348993289,7.04697986577182,MUSR,0.436135416666667,13.58359375,MMLU-PRO,0.442652925531915,38.0725472813239,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-26,2024-10-19,1,Orion-zhen/Qwen2.5-7B-Instruct-Uncensored (Merge),gpl-3.0,14,7.616,1.11681194245401 -Orion-zhen/phi-4-abliterated_bfloat16_90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77_False,Orion-zhen/phi-4-abliterated,90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77,bfloat16,fine-tunedondomain-specificdatasets,Original,Phi3ForCausalLM,29.7021385186012,FALSE,IFEval,0.0576027163481784,5.76027163481784,BBH,0.669823930666478,52.4571292257837,MATH Level 5,0.285498489425982,28.5498489425982,GPQA,0.404362416107383,20.5816554809843,MUSR,0.500625,23.178125,MMLU-PRO,0.529172207446809,47.6858008274232,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-17,2024-12-20,1,Orion-zhen/phi-4-abliterated (Merge),gpl-3.0,20,14.66,0.894350962480824 +Orion-zhen/phi-4-abliterated_bfloat16_90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77_False,Orion-zhen/phi-4-abliterated,90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77,bfloat16,fine-tunedondomain-specificdatasets,Original,Phi3ForCausalLM,29.7021385186012,FALSE,IFEval,0.0576027163481784,5.76027163481784,BBH,0.669823930666478,52.4571292257837,MATH Level 5,0.285498489425982,28.5498489425982,GPQA,0.404362416107383,20.5816554809843,MUSR,0.500625,23.178125,MMLU-PRO,0.529172207446809,47.6858008274232,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-17,2024-12-20,1,Orion-zhen/phi-4-abliterated (Merge),gpl-3.0,21,14.66,0.894350962480824 P0x0/Astra-v1-12B_bfloat16_c706e253f8d8fa838b505cbec0e1a6aeec545abc_False,P0x0/Astra-v1-12B,c706e253f8d8fa838b505cbec0e1a6aeec545abc,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.674299882431,FALSE,IFEval,0.280594378471345,28.0594378471345,BBH,0.521450648413898,31.8099073411794,MATH Level 5,0.109516616314199,10.9516616314199,GPQA,0.313758389261745,8.50111856823266,MUSR,0.4051875,11.3817708333333,MMLU-PRO,0.346077127659575,27.3419030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-21,2024-09-23,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,2,12.248,1.60567337209763 PJMixers/LLaMa-3-CursedStock-v2.0-8B_bfloat16_d47cc29df363f71ffaf6cd21ac4bdeefa27359db_True,PJMixers/LLaMa-3-CursedStock-v2.0-8B,d47cc29df363f71ffaf6cd21ac4bdeefa27359db,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,24.2038982437966,TRUE,IFEval,0.633079118959915,63.3079118959915,BBH,0.527115950402997,32.5636117089159,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.274328859060403,3.24384787472036,MUSR,0.385625,8.03645833333334,MMLU-PRO,0.355634973404255,28.4038859338062,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-26,2024-06-27,1,PJMixers/LLaMa-3-CursedStock-v2.0-8B (Merge),llama3,11,8.03,1.40269205586454 PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B_bfloat16_c5b8d7fa43a013e434630a7f89f3bf15ac19606f_True,PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B,c5b8d7fa43a013e434630a7f89f3bf15ac19606f,bfloat16,chatmodels,Original,LlamaForCausalLM,28.7938572465617,TRUE,IFEval,0.787101557201559,78.7101557201559,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.194108761329305,19.4108761329305,GPQA,0.291946308724832,5.59284116331097,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376745345744681,30.7494828605201,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-18,2024-12-18,1,PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B (Merge),llama3.1,1,13.047,1.29636573579394 @@ -919,7 +921,7 @@ Parissa3/test-model_bfloat16_7021138dac98d930f1ce0ebe186583c0813d6f48_False,Pari PocketDoc/Dans-Instruct-CoreCurriculum-12b_bfloat16_c50db5ba880b7edc0efd32a7f3b9d2f051c3f4a6_True,PocketDoc/Dans-Instruct-CoreCurriculum-12b,c50db5ba880b7edc0efd32a7f3b9d2f051c3f4a6,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,9.40282371026575,TRUE,IFEval,0.219145201398955,21.9145201398955,BBH,0.378873907524027,13.23256495304,MATH Level 5,0.0490936555891239,4.90936555891239,GPQA,0.282718120805369,4.36241610738255,MUSR,0.4095625,9.56197916666667,MMLU-PRO,0.121924867021277,2.4360963356974,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-01,0,Removed,"",0,12,1.5885381520372 PocketDoc/Dans-PersonalityEngine-V1.1.0-12b_bfloat16_e58b4d12f79522209478fed022b65675a18b877f_True,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b,e58b4d12f79522209478fed022b65675a18b877f,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,26.1385999215711,TRUE,IFEval,0.707467297880734,70.7467297880734,BBH,0.536104624319959,33.666618823463,MATH Level 5,0.0506042296072508,5.06042296072508,GPQA,0.286912751677852,4.92170022371365,MUSR,0.458677083333333,17.3013020833333,MMLU-PRO,0.326213430851064,25.1348256501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b (Merge),apache-2.0,19,12.248,2.11734611148732 PocketDoc/Dans-PersonalityEngine-v1.0.0-8b_bfloat16_c64612e1eee1ddb3aa064a25eba8921ec3d94325_True,PocketDoc/Dans-PersonalityEngine-v1.0.0-8b,c64612e1eee1ddb3aa064a25eba8921ec3d94325,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.7794202230361,TRUE,IFEval,0.498190357141274,49.8190357141274,BBH,0.473255442591494,25.6879597690821,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.285234899328859,4.6979865771812,MUSR,0.35415625,3.93619791666667,MMLU-PRO,0.306515957446809,22.9462174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-08,2024-10-08,1,PocketDoc/Dans-PersonalityEngine-v1.0.0-8b (Merge),apache-2.0,4,8.03,0.900974258409386 -PowerInfer/SmallThinker-3B-Preview_bfloat16_f335f911ad120220287e737eeeffe7a3ff54b60b_True,PowerInfer/SmallThinker-3B-Preview,f335f911ad120220287e737eeeffe7a3ff54b60b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,19.5695095292787,TRUE,IFEval,0.619965026130667,61.9965026130667,BBH,0.449492201666092,22.0621046421687,MATH Level 5,0.0589123867069487,5.89123867069487,GPQA,0.260906040268456,1.45413870246085,MUSR,0.352479166666667,3.59322916666667,MMLU-PRO,0.301778590425532,22.4198433806147,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2025-01-07,1,PowerInfer/SmallThinker-3B-Preview (Merge),"",333,3.397,0.737944081449492 +PowerInfer/SmallThinker-3B-Preview_bfloat16_f335f911ad120220287e737eeeffe7a3ff54b60b_True,PowerInfer/SmallThinker-3B-Preview,f335f911ad120220287e737eeeffe7a3ff54b60b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,19.5695095292787,TRUE,IFEval,0.619965026130667,61.9965026130667,BBH,0.449492201666092,22.0621046421687,MATH Level 5,0.0589123867069487,5.89123867069487,GPQA,0.260906040268456,1.45413870246085,MUSR,0.352479166666667,3.59322916666667,MMLU-PRO,0.301778590425532,22.4198433806147,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2025-01-07,1,PowerInfer/SmallThinker-3B-Preview (Merge),"",340,3.397,0.737944081449492 PranavHarshan/LaMistral-V4_bfloat16_b373c2a1ab08823b6b119899f807793c96ef7888_True,PranavHarshan/LaMistral-V4,b373c2a1ab08823b6b119899f807793c96ef7888,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.2107651768593,TRUE,IFEval,0.623861354539289,62.3861354539289,BBH,0.518425534258647,31.0913486817948,MATH Level 5,0.0687311178247734,6.87311178247734,GPQA,0.328020134228188,10.4026845637584,MUSR,0.364291666666667,5.63645833333333,MMLU-PRO,0.359873670212766,28.8748522458629,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-01,2024-10-05,1,PranavHarshan/LaMistral-V4 (Merge),apache-2.0,1,8.03,0.697232370090008 PranavHarshan/MedNarra-X1_bfloat16_9fe294e7fd69ec56f0b7fa1a23759eed070f44bf_False,PranavHarshan/MedNarra-X1,9fe294e7fd69ec56f0b7fa1a23759eed070f44bf,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.128681543434,FALSE,IFEval,0.43384331351924,43.384331351924,BBH,0.463716681797742,23.5234951323421,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.307885906040268,7.71812080536913,MUSR,0.35403125,2.45390625,MMLU-PRO,0.343085106382979,27.0094562647754,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-08,2024-10-09,1,PranavHarshan/MedNarra-X1 (Merge),"",0,8.03,0.676160938867545 Pretergeek/OpenChat-3.5-0106_10.7B_48Layers-Appended_bfloat16_1091b30480f4cc91f26cb1bd7579e527f490f8d2_True,Pretergeek/OpenChat-3.5-0106_10.7B_48Layers-Appended,1091b30480f4cc91f26cb1bd7579e527f490f8d2,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.7106998558598,TRUE,IFEval,0.596059566394943,59.6059566394943,BBH,0.461963788442602,24.0571725122886,MATH Level 5,0.0777945619335348,7.77945619335348,GPQA,0.307046979865772,7.60626398210291,MUSR,0.42540625,11.77578125,MMLU-PRO,0.328956117021277,25.4395685579196,TRUE,TRUE,FALSE,FALSE,FALSE,2024-07-27,2024-07-31,1,Pretergeek/OpenChat-3.5-0106_10.7B_48Layers-Appended (Merge),apache-2.0,2,10.732,0.83609961028351 @@ -937,7 +939,7 @@ PrimeIntellect/INTELLECT-1-Instruct_bfloat16_a672cbe91f9bd4df58f90619ca3c2acb2eb PuxAI/LUA_model_float16_f098319bc21c8710652f75febe0d8a110058458f_False,PuxAI/LUA_model,f098319bc21c8710652f75febe0d8a110058458f,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,5.14872374821187,FALSE,IFEval,0.228213362766349,22.8213362766349,BBH,0.287677810298844,1.8156684085008,MATH Level 5,0,0,GPQA,0.26006711409396,1.34228187919463,MUSR,0.348385416666667,3.54817708333333,MMLU-PRO,0.112283909574468,1.36487884160756,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-18,0,PuxAI/LUA_model,"",0,7.386,0.630092113903009 PygmalionAI/pygmalion-6b_float16_2a0d74449c8fbf0378194e95f64aa92e16297294_False,PygmalionAI/pygmalion-6b,2a0d74449c8fbf0378194e95f64aa92e16297294,float16,fine-tunedondomain-specificdatasets,Original,GPTJForCausalLM,5.3923596589092,FALSE,IFEval,0.20910406610017,20.910406610017,BBH,0.3198894464386,5.08957714398891,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.249161073825503,0,MUSR,0.368354166666667,3.7109375,MMLU-PRO,0.118351063829787,2.03900709219858,TRUE,FALSE,FALSE,FALSE,TRUE,2023-01-07,2024-06-12,0,PygmalionAI/pygmalion-6b,creativeml-openrail-m,737,6,31.9231192804799 Q-bert/MetaMath-1B_float16_da62756f069aba78d07d4c76108e246cb91dbc35_True,Q-bert/MetaMath-1B,da62756f069aba78d07d4c76108e246cb91dbc35,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.3242479106733,TRUE,IFEval,0.530039184918239,53.0039184918239,BBH,0.345068636779295,8.43461064483256,MATH Level 5,0,0,GPQA,0.251677852348993,0.223713646532442,MUSR,0.328916666666667,0.78125,MMLU-PRO,0.14951795212766,5.50199468085107,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-30,0,Removed,"",0,1.236,0.465027993931676 -Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1528,32.764,10.2103897762396 +Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1535,32.764,10.2103897762396 Qwen/Qwen1.5-0.5B_bfloat16_8f445e3628f3500ee69f24e1303c9f10f5342a39_False,Qwen/Qwen1.5-0.5B,8f445e3628f3500ee69f24e1303c9f10f5342a39,bfloat16,pretrained,Original,Qwen2ForCausalLM,5.13701708767239,FALSE,IFEval,0.17056077873376,17.056077873376,BBH,0.315353865914256,5.03547583679937,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.254194630872483,0.559284116331097,MUSR,0.361625,4.303125,MMLU-PRO,0.130734707446809,3.41496749408983,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-13,0,Qwen/Qwen1.5-0.5B,other,149,0.62,0.978737373550742 Qwen/Qwen1.5-0.5B-Chat_bfloat16_4d14e384a4b037942bb3f3016665157c8bcb70ea_True,Qwen/Qwen1.5-0.5B-Chat,4d14e384a4b037942bb3f3016665157c8bcb70ea,bfloat16,chatmodels,Original,Qwen2ForCausalLM,5.56486903979377,TRUE,IFEval,0.180727137328954,18.0727137328954,BBH,0.316666215203671,4.31803263693806,MATH Level 5,0,0,GPQA,0.269295302013423,2.57270693512304,MUSR,0.383708333333333,6.06354166666667,MMLU-PRO,0.121259973404255,2.36221926713948,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-31,2024-06-12,0,Qwen/Qwen1.5-0.5B-Chat,other,75,0.62,0.54974439031725 Qwen/Qwen1.5-1.8B_bfloat16_7846de7ed421727b318d6605a0bfab659da2c067_False,Qwen/Qwen1.5-1.8B,7846de7ed421727b318d6605a0bfab659da2c067,bfloat16,pretrained,Original,Qwen2ForCausalLM,9.18137570437486,FALSE,IFEval,0.215423963971152,21.5423963971152,BBH,0.347612155836631,9.75990158772794,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.305369127516779,7.38255033557047,MUSR,0.360510416666667,3.96380208333333,MMLU-PRO,0.188164893617021,9.79609929078014,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-13,0,Qwen/Qwen1.5-1.8B,other,45,1.837,0.948870786599621 @@ -950,12 +952,12 @@ Qwen/Qwen1.5-32B_bfloat16_cefef80dc06a65f89d1d71d0adbc56d335ca2490_False,Qwen/Qw Qwen/Qwen1.5-32B-Chat_bfloat16_0997b012af6ddd5465d40465a8415535b2f06cfc_True,Qwen/Qwen1.5-32B-Chat,0997b012af6ddd5465d40465a8415535b2f06cfc,bfloat16,chatmodels,Original,Qwen2ForCausalLM,27.1930170704966,TRUE,IFEval,0.553219900973861,55.3219900973861,BBH,0.606689975793023,44.5548540239164,MATH Level 5,0.0717522658610272,7.17522658610272,GPQA,0.306208053691275,7.49440715883669,MUSR,0.415979166666667,10.1973958333333,MMLU-PRO,0.445728058510638,38.4142287234043,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-03,2024-06-12,0,Qwen/Qwen1.5-32B-Chat,other,108,32.512,46.0594497310076 Qwen/Qwen1.5-4B_bfloat16_a66363a0c24e2155c561e4b53c658b1d3965474e_False,Qwen/Qwen1.5-4B,a66363a0c24e2155c561e4b53c658b1d3965474e,bfloat16,pretrained,Original,Qwen2ForCausalLM,11.3275986698975,FALSE,IFEval,0.244474660567295,24.4474660567295,BBH,0.405389702967255,16.2491425810953,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.276845637583893,3.57941834451902,MUSR,0.360447916666667,4.82265625,MMLU-PRO,0.246010638297872,16.2234042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-13,0,Qwen/Qwen1.5-4B,other,34,3.95,1.63868216690388 Qwen/Qwen1.5-4B-Chat_bfloat16_a7a4d4945d28bac955554c9abd2f74a71ebbf22f_True,Qwen/Qwen1.5-4B-Chat,a7a4d4945d28bac955554c9abd2f74a71ebbf22f,bfloat16,chatmodels,Original,Qwen2ForCausalLM,12.3377534239841,TRUE,IFEval,0.315665766832006,31.5665766832006,BBH,0.400554856114861,16.2970785289083,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.266778523489933,2.23713646532438,MUSR,0.39778125,7.35598958333333,MMLU-PRO,0.239611037234043,15.5123374704492,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-4B-Chat,other,38,3.95,0.866150647838799 -Qwen/Qwen1.5-7B_bfloat16_831096e3a59a0789a541415da25ef195ceb802fe_False,Qwen/Qwen1.5-7B,831096e3a59a0789a541415da25ef195ceb802fe,bfloat16,pretrained,Original,Qwen2ForCausalLM,15.357503964068,FALSE,IFEval,0.268429987987429,26.8429987987429,BBH,0.455989640769345,23.0757687543405,MATH Level 5,0.0528700906344411,5.28700906344411,GPQA,0.298657718120805,6.48769574944072,MUSR,0.410333333333333,9.15833333333333,MMLU-PRO,0.291638962765957,21.2932180851064,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-09,0,Qwen/Qwen1.5-7B,other,47,7.721,1.82735405409524 +Qwen/Qwen1.5-7B_bfloat16_831096e3a59a0789a541415da25ef195ceb802fe_False,Qwen/Qwen1.5-7B,831096e3a59a0789a541415da25ef195ceb802fe,bfloat16,pretrained,Original,Qwen2ForCausalLM,15.357503964068,FALSE,IFEval,0.268429987987429,26.8429987987429,BBH,0.455989640769345,23.0757687543405,MATH Level 5,0.0528700906344411,5.28700906344411,GPQA,0.298657718120805,6.48769574944072,MUSR,0.410333333333333,9.15833333333333,MMLU-PRO,0.291638962765957,21.2932180851064,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-09,0,Qwen/Qwen1.5-7B,other,48,7.721,1.82735405409524 Qwen/Qwen1.5-7B-Chat_bfloat16_5f4f5e69ac7f1d508f8369e977de208b4803444b_True,Qwen/Qwen1.5-7B-Chat,5f4f5e69ac7f1d508f8369e977de208b4803444b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,16.5761729315825,TRUE,IFEval,0.437115741787347,43.7115741787347,BBH,0.451005311652135,22.3791295999528,MATH Level 5,0,0,GPQA,0.302852348993289,7.04697986577182,MUSR,0.37790625,4.63828125,MMLU-PRO,0.295129654255319,21.6810726950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-7B-Chat,other,164,7.721,1.07882659669136 Qwen/Qwen1.5-MoE-A2.7B_bfloat16_1a758c50ecb6350748b9ce0a99d2352fd9fc11c9_False,Qwen/Qwen1.5-MoE-A2.7B,1a758c50ecb6350748b9ce0a99d2352fd9fc11c9,bfloat16,pretrained,Original,Qwen2MoeForCausalLM,12.4227579773455,FALSE,IFEval,0.265982038768246,26.5982038768246,BBH,0.411351543301077,18.8378585005472,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.259228187919463,1.23042505592841,MUSR,0.40134375,7.96796875,MMLU-PRO,0.277759308510638,19.7510342789598,TRUE,FALSE,TRUE,FALSE,TRUE,2024-02-29,2024-06-13,0,Qwen/Qwen1.5-MoE-A2.7B,other,196,14.316,9.54561289606972 Qwen/Qwen1.5-MoE-A2.7B-Chat_bfloat16_ec052fda178e241c7c443468d2fa1db6618996be_True,Qwen/Qwen1.5-MoE-A2.7B-Chat,ec052fda178e241c7c443468d2fa1db6618996be,bfloat16,chatmodels,Original,Qwen2MoeForCausalLM,14.8234980434335,TRUE,IFEval,0.379538513366756,37.9538513366756,BBH,0.427208862063582,20.041818895541,MATH Level 5,0,0,GPQA,0.274328859060403,3.24384787472036,MUSR,0.389875,6.334375,MMLU-PRO,0.292303856382979,21.3670951536643,TRUE,FALSE,TRUE,FALSE,TRUE,2024-03-14,2024-06-12,0,Qwen/Qwen1.5-MoE-A2.7B-Chat,other,114,14.316,8.90197153753581 Qwen/Qwen2-0.5B_bfloat16_ff3a49fac17555b8dfc4db6709f480cc8f16a9fe_False,Qwen/Qwen2-0.5B,ff3a49fac17555b8dfc4db6709f480cc8f16a9fe,bfloat16,pretrained,Original,Qwen2ForCausalLM,7.28706205765386,FALSE,IFEval,0.187321861549577,18.7321861549577,BBH,0.323911742482544,7.91851204090326,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.260906040268456,1.45413870246085,MUSR,0.375208333333333,4.60104166666667,MMLU-PRO,0.171958111702128,7.99534574468085,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-31,2024-11-30,0,Qwen/Qwen2-0.5B,apache-2.0,122,0.494,1.79993829168931 -Qwen/Qwen2-0.5B-Instruct_bfloat16_c291d6fce4804a1d39305f388dd32897d1f7acc4_True,Qwen/Qwen2-0.5B-Instruct,c291d6fce4804a1d39305f388dd32897d1f7acc4,bfloat16,chatmodels,Original,Qwen2ForCausalLM,6.41054699783957,TRUE,IFEval,0.224666108148601,22.4666108148601,BBH,0.317251793848635,5.87604425940848,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.246644295302013,0,MUSR,0.335270833333333,2.40885416666667,MMLU-PRO,0.153091755319149,5.89908392434988,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-03,2024-06-12,1,Qwen/Qwen2-0.5B,apache-2.0,169,0.494,0.557847723145263 +Qwen/Qwen2-0.5B-Instruct_bfloat16_c291d6fce4804a1d39305f388dd32897d1f7acc4_True,Qwen/Qwen2-0.5B-Instruct,c291d6fce4804a1d39305f388dd32897d1f7acc4,bfloat16,chatmodels,Original,Qwen2ForCausalLM,6.41054699783957,TRUE,IFEval,0.224666108148601,22.4666108148601,BBH,0.317251793848635,5.87604425940848,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.246644295302013,0,MUSR,0.335270833333333,2.40885416666667,MMLU-PRO,0.153091755319149,5.89908392434988,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-03,2024-06-12,1,Qwen/Qwen2-0.5B,apache-2.0,170,0.494,0.557847723145263 Qwen/Qwen2-1.5B_bfloat16_8a16abf2848eda07cc5253dec660bf1ce007ad7a_False,Qwen/Qwen2-1.5B,8a16abf2848eda07cc5253dec660bf1ce007ad7a,bfloat16,pretrained,Original,Qwen2ForCausalLM,10.4454529355615,FALSE,IFEval,0.211327056654122,21.1327056654122,BBH,0.357479317205775,11.7818336534835,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.264261744966443,1.90156599552573,MUSR,0.3658125,3.59322916666667,MMLU-PRO,0.255152925531915,17.2392139479905,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-31,2024-06-09,0,Qwen/Qwen2-1.5B,apache-2.0,83,1.544,1.10819489200472 Qwen/Qwen2-1.5B-Instruct_bfloat16_ba1cf1846d7df0a0591d6c00649f57e798519da8_True,Qwen/Qwen2-1.5B-Instruct,ba1cf1846d7df0a0591d6c00649f57e798519da8,bfloat16,chatmodels,Original,Qwen2ForCausalLM,13.990879413369,TRUE,IFEval,0.337123277348546,33.7123277348546,BBH,0.385223240837606,13.6953468275027,MATH Level 5,0.0626888217522659,6.26888217522659,GPQA,0.261744966442953,1.56599552572707,MUSR,0.42928125,12.0268229166667,MMLU-PRO,0.250083111702128,16.6759013002364,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-03,2024-06-12,0,Qwen/Qwen2-1.5B-Instruct,apache-2.0,134,1.544,0.658823938556274 Qwen/Qwen2-57B-A14B_bfloat16_973e466c39ba76372a2ae464dbca0af3f5a5a2a9_False,Qwen/Qwen2-57B-A14B,973e466c39ba76372a2ae464dbca0af3f5a5a2a9,bfloat16,pretrained,Original,Qwen2MoeForCausalLM,25.0338731324107,FALSE,IFEval,0.311269653408512,31.1269653408512,BBH,0.561820493868417,38.8759890503419,MATH Level 5,0.186555891238671,18.6555891238671,GPQA,0.306208053691275,7.49440715883669,MUSR,0.417375,10.5385416666667,MMLU-PRO,0.491605718085106,43.5117464539007,TRUE,FALSE,TRUE,FALSE,TRUE,2024-05-22,2024-06-13,0,Qwen/Qwen2-57B-A14B,apache-2.0,48,57.409,107.031477464734 @@ -966,9 +968,9 @@ Qwen/Qwen2-7B_bfloat16_453ed1575b739b5b03ce3758b23befdb0967f40e_False,Qwen/Qwen2 Qwen/Qwen2-7B-Instruct_bfloat16_41c66b0be1c3081f13defc6bdf946c2ef240d6a6_True,Qwen/Qwen2-7B-Instruct,41c66b0be1c3081f13defc6bdf946c2ef240d6a6,bfloat16,chatmodels,Original,Qwen2ForCausalLM,24.9029516291134,TRUE,IFEval,0.567907596288958,56.7907596288958,BBH,0.554478156379319,37.8083909231017,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.297818791946309,6.3758389261745,MUSR,0.392791666666667,7.365625,MMLU-PRO,0.384724069148936,31.6360076832151,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-04,2024-06-12,1,Qwen/Qwen2-7B,apache-2.0,607,7.616,1.04203898585749 Qwen/Qwen2-Math-72B-Instruct_bfloat16_5c267882f3377bcfc35882f8609098a894eeeaa8_True,Qwen/Qwen2-Math-72B-Instruct,5c267882f3377bcfc35882f8609098a894eeeaa8,bfloat16,chatmodels,Original,Qwen2ForCausalLM,35.1508663678517,TRUE,IFEval,0.569381463405985,56.9381463405985,BBH,0.634337660025181,47.9601995073491,MATH Level 5,0.381419939577039,38.1419939577039,GPQA,0.368288590604027,15.7718120805369,MUSR,0.451697916666667,15.72890625,MMLU-PRO,0.427277260638298,36.364140070922,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-08,2024-08-19,0,Qwen/Qwen2-Math-72B-Instruct,other,87,72.706,12.1682476948271 Qwen/Qwen2-Math-7B_bfloat16_47a44ff4136da8960adbab02b2326787086bcf6c_True,Qwen/Qwen2-Math-7B,47a44ff4136da8960adbab02b2326787086bcf6c,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,11.9413924471103,TRUE,IFEval,0.26870481433707,26.870481433707,BBH,0.386954741074792,14.0644944888713,MATH Level 5,0.243202416918429,24.3202416918429,GPQA,0.263422818791946,1.78970917225951,MUSR,0.359333333333333,2.41666666666667,MMLU-PRO,0.11968085106383,2.18676122931442,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-08,2024-08-19,0,Qwen/Qwen2-Math-7B,apache-2.0,13,7.616,1.5630360629051 -Qwen/Qwen2-VL-72B-Instruct_bfloat16_f400120e59a6196b024298b7d09fb517f742db7d_True,Qwen/Qwen2-VL-72B-Instruct,f400120e59a6196b024298b7d09fb517f742db7d,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,37.9127528860119,TRUE,IFEval,0.598232689264485,59.8232689264485,BBH,0.694628729233868,56.3112338791251,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.38758389261745,18.34451901566,MUSR,0.44921875,15.8856770833333,MMLU-PRO,0.57172539893617,52.41393321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-10-20,1,Qwen/Qwen2-VL-72B-Instruct (Merge),other,253,73.406,27.2497165156002 -Qwen/Qwen2-VL-7B-Instruct_bfloat16_51c47430f97dd7c74aa1fa6825e68a813478097f_True,Qwen/Qwen2-VL-7B-Instruct,51c47430f97dd7c74aa1fa6825e68a813478097f,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,24.2148096194201,TRUE,IFEval,0.459921896124505,45.9921896124505,BBH,0.546450715906999,35.8771031449895,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.319630872483222,9.2841163310962,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-28,2024-10-20,1,Qwen/Qwen2-VL-7B-Instruct (Merge),apache-2.0,1036,8.291,1.05438228472396 -Qwen/Qwen2.5-0.5B_bfloat16_2630d3d2321bc1f1878f702166d1b2af019a7310_False,Qwen/Qwen2.5-0.5B,2630d3d2321bc1f1878f702166d1b2af019a7310,bfloat16,pretrained,Original,Qwen2ForCausalLM,6.31089339476025,FALSE,IFEval,0.162717146061339,16.271714606134,BBH,0.327481481511966,6.95396163488226,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.246644295302013,0,MUSR,0.343333333333333,2.08333333333333,MMLU-PRO,0.190575132978723,10.0639036643026,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-0.5B,apache-2.0,155,0.5,1.16534262881835 +Qwen/Qwen2-VL-72B-Instruct_bfloat16_f400120e59a6196b024298b7d09fb517f742db7d_True,Qwen/Qwen2-VL-72B-Instruct,f400120e59a6196b024298b7d09fb517f742db7d,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,37.9127528860119,TRUE,IFEval,0.598232689264485,59.8232689264485,BBH,0.694628729233868,56.3112338791251,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.38758389261745,18.34451901566,MUSR,0.44921875,15.8856770833333,MMLU-PRO,0.57172539893617,52.41393321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-10-20,1,Qwen/Qwen2-VL-72B-Instruct (Merge),other,255,73.406,27.2497165156002 +Qwen/Qwen2-VL-7B-Instruct_bfloat16_51c47430f97dd7c74aa1fa6825e68a813478097f_True,Qwen/Qwen2-VL-7B-Instruct,51c47430f97dd7c74aa1fa6825e68a813478097f,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,24.2148096194201,TRUE,IFEval,0.459921896124505,45.9921896124505,BBH,0.546450715906999,35.8771031449895,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.319630872483222,9.2841163310962,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-28,2024-10-20,1,Qwen/Qwen2-VL-7B-Instruct (Merge),apache-2.0,1039,8.291,1.05438228472396 +Qwen/Qwen2.5-0.5B_bfloat16_2630d3d2321bc1f1878f702166d1b2af019a7310_False,Qwen/Qwen2.5-0.5B,2630d3d2321bc1f1878f702166d1b2af019a7310,bfloat16,pretrained,Original,Qwen2ForCausalLM,6.31089339476025,FALSE,IFEval,0.162717146061339,16.271714606134,BBH,0.327481481511966,6.95396163488226,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.246644295302013,0,MUSR,0.343333333333333,2.08333333333333,MMLU-PRO,0.190575132978723,10.0639036643026,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-0.5B,apache-2.0,157,0.5,1.16534262881835 Qwen/Qwen2.5-0.5B-Instruct_bfloat16_a8b602d9dafd3a75d382e62757d83d89fca3be54_True,Qwen/Qwen2.5-0.5B-Instruct,a8b602d9dafd3a75d382e62757d83d89fca3be54,bfloat16,chatmodels,Original,Qwen2ForCausalLM,8.14064731927608,TRUE,IFEval,0.307122878407071,30.7122878407071,BBH,0.334072921493727,8.43486361058883,MATH Level 5,0,0,GPQA,0.25755033557047,1.00671140939597,MUSR,0.332885416666667,0.944010416666666,MMLU-PRO,0.169714095744681,7.74601063829787,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-19,1,Qwen/Qwen2.5-0.5B,apache-2.0,179,0.5,0.63082445281977 Qwen/Qwen2.5-0.5B-Instruct_float16_7ae557604adf67be50417f59c2c2f167def9a775_True,Qwen/Qwen2.5-0.5B-Instruct,7ae557604adf67be50417f59c2c2f167def9a775,float16,chatmodels,Original,Qwen2ForCausalLM,8.38297184669106,TRUE,IFEval,0.315291205113543,31.5291205113543,BBH,0.332191642954914,8.16950226818277,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.3341875,1.3734375,MMLU-PRO,0.171958111702128,7.99534574468085,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-0.5B,apache-2.0,179,0.494,0.618575974583338 Qwen/Qwen2.5-1.5B_bfloat16_e5dfabbcffd9b0c7b31d89b82c5a6b72e663f32c_False,Qwen/Qwen2.5-1.5B,e5dfabbcffd9b0c7b31d89b82c5a6b72e663f32c,bfloat16,pretrained,Original,Qwen2ForCausalLM,13.8023486940494,FALSE,IFEval,0.267430417957686,26.7430417957686,BBH,0.407795094513661,16.6604651676919,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.285234899328859,4.6979865771812,MUSR,0.35759375,5.26588541666667,MMLU-PRO,0.285488696808511,20.6098552009456,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-1.5B,apache-2.0,53,1.5,1.24850101000351 @@ -976,17 +978,17 @@ Qwen/Qwen2.5-1.5B-Instruct_bfloat16_5fee7c4ed634dc66c6e318c8ac2897b8b9154536_Tru Qwen/Qwen2.5-14B_bfloat16_83a1904df002b00bc8db6f877821cb77dbb363b0_False,Qwen/Qwen2.5-14B,83a1904df002b00bc8db6f877821cb77dbb363b0,bfloat16,pretrained,Original,Qwen2ForCausalLM,31.7496528240654,FALSE,IFEval,0.369446402212795,36.9446402212795,BBH,0.616051493531774,45.0783124049849,MATH Level 5,0.277945619335347,27.7945619335347,GPQA,0.381711409395973,17.5615212527964,MUSR,0.450239583333333,15.91328125,MMLU-PRO,0.52485039893617,47.2055998817967,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-14B,apache-2.0,50,14.77,5.58592135172473 Qwen/Qwen2.5-14B-Instruct_bfloat16_f55224c616ca27d4bcf28969a156de12c98981cf_True,Qwen/Qwen2.5-14B-Instruct,f55224c616ca27d4bcf28969a156de12c98981cf,bfloat16,chatmodels,Original,Qwen2ForCausalLM,32.1830727842617,TRUE,IFEval,0.815777692079239,81.5777692079239,BBH,0.639045370590622,48.3607066128271,MATH Level 5,0,0,GPQA,0.322147651006711,9.61968680089485,MUSR,0.4100625,10.1578125,MMLU-PRO,0.490442154255319,43.3824615839244,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-14B,apache-2.0,158,14.77,1.7736503203376 Qwen/Qwen2.5-32B_bfloat16_ff23665d01c3665be5fdb271d18a62090b65c06d_False,Qwen/Qwen2.5-32B,ff23665d01c3665be5fdb271d18a62090b65c06d,bfloat16,pretrained,Original,Qwen2ForCausalLM,37.9827910715109,FALSE,IFEval,0.407664995545154,40.7664995545154,BBH,0.677052244872651,53.954752851332,MATH Level 5,0.354984894259819,35.4984894259819,GPQA,0.411912751677852,21.5883668903803,MUSR,0.497833333333333,22.6958333333333,MMLU-PRO,0.580535239361702,53.3928043735225,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-32B,apache-2.0,60,32.764,5.87488554274725 -Qwen/Qwen2.5-32B-Instruct_bfloat16_70e8dfb9ad18a7d499f765fe206ff065ed8ca197_True,Qwen/Qwen2.5-32B-Instruct,70e8dfb9ad18a7d499f765fe206ff065ed8ca197,bfloat16,chatmodels,Original,Qwen2ForCausalLM,36.174184974139,TRUE,IFEval,0.834612162395777,83.4612162395777,BBH,0.691252508013434,56.4893482615939,MATH Level 5,0,0,GPQA,0.338087248322148,11.744966442953,MUSR,0.426125,13.4989583333333,MMLU-PRO,0.566655585106383,51.8506205673759,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-32B,apache-2.0,172,32.764,5.75248317034287 -Qwen/Qwen2.5-3B_bfloat16_e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34_False,Qwen/Qwen2.5-3B,e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34,bfloat16,pretrained,Original,Qwen2ForCausalLM,17.1083089890835,FALSE,IFEval,0.268954152759124,26.8954152759124,BBH,0.461247534101163,24.3042417263717,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.297818791946309,6.3758389261745,MUSR,0.430333333333333,11.7583333333333,MMLU-PRO,0.3203125,24.4791666666667,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-27,0,Qwen/Qwen2.5-3B,other,46,3.086,3.81050747400589 -Qwen/Qwen2.5-3B-Instruct_bfloat16_82f42baa094a9600e39ccd80d34058aeeb3abbc1_True,Qwen/Qwen2.5-3B-Instruct,82f42baa094a9600e39ccd80d34058aeeb3abbc1,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.0313443188007,TRUE,IFEval,0.647491987925371,64.7491987925372,BBH,0.469276665604885,25.8013939440886,MATH Level 5,0,0,GPQA,0.272651006711409,3.02013422818792,MUSR,0.396791666666667,7.565625,MMLU-PRO,0.325465425531915,25.0517139479905,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-3B,other,137,3,1.38847430558096 +Qwen/Qwen2.5-32B-Instruct_bfloat16_70e8dfb9ad18a7d499f765fe206ff065ed8ca197_True,Qwen/Qwen2.5-32B-Instruct,70e8dfb9ad18a7d499f765fe206ff065ed8ca197,bfloat16,chatmodels,Original,Qwen2ForCausalLM,36.174184974139,TRUE,IFEval,0.834612162395777,83.4612162395777,BBH,0.691252508013434,56.4893482615939,MATH Level 5,0,0,GPQA,0.338087248322148,11.744966442953,MUSR,0.426125,13.4989583333333,MMLU-PRO,0.566655585106383,51.8506205673759,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-32B,apache-2.0,173,32.764,5.75248317034287 +Qwen/Qwen2.5-3B_bfloat16_e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34_False,Qwen/Qwen2.5-3B,e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34,bfloat16,pretrained,Original,Qwen2ForCausalLM,17.1083089890835,FALSE,IFEval,0.268954152759124,26.8954152759124,BBH,0.461247534101163,24.3042417263717,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.297818791946309,6.3758389261745,MUSR,0.430333333333333,11.7583333333333,MMLU-PRO,0.3203125,24.4791666666667,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-27,0,Qwen/Qwen2.5-3B,other,48,3.086,3.81050747400589 +Qwen/Qwen2.5-3B-Instruct_bfloat16_82f42baa094a9600e39ccd80d34058aeeb3abbc1_True,Qwen/Qwen2.5-3B-Instruct,82f42baa094a9600e39ccd80d34058aeeb3abbc1,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.0313443188007,TRUE,IFEval,0.647491987925371,64.7491987925372,BBH,0.469276665604885,25.8013939440886,MATH Level 5,0,0,GPQA,0.272651006711409,3.02013422818792,MUSR,0.396791666666667,7.565625,MMLU-PRO,0.325465425531915,25.0517139479905,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-3B,other,138,3,1.38847430558096 Qwen/Qwen2.5-72B_bfloat16_587cc4061cf6a7cc0d429d05c109447e5cf063af_False,Qwen/Qwen2.5-72B,587cc4061cf6a7cc0d429d05c109447e5cf063af,bfloat16,pretrained,Original,Qwen2ForCausalLM,38.3656148716295,FALSE,IFEval,0.413710067066495,41.3710067066495,BBH,0.679732067069485,54.6150578016369,MATH Level 5,0.386706948640483,38.6706948640483,GPQA,0.405201342281879,20.6935123042506,MUSR,0.477125,19.640625,MMLU-PRO,0.596825132978723,55.2027925531915,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-72B,other,54,72.706,18.0919265899938 -Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,667,72.706,33.0067683243991 -Qwen/Qwen2.5-7B_bfloat16_57597c00770845ceba45271ba1b24c94bbcc7baf_False,Qwen/Qwen2.5-7B,57597c00770845ceba45271ba1b24c94bbcc7baf,bfloat16,pretrained,Original,Qwen2ForCausalLM,24.9869343450417,FALSE,IFEval,0.337447971382598,33.7447971382598,BBH,0.541630376778862,35.8134732875478,MATH Level 5,0.188821752265861,18.8821752265861,GPQA,0.324664429530201,9.95525727069351,MUSR,0.442427083333333,14.13671875,MMLU-PRO,0.436502659574468,37.3891843971631,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-7B,apache-2.0,96,7.616,3.02796087914288 -Qwen/Qwen2.5-7B-Instruct_bfloat16_52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac_True,Qwen/Qwen2.5-7B-Instruct,52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.8667753266146,TRUE,IFEval,0.7585251576927,75.85251576927,BBH,0.53942319682991,34.8921167587655,MATH Level 5,0,0,GPQA,0.291107382550336,5.48098434004475,MUSR,0.40203125,8.45390625,MMLU-PRO,0.428690159574468,36.5211288416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-7B,apache-2.0,415,7.616,2.16827148311528 +Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,668,72.706,33.0067683243991 +Qwen/Qwen2.5-7B_bfloat16_57597c00770845ceba45271ba1b24c94bbcc7baf_False,Qwen/Qwen2.5-7B,57597c00770845ceba45271ba1b24c94bbcc7baf,bfloat16,pretrained,Original,Qwen2ForCausalLM,24.9869343450417,FALSE,IFEval,0.337447971382598,33.7447971382598,BBH,0.541630376778862,35.8134732875478,MATH Level 5,0.188821752265861,18.8821752265861,GPQA,0.324664429530201,9.95525727069351,MUSR,0.442427083333333,14.13671875,MMLU-PRO,0.436502659574468,37.3891843971631,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-7B,apache-2.0,97,7.616,3.02796087914288 +Qwen/Qwen2.5-7B-Instruct_bfloat16_52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac_True,Qwen/Qwen2.5-7B-Instruct,52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.8667753266146,TRUE,IFEval,0.7585251576927,75.85251576927,BBH,0.53942319682991,34.8921167587655,MATH Level 5,0,0,GPQA,0.291107382550336,5.48098434004475,MUSR,0.40203125,8.45390625,MMLU-PRO,0.428690159574468,36.5211288416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-7B,apache-2.0,419,7.616,2.16827148311528 Qwen/Qwen2.5-Coder-14B_bfloat16_1db30eb5ec86a6e51d8981818ee2910370b3010d_True,Qwen/Qwen2.5-Coder-14B,1db30eb5ec86a6e51d8981818ee2910370b3010d,bfloat16,pretrained,Original,Qwen2ForCausalLM,24.7661116962997,TRUE,IFEval,0.347265256186917,34.7265256186917,BBH,0.586486009174123,40.523002115363,MATH Level 5,0.221299093655589,22.1299093655589,GPQA,0.292785234899329,5.70469798657718,MUSR,0.387364583333333,6.38723958333334,MMLU-PRO,0.452127659574468,39.1252955082742,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-08,2024-11-12,1,Qwen/Qwen2.5-Coder-14B (Merge),apache-2.0,23,14.77,3.63262520075326 Qwen/Qwen2.5-Coder-14B-Instruct_bfloat16_1a62978099f9b19f72fdd191988ff958abb18561_True,Qwen/Qwen2.5-Coder-14B-Instruct,1a62978099f9b19f72fdd191988ff958abb18561,bfloat16,chatmodels,Original,Qwen2ForCausalLM,31.1787254167968,TRUE,IFEval,0.690756082749327,69.0756082749327,BBH,0.614029642366133,44.2200182156684,MATH Level 5,0.268126888217523,26.8126888217523,GPQA,0.304530201342282,7.27069351230425,MUSR,0.391458333333333,7.03229166666667,MMLU-PRO,0.393949468085106,32.6610520094563,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-11-12,1,Qwen/Qwen2.5-Coder-14B-Instruct (Merge),apache-2.0,70,14.77,1.38321406525897 Qwen/Qwen2.5-Coder-32B_float16_2e12b5f7bc878d424d222e224ed40aee564ec45f_False,Qwen/Qwen2.5-Coder-32B,2e12b5f7bc878d424d222e224ed40aee564ec45f,float16,pretrained,Original,Qwen2ForCausalLM,33.2120108702677,FALSE,IFEval,0.436341130422834,43.6341130422834,BBH,0.640395506550809,48.5112134061417,MATH Level 5,0.305891238670695,30.5891238670695,GPQA,0.346476510067114,12.8635346756152,MUSR,0.4528125,15.8682291666667,MMLU-PRO,0.530252659574468,47.8058510638298,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-08,2024-12-10,1,Qwen/Qwen2.5-Coder-32B (Merge),apache-2.0,93,32.764,4.6902502672998 -Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1442,32.764,4.69438966297979 +Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1451,32.764,4.69438966297979 Qwen/Qwen2.5-Coder-7B_bfloat16_097b213c52760d22753af1aa5cbdba94b5c99506_True,Qwen/Qwen2.5-Coder-7B,097b213c52760d22753af1aa5cbdba94b5c99506,bfloat16,pretrained,Original,Qwen2ForCausalLM,19.2094905389622,TRUE,IFEval,0.344592348302504,34.4592348302504,BBH,0.485564055342148,28.4389441152555,MATH Level 5,0.191842900302115,19.1842900302115,GPQA,0.259228187919463,1.23042505592841,MUSR,0.344854166666667,2.1734375,MMLU-PRO,0.367935505319149,29.7706117021277,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-21,1,Qwen/Qwen2.5-Coder-7B (Merge),apache-2.0,84,7.616,2.30176716800796 Qwen/Qwen2.5-Coder-7B-Instruct_bfloat16_3030861ab8e72c6155e1821631bf977ef40d3e5b_True,Qwen/Qwen2.5-Coder-7B-Instruct,3030861ab8e72c6155e1821631bf977ef40d3e5b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,22.4254329651823,TRUE,IFEval,0.610147741326347,61.0147741326347,BBH,0.500797698622455,28.9385040453791,MATH Level 5,0.033987915407855,3.3987915407855,GPQA,0.291946308724832,5.59284116331097,MUSR,0.407270833333333,9.47552083333333,MMLU-PRO,0.335189494680851,26.1321660756501,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,383,7.616,1.77985748125157 Qwen/Qwen2.5-Coder-7B-Instruct_float16_f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5_True,Qwen/Qwen2.5-Coder-7B-Instruct,f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5,float16,chatmodels,Original,Qwen2ForCausalLM,22.5245158164521,TRUE,IFEval,0.614718945730661,61.4718945730661,BBH,0.499904855031131,28.7265779689503,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.293624161073826,5.8165548098434,MUSR,0.4099375,9.87552083333333,MMLU-PRO,0.335438829787234,26.1598699763593,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,383,7.616,0.697647347897138 @@ -1041,8 +1043,8 @@ SanjiWatsuki/Silicon-Maid-7B_bfloat16_4e43d81f3fff1091df7cb2d85e9e306d25235701_T Sao10K/Fimbulvetr-11B-v2_float16_b2dcd534dc3a53ff84e60a53b87816185169be19_True,Sao10K/Fimbulvetr-11B-v2,b2dcd534dc3a53ff84e60a53b87816185169be19,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0696190015868,TRUE,IFEval,0.510005673834315,51.0005673834315,BBH,0.454449506518434,22.6551208100587,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.291946308724832,5.59284116331097,MUSR,0.435364583333333,14.9205729166667,MMLU-PRO,0.330119680851064,25.568853427896,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-06,2024-07-01,0,Sao10K/Fimbulvetr-11B-v2,cc-by-nc-4.0,167,10.732,0.821204151076343 Sao10K/L3-70B-Euryale-v2.1_bfloat16_36ad832b771cd783ea7ad00ed39e61f679b1a7c6_True,Sao10K/L3-70B-Euryale-v2.1,36ad832b771cd783ea7ad00ed39e61f679b1a7c6,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.3480147060313,TRUE,IFEval,0.738441778924365,73.8441778924365,BBH,0.647132281126872,48.7011867294481,MATH Level 5,0.208459214501511,20.8459214501511,GPQA,0.331375838926175,10.8501118568233,MUSR,0.420916666666667,12.2479166666667,MMLU-PRO,0.510388962765958,45.598773640662,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-11,2024-07-01,0,Sao10K/L3-70B-Euryale-v2.1,cc-by-nc-4.0,126,70.554,8.61834854619988 Sao10K/L3-70B-Euryale-v2.1_float16_36ad832b771cd783ea7ad00ed39e61f679b1a7c6_True,Sao10K/L3-70B-Euryale-v2.1,36ad832b771cd783ea7ad00ed39e61f679b1a7c6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.4732526687288,TRUE,IFEval,0.728100329348351,72.8100329348351,BBH,0.650277899274504,49.1930030798986,MATH Level 5,0.224320241691843,22.4320241691843,GPQA,0.331375838926175,10.8501118568233,MUSR,0.419583333333333,12.0479166666667,MMLU-PRO,0.509557845744681,45.5064273049645,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-11,2024-06-26,0,Sao10K/L3-70B-Euryale-v2.1,cc-by-nc-4.0,126,70.554,8.61645431985954 -Sao10K/L3-8B-Lunaris-v1_bfloat16_8479c2a7ee119c935b9a02c921cc2a85b698dfe8_True,Sao10K/L3-8B-Lunaris-v1,8479c2a7ee119c935b9a02c921cc2a85b698dfe8,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,25.6283363857046,TRUE,IFEval,0.68945730661312,68.945730661312,BBH,0.523529928251542,32.1143484550954,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.301174496644295,6.82326621923937,MUSR,0.372666666666667,5.55,MMLU-PRO,0.378740026595745,30.9711140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-26,2024-07-22,0,Sao10K/L3-8B-Lunaris-v1,llama3,99,8.03,0.660498638520832 -Sao10K/L3-8B-Niitama-v1_float16_507a802294c653056dac604a704fd55c9a566695_True,Sao10K/L3-8B-Niitama-v1,507a802294c653056dac604a704fd55c9a566695,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.7660377976422,TRUE,IFEval,0.679065989352695,67.9065989352695,BBH,0.530298013178714,33.2097878209279,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.307885906040268,7.71812080536913,MUSR,0.380666666666667,6.08333333333334,MMLU-PRO,0.370096409574468,30.0107121749409,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-07,2025-01-07,0,Sao10K/L3-8B-Niitama-v1,cc-by-nc-4.0,34,8.03,0.530377216497447 +Sao10K/L3-8B-Lunaris-v1_bfloat16_8479c2a7ee119c935b9a02c921cc2a85b698dfe8_True,Sao10K/L3-8B-Lunaris-v1,8479c2a7ee119c935b9a02c921cc2a85b698dfe8,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,25.6283363857046,TRUE,IFEval,0.68945730661312,68.945730661312,BBH,0.523529928251542,32.1143484550954,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.301174496644295,6.82326621923937,MUSR,0.372666666666667,5.55,MMLU-PRO,0.378740026595745,30.9711140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-26,2024-07-22,0,Sao10K/L3-8B-Lunaris-v1,llama3,100,8.03,0.660498638520832 +Sao10K/L3-8B-Niitama-v1_float16_507a802294c653056dac604a704fd55c9a566695_True,Sao10K/L3-8B-Niitama-v1,507a802294c653056dac604a704fd55c9a566695,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.7660377976422,TRUE,IFEval,0.679065989352695,67.9065989352695,BBH,0.530298013178714,33.2097878209279,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.307885906040268,7.71812080536913,MUSR,0.380666666666667,6.08333333333334,MMLU-PRO,0.370096409574468,30.0107121749409,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-07,2025-01-07,0,Sao10K/L3-8B-Niitama-v1,cc-by-nc-4.0,35,8.03,0.530377216497447 Sao10K/L3-8B-Stheno-v3.2_bfloat16_4bb828f6e1b1efd648c39b1ad682c44ff260f018_True,Sao10K/L3-8B-Stheno-v3.2,4bb828f6e1b1efd648c39b1ad682c44ff260f018,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.9095698218306,TRUE,IFEval,0.687284183743578,68.7284183743578,BBH,0.522778637171633,32.021597924075,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.310402684563758,8.05369127516779,MUSR,0.379364583333333,6.45390625,MMLU-PRO,0.376828457446809,30.7587174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-05,2024-06-30,0,Sao10K/L3-8B-Stheno-v3.2,cc-by-nc-4.0,266,8.03,0.891672233627461 Sao10K/L3-8B-Stheno-v3.3-32K_bfloat16_1a59d163e079c7e7f1542553d085853119960f0c_True,Sao10K/L3-8B-Stheno-v3.3-32K,1a59d163e079c7e7f1542553d085853119960f0c,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,12.5870405203853,TRUE,IFEval,0.460371813454966,46.0371813454966,BBH,0.384401292300821,13.5120089831975,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.256711409395973,0.894854586129753,MUSR,0.372541666666667,4.06770833333333,MMLU-PRO,0.189577792553192,9.95308806146572,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-22,2024-06-26,0,Sao10K/L3-8B-Stheno-v3.3-32K,cc-by-nc-4.0,53,8.03,1.46863224607195 Sao10K/MN-12B-Lyra-v3_bfloat16_da76fa39d128ca84065427189bb228f2dfc6b8a3_True,Sao10K/MN-12B-Lyra-v3,da76fa39d128ca84065427189bb228f2dfc6b8a3,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.3964568922766,TRUE,IFEval,0.448606364446336,44.8606364446336,BBH,0.480395436039724,25.8709633830725,MATH Level 5,0.0793051359516616,7.93051359516616,GPQA,0.277684563758389,3.69127516778523,MUSR,0.40190625,9.03828125,MMLU-PRO,0.324883643617021,24.9870715130024,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-27,2024-09-03,0,Sao10K/MN-12B-Lyra-v3,cc-by-nc-4.0,34,12.248,2.08466477138094 @@ -1072,7 +1074,7 @@ SicariusSicariiStuff/2B-ad_float16_fa0e405edfb1c6e454b7a25852b5bbf5049cf132_Fals SicariusSicariiStuff/2B_or_not_2B_float16_abf87e8422284aa83a42efd7a91154f9af3c7ed3_False,SicariusSicariiStuff/2B_or_not_2B,abf87e8422284aa83a42efd7a91154f9af3c7ed3,float16,fine-tunedondomain-specificdatasets,Original,GemmaForCausalLM,6.57942454779956,FALSE,IFEval,0.206231687478114,20.6231687478114,BBH,0.341591702409202,7.68230049623281,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.24748322147651,0,MUSR,0.379083333333333,4.85208333333334,MMLU-PRO,0.139876994680851,4.43077718676123,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-11,2024-10-11,0,SicariusSicariiStuff/2B_or_not_2B,apache-2.0,25,2.506,0.877135651473592 SicariusSicariiStuff/Dusk_Rainbow_bfloat16_106058ac50593d65bc4b5ae75c8c010e87cd8487_False,SicariusSicariiStuff/Dusk_Rainbow,106058ac50593d65bc4b5ae75c8c010e87cd8487,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.6113025105056,FALSE,IFEval,0.358805746530317,35.8805746530317,BBH,0.477175042807362,25.9590368242234,MATH Level 5,0.0740181268882175,7.40181268882175,GPQA,0.308724832214765,7.82997762863535,MUSR,0.402520833333333,7.4484375,MMLU-PRO,0.344331781914894,27.1479757683215,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-16,2024-10-08,0,SicariusSicariiStuff/Dusk_Rainbow,apache-2.0,31,8.03,1.60465452429426 SicariusSicariiStuff/Impish_LLAMA_3B_bfloat16_72703d3083d1a67849cbea0b7add3c1270a77cc7_False,SicariusSicariiStuff/Impish_LLAMA_3B,72703d3083d1a67849cbea0b7add3c1270a77cc7,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.7793593770642,FALSE,IFEval,0.462994853654969,46.2994853654969,BBH,0.409051016278732,16.9857548569044,MATH Level 5,0.11178247734139,11.178247734139,GPQA,0.287751677852349,5.03355704697987,MUSR,0.367270833333333,5.60885416666667,MMLU-PRO,0.294132313829787,21.5702570921986,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-01,2024-10-07,0,SicariusSicariiStuff/Impish_LLAMA_3B,apache-2.0,16,3.213,0.722952381276759 -SicariusSicariiStuff/Impish_Mind_8B_float16_b408001bae902572570b4f55ebad3436c1c2cedb_False,SicariusSicariiStuff/Impish_Mind_8B,b408001bae902572570b4f55ebad3436c1c2cedb,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.1116149466646,FALSE,IFEval,0.317914245313546,31.7914245313546,BBH,0.467365716166271,24.5628541145626,MATH Level 5,0.104229607250755,10.4229607250755,GPQA,0.304530201342282,7.27069351230425,MUSR,0.406958333333333,8.96979166666667,MMLU-PRO,0.330867686170213,25.6519651300236,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-05,0,SicariusSicariiStuff/Impish_Mind_8B,apache-2.0,17,8.03,0.6847817336385 +SicariusSicariiStuff/Impish_Mind_8B_float16_b408001bae902572570b4f55ebad3436c1c2cedb_False,SicariusSicariiStuff/Impish_Mind_8B,b408001bae902572570b4f55ebad3436c1c2cedb,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.1116149466646,FALSE,IFEval,0.317914245313546,31.7914245313546,BBH,0.467365716166271,24.5628541145626,MATH Level 5,0.104229607250755,10.4229607250755,GPQA,0.304530201342282,7.27069351230425,MUSR,0.406958333333333,8.96979166666667,MMLU-PRO,0.330867686170213,25.6519651300236,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-05,0,SicariusSicariiStuff/Impish_Mind_8B,apache-2.0,18,8.03,0.6847817336385 SicariusSicariiStuff/LLAMA-3_8B_Unaligned_BETA_float16_9bc5b68a7448a4e46eeaf27a4ac477d79578db95_False,SicariusSicariiStuff/LLAMA-3_8B_Unaligned_BETA,9bc5b68a7448a4e46eeaf27a4ac477d79578db95,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.1533404966018,FALSE,IFEval,0.371320318975873,37.1320318975873,BBH,0.471723402848483,24.9980137538074,MATH Level 5,0.0845921450151058,8.45921450151058,GPQA,0.305369127516779,7.38255033557047,MUSR,0.411947916666667,9.56015625,MMLU-PRO,0.346492686170213,27.3880762411348,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-12,2024-10-18,0,SicariusSicariiStuff/LLAMA-3_8B_Unaligned_BETA,apache-2.0,41,8.03,0.749373219973464 SicariusSicariiStuff/Qwen2.5-14B_Uncencored_float16_1daf648ac2f837c66bf6bb00459e034987d9486f_False,SicariusSicariiStuff/Qwen2.5-14B_Uncencored,1daf648ac2f837c66bf6bb00459e034987d9486f,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,31.674586251327,FALSE,IFEval,0.315790990128415,31.5790990128415,BBH,0.630894194550783,46.7202351109504,MATH Level 5,0.314954682779456,31.4954682779456,GPQA,0.381711409395973,17.5615212527964,MUSR,0.451666666666667,15.2916666666667,MMLU-PRO,0.526595744680851,47.3995271867612,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-20,0,Removed,"",0,14,2.73919539073176 SicariusSicariiStuff/Qwen2.5-14B_Uncensored_float16_0710a2341d269dcd56f9136fed442373d4dadc5d_False,SicariusSicariiStuff/Qwen2.5-14B_Uncensored,0710a2341d269dcd56f9136fed442373d4dadc5d,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,31.6999818313509,FALSE,IFEval,0.317314724929853,31.7314724929853,BBH,0.630894194550783,46.7202351109504,MATH Level 5,0.314954682779456,31.4954682779456,GPQA,0.381711409395973,17.5615212527964,MUSR,0.451666666666667,15.2916666666667,MMLU-PRO,0.526595744680851,47.3995271867612,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-21,0,Removed,"",0,14,2.42088670104725 @@ -1090,7 +1092,7 @@ SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch2_bfloat16_ff0f4aa3aee4535aaec8c4989014e11 SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch3_bfloat16_879c73ee9539aca6cabff3a3fc5a8b37108dbd15_False,SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch3,879c73ee9539aca6cabff3a3fc5a8b37108dbd15,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.294335452253,FALSE,IFEval,0.533112142448703,53.3112142448703,BBH,0.439962826803102,20.8061366293104,MATH Level 5,0.13821752265861,13.821752265861,GPQA,0.291946308724832,5.59284116331097,MUSR,0.352229166666667,5.96197916666667,MMLU-PRO,0.300448803191489,22.2720892434988,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-30,2024-12-31,1,SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch3 (Merge),llama3.2,0,3.213,0.5666264985193 SkyOrbis/SKY-Ko-Qwen2.5-3B-Instruct_float16_3241e4efcc62259e56caa03f8b42c301edc9320a_False,SkyOrbis/SKY-Ko-Qwen2.5-3B-Instruct,3241e4efcc62259e56caa03f8b42c301edc9320a,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,15.4261460247146,FALSE,IFEval,0.35341006307708,35.341006307708,BBH,0.426482122833602,19.1506790305095,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.279362416107383,3.91498881431767,MUSR,0.402364583333333,9.26223958333333,MMLU-PRO,0.281166888297872,20.1296542553192,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-09,2025-01-09,1,SkyOrbis/SKY-Ko-Qwen2.5-3B-Instruct (Merge),"",0,3.086,0.729896414609141 Skywork/Skywork-Reward-Gemma-2-27B-v0.2_bfloat16_a92f2ec997c806de469ff287ef3b71982e886fc2_True,Skywork/Skywork-Reward-Gemma-2-27B-v0.2,a92f2ec997c806de469ff287ef3b71982e886fc2,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForSequenceClassification,30.8976015018891,TRUE,IFEval,0.780731791646166,78.0731791646166,BBH,0.635960062329604,48.1599042497272,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.343959731543624,12.5279642058166,MUSR,0.423145833333333,11.9932291666667,MMLU-PRO,0.410322473404255,34.480274822695,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-14,2024-12-27,2,google/gemma-2-27b,"",26,27.227,4.42896986339819 -Skywork/Skywork-o1-Open-Llama-3.1-8B_bfloat16_a41903315f39ebf1c08fdba0ef52758f7afe3682_True,Skywork/Skywork-o1-Open-Llama-3.1-8B,a41903315f39ebf1c08fdba0ef52758f7afe3682,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,12.0671940960369,TRUE,IFEval,0.351836460591231,35.1836460591231,BBH,0.451590897018972,23.017598928073,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.315645833333333,1.52239583333333,MMLU-PRO,0.203041888297872,11.4490986997636,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-26,2025-01-01,2,meta-llama/Meta-Llama-3.1-8B,other,99,8.03,0.698189034975431 +Skywork/Skywork-o1-Open-Llama-3.1-8B_bfloat16_a41903315f39ebf1c08fdba0ef52758f7afe3682_True,Skywork/Skywork-o1-Open-Llama-3.1-8B,a41903315f39ebf1c08fdba0ef52758f7afe3682,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,12.0671940960369,TRUE,IFEval,0.351836460591231,35.1836460591231,BBH,0.451590897018972,23.017598928073,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.315645833333333,1.52239583333333,MMLU-PRO,0.203041888297872,11.4490986997636,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-26,2025-01-01,2,meta-llama/Meta-Llama-3.1-8B,other,100,8.03,0.698189034975431 Solshine/Brimful-merged-replete_float16_01ce8c3df6edb87d31f0e9a9651cbcbc4d4823e8_True,Solshine/Brimful-merged-replete,01ce8c3df6edb87d31f0e9a9651cbcbc4d4823e8,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,3.82947458763002,TRUE,IFEval,0.176056197555819,17.6056197555819,BBH,0.28834447696551,1.9921389967361,MATH Level 5,0,0,GPQA,0.25755033557047,1.00671140939597,MUSR,0.342125,1.43229166666667,MMLU-PRO,0.108460771276596,0.940085697399526,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-01,2024-10-01,1,Solshine/Brimful-merged-replete (Merge),"",2,12.277,2.16672326865895 Solshine/Llama-3-1-big-thoughtful-passthrough-merge-2_float16_d48047d6577e22fdda73a1be8e18971912db66d2_True,Solshine/Llama-3-1-big-thoughtful-passthrough-merge-2,d48047d6577e22fdda73a1be8e18971912db66d2,float16,basemergesandmoerges,Original,LlamaForCausalLM,6.77764579154096,TRUE,IFEval,0.254666507090077,25.4666507090077,BBH,0.320938084271446,5.00844230649227,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.259228187919463,1.23042505592841,MUSR,0.388947916666667,6.75182291666667,MMLU-PRO,0.118517287234043,2.05747635933806,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-19,2024-09-24,1,Solshine/Llama-3-1-big-thoughtful-passthrough-merge-2 (Merge),"",2,18.5,3.3813526961235 Stark2008/GutenLaserPi_bfloat16_d5ab84c6f8f0c88c16380242c7e11e8cefc934b7_False,Stark2008/GutenLaserPi,d5ab84c6f8f0c88c16380242c7e11e8cefc934b7,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.287431571598,FALSE,IFEval,0.42265300513748,42.265300513748,BBH,0.521234248248952,32.9777100670166,MATH Level 5,0.0717522658610272,7.17522658610272,GPQA,0.286912751677852,4.92170022371365,MUSR,0.462020833333333,16.9859375,MMLU-PRO,0.310588430851064,23.3987145390071,FALSE,FALSE,FALSE,FALSE,FALSE,2024-07-11,2024-07-11,1,Stark2008/GutenLaserPi (Merge),"",0,7.242,0.569965183743718 @@ -1132,6 +1134,7 @@ T145/ZEUS-8B-V2-ORPO_bfloat16_fee1b04ccafb9f6bbb4db88effd837ad72e00571_True,T145 T145/ZEUS-8B-V2-abliterated_bfloat16_d07c040573a4a468d774e5f47811be3e4c05e622_True,T145/ZEUS-8B-V2-abliterated,d07c040573a4a468d774e5f47811be3e4c05e622,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,29.7085890844159,TRUE,IFEval,0.789549506420741,78.9549506420741,BBH,0.512886862221066,30.9825641951907,MATH Level 5,0.20619335347432,20.619335347432,GPQA,0.312919463087248,8.38926174496644,MUSR,0.391083333333333,7.91875,MMLU-PRO,0.382480053191489,31.3866725768322,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-30,2024-12-31,1,T145/ZEUS-8B-V2-abliterated (Merge),llama3.1,1,8.03,1.37028218542924 T145/ZEUS-8B-V20_bfloat16_0daec2344934c6f945fe8df88de345f66c89fe84_True,T145/ZEUS-8B-V20,0daec2344934c6f945fe8df88de345f66c89fe84,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,30.7630357603013,TRUE,IFEval,0.795594577942083,79.5594577942083,BBH,0.524400505841583,32.221586977252,MATH Level 5,0.202416918429003,20.2416918429003,GPQA,0.322986577181208,9.73154362416107,MUSR,0.404322916666667,10.2736979166667,MMLU-PRO,0.392952127659575,32.5502364066194,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-07,2025-01-07,1,T145/ZEUS-8B-V20 (Merge),"",1,8.03,0.668387733941896 T145/ZEUS-8B-V21_bfloat16_8b3646b8e380835dc6955ae210743360b3f9c298_True,T145/ZEUS-8B-V21,8b3646b8e380835dc6955ae210743360b3f9c298,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,10.8269429600709,TRUE,IFEval,0.378514563580189,37.8514563580189,BBH,0.339757539404585,7.35804837991714,MATH Level 5,0.0838368580060423,8.38368580060423,GPQA,0.264261744966443,1.90156599552573,MUSR,0.32615625,1.53619791666667,MMLU-PRO,0.171376329787234,7.93070330969267,FALSE,FALSE,FALSE,FALSE,FALSE,"",2025-01-08,0,Removed,"",0,8.03,0.72017418144155 +T145/ZEUS-8B-V22_bfloat16_e0c00dfff7eb8b0fe0c3b63980d9558f55dd569c_True,T145/ZEUS-8B-V22,e0c00dfff7eb8b0fe0c3b63980d9558f55dd569c,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,30.8037244339059,TRUE,IFEval,0.799516394278293,79.9516394278293,BBH,0.524491552250772,32.2139563599642,MATH Level 5,0.202416918429003,20.2416918429003,GPQA,0.328020134228188,10.4026845637584,MUSR,0.398958333333333,9.36979166666666,MMLU-PRO,0.393783244680851,32.6425827423168,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-09,2025-01-09,1,T145/ZEUS-8B-V22 (Merge),"",1,8.03,0.706253266042686 T145/ZEUS-8B-V2L1_bfloat16_c2d7f009c769f7ebdef00412ad85f2d3bdea9869_False,T145/ZEUS-8B-V2L1,c2d7f009c769f7ebdef00412ad85f2d3bdea9869,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0348610358661,FALSE,IFEval,0.31918864169293,31.918864169293,BBH,0.501348537526027,28.6942082065513,MATH Level 5,0.128398791540786,12.8398791540786,GPQA,0.312919463087248,8.38926174496644,MUSR,0.388197916666667,9.05807291666666,MMLU-PRO,0.363779920212766,29.3088800236407,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-02,0,Removed,"",0,8.03,0.744636958690887 T145/ZEUS-8B-V2L2_bfloat16_d3ae250942e4b749c2d545a48f08a93a659a9b6e_True,T145/ZEUS-8B-V2L2,d3ae250942e4b749c2d545a48f08a93a659a9b6e,bfloat16,chatmodels,Original,LlamaForCausalLM,29.8855739004236,TRUE,IFEval,0.802064078866297,80.2064078866297,BBH,0.520284366540213,32.0175092945529,MATH Level 5,0.198640483383686,19.8640483383686,GPQA,0.299496644295302,6.59955257270694,MUSR,0.39746875,8.58359375,MMLU-PRO,0.388380984042553,32.0423315602837,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-03,0,Removed,"",0,8.03,0.704039554036526 T145/ZEUS-8B-V3_bfloat16_2253fa275c722d46dd6380539042ec7f1bc0d7f7_True,T145/ZEUS-8B-V3,2253fa275c722d46dd6380539042ec7f1bc0d7f7,bfloat16,chatmodels,Original,LlamaForCausalLM,29.5797522194249,TRUE,IFEval,0.788675159687407,78.8675159687407,BBH,0.526506413353538,32.1082521099291,MATH Level 5,0.166163141993958,16.6163141993958,GPQA,0.322147651006711,9.61968680089485,MUSR,0.4016875,9.1109375,MMLU-PRO,0.380402260638298,31.1558067375887,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-05,0,Removed,"",0,8.03,0.60635058506023 @@ -1142,7 +1145,7 @@ T145/ZEUS-8B-V8_bfloat16_c7da6c67926ddaff25602bfd1b9941d9822c1387_True,T145/ZEUS T145/ZEUS-8B-V9_bfloat16_10b386571ad34d115433419d30b61746ef4d9735_True,T145/ZEUS-8B-V9,10b386571ad34d115433419d30b61746ef4d9735,bfloat16,chatmodels,Original,LlamaForCausalLM,25.8271249353926,TRUE,IFEval,0.555143685421349,55.5143685421349,BBH,0.520725634647775,31.8505495278181,MATH Level 5,0.211480362537764,21.1480362537764,GPQA,0.291107382550336,5.48098434004475,MUSR,0.394927083333333,8.73255208333333,MMLU-PRO,0.390126329787234,32.2362588652482,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,T145/ZEUS-8B-V9 (Merge),"",1,8.03,0.673209944939504 T145/qwen-2.5-3B-merge-test_bfloat16_0d5f82d841f811fbf1ee07bfbf7c6eb1de812840_True,T145/qwen-2.5-3B-merge-test,0d5f82d841f811fbf1ee07bfbf7c6eb1de812840,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.1541505180996,TRUE,IFEval,0.575101840893274,57.5101840893274,BBH,0.484248874772039,27.8893413136761,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.285234899328859,4.6979865771812,MUSR,0.400729166666667,8.29114583333333,MMLU-PRO,0.328956117021277,25.4395685579196,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-16,0,Removed,"",0,3.397,0.783956586523256 THUDM/glm-4-9b_bfloat16_99a140996f9d4f197842fb6b1aab217a42e27ef3_False,THUDM/glm-4-9b,99a140996f9d4f197842fb6b1aab217a42e27ef3,bfloat16,pretrained,Original,ChatGLMModelM,18.0067317317162,FALSE,IFEval,0.142608279365417,14.2608279365417,BBH,0.552836814166527,35.8112835812089,MATH Level 5,0,0,GPQA,0.316275167785235,8.83668903803132,MUSR,0.438583333333333,14.1895833333333,MMLU-PRO,0.414478058510638,34.942006501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-04,0,THUDM/glm-4-9b,other,119,9,1.67244683755118 -THUDM/glm-4-9b-chat_bfloat16_04419001bc63e05e70991ade6da1f91c4aeec278_True,THUDM/glm-4-9b-chat,04419001bc63e05e70991ade6da1f91c4aeec278,bfloat16,chatmodels,Original,ChatGLMModelM,10.9734772970452,TRUE,IFEval,0,0,BBH,0.473638842910357,25.2051836744402,MATH Level 5,0,0,GPQA,0.313758389261745,8.50111856823266,MUSR,0.399427083333333,8.06171875,MMLU-PRO,0.316655585106383,24.0728427895981,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-09,0,THUDM/glm-4-9b-chat,other,656,9,0.247134508492731 +THUDM/glm-4-9b-chat_bfloat16_04419001bc63e05e70991ade6da1f91c4aeec278_True,THUDM/glm-4-9b-chat,04419001bc63e05e70991ade6da1f91c4aeec278,bfloat16,chatmodels,Original,ChatGLMModelM,10.9734772970452,TRUE,IFEval,0,0,BBH,0.473638842910357,25.2051836744402,MATH Level 5,0,0,GPQA,0.313758389261745,8.50111856823266,MUSR,0.399427083333333,8.06171875,MMLU-PRO,0.316655585106383,24.0728427895981,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-09,0,THUDM/glm-4-9b-chat,other,657,9,0.247134508492731 THUDM/glm-4-9b-chat-1m_bfloat16_0aa722c7e0745dd21453427dd44c257dd253304f_True,THUDM/glm-4-9b-chat-1m,0aa722c7e0745dd21453427dd44c257dd253304f,bfloat16,chatmodels,Original,ChatGLMModel,8.92251018653198,TRUE,IFEval,0,0,BBH,0.418005782183303,17.1080285081681,MATH Level 5,0,0,GPQA,0.303691275167785,7.15883668903803,MUSR,0.379458333333333,5.23229166666667,MMLU-PRO,0.316323138297872,24.0359042553192,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-10-09,0,THUDM/glm-4-9b-chat-1m,other,183,9.484,0.205669954986166 TIGER-Lab/MAmmoTH2-7B-Plus_bfloat16_3ed578d8dda09787137e363a0dc32e3a8ed908de_True,TIGER-Lab/MAmmoTH2-7B-Plus,3ed578d8dda09787137e363a0dc32e3a8ed908de,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,21.4698622596292,TRUE,IFEval,0.557466411344123,55.7466411344123,BBH,0.423469498880191,18.9259532275557,MATH Level 5,0.175981873111782,17.5981873111782,GPQA,0.280201342281879,4.0268456375839,MUSR,0.412354166666667,10.1109375,MMLU-PRO,0.301695478723404,22.4106087470449,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-06,2024-06-27,0,TIGER-Lab/MAmmoTH2-7B-Plus,mit,7,7.242,0.552663350555736 TTTXXX01/Mistral-7B-Base-SimPO2-5e-7_bfloat16_7a271e3061165f4e1abfe26715c04e20c2ac935e_True,TTTXXX01/Mistral-7B-Base-SimPO2-5e-7,7a271e3061165f4e1abfe26715c04e20c2ac935e,bfloat16,chatmodels,Original,MistralForCausalLM,16.3796884014764,TRUE,IFEval,0.439189129288067,43.9189129288067,BBH,0.431955150148828,20.6926273825575,MATH Level 5,0.0241691842900302,2.41691842900302,GPQA,0.297818791946309,6.3758389261745,MUSR,0.360416666666667,5.25208333333333,MMLU-PRO,0.276595744680851,19.6217494089835,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-30,2024-09-01,2,mistralai/Mistral-7B-v0.1,apache-2.0,0,7.242,0.522996132267287 @@ -1151,14 +1154,14 @@ TencentARC/LLaMA-Pro-8B_bfloat16_7115e7179060e0623d1ee9ff4476faed7e478d8c_False, TencentARC/LLaMA-Pro-8B-Instruct_bfloat16_9850c8afce19a69d8fc4a1603a82441157514016_True,TencentARC/LLaMA-Pro-8B-Instruct,9850c8afce19a69d8fc4a1603a82441157514016,bfloat16,chatmodels,Original,LlamaForCausalLM,15.1449908953033,TRUE,IFEval,0.448606364446336,44.8606364446336,BBH,0.422420528246,19.485726056876,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.274328859060403,3.24384787472036,MUSR,0.419020833333333,11.1109375,MMLU-PRO,0.194564494680851,10.5071660756501,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-06,2024-06-12,0,TencentARC/LLaMA-Pro-8B-Instruct,llama2,63,8.357,3.10520335582265 TencentARC/MetaMath-Mistral-Pro_bfloat16_3835d38de15ed2a04c32aca879b782fc50e390bf_False,TencentARC/MetaMath-Mistral-Pro,3835d38de15ed2a04c32aca879b782fc50e390bf,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,12.0130022014745,FALSE,IFEval,0.211876709353405,21.1876709353405,BBH,0.441316185558836,22.3722787911346,MATH Level 5,0.0460725075528701,4.60725075528701,GPQA,0.269295302013423,2.57270693512304,MUSR,0.352416666666667,4.98541666666667,MMLU-PRO,0.24717420212766,16.3526891252955,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-26,2024-06-12,0,TencentARC/MetaMath-Mistral-Pro,apache-2.0,5,8.987,0.600752251790686 TencentARC/Mistral_Pro_8B_v0.1_bfloat16_366f159fc5b314ba2a955209d2bca4600f84dac0_False,TencentARC/Mistral_Pro_8B_v0.1,366f159fc5b314ba2a955209d2bca4600f84dac0,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,14.1953459280213,FALSE,IFEval,0.211452279950531,21.1452279950531,BBH,0.452597596806644,22.894188758768,MATH Level 5,0.0566465256797583,5.66465256797583,GPQA,0.280201342281879,4.0268456375839,MUSR,0.424229166666667,11.8286458333333,MMLU-PRO,0.276512632978723,19.6125147754137,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-22,2024-06-12,0,TencentARC/Mistral_Pro_8B_v0.1,apache-2.0,66,8.987,0.632482282038501 -TheDrummer/Cydonia-22B-v1.2_bfloat16_acd8da5efadc7dc404bb4eeebef2b27b1554a2ca_False,TheDrummer/Cydonia-22B-v1.2,acd8da5efadc7dc404bb4eeebef2b27b1554a2ca,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,28.3998567141722,FALSE,IFEval,0.563511482865464,56.3511482865464,BBH,0.580856074392761,39.9326040658862,MATH Level 5,0.1797583081571,17.97583081571,GPQA,0.330536912751678,10.738255033557,MUSR,0.402177083333333,10.50546875,MMLU-PRO,0.4140625,34.8958333333333,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-07,2024-10-26,0,TheDrummer/Cydonia-22B-v1.2,other,30,22.247,1.62870427503089 +TheDrummer/Cydonia-22B-v1.2_bfloat16_acd8da5efadc7dc404bb4eeebef2b27b1554a2ca_False,TheDrummer/Cydonia-22B-v1.2,acd8da5efadc7dc404bb4eeebef2b27b1554a2ca,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,28.3998567141722,FALSE,IFEval,0.563511482865464,56.3511482865464,BBH,0.580856074392761,39.9326040658862,MATH Level 5,0.1797583081571,17.97583081571,GPQA,0.330536912751678,10.738255033557,MUSR,0.402177083333333,10.50546875,MMLU-PRO,0.4140625,34.8958333333333,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-07,2024-10-26,0,TheDrummer/Cydonia-22B-v1.2,other,31,22.247,1.62870427503089 TheDrummer/Gemmasutra-9B-v1_bfloat16_21591f6a0140e095f1c6668ac7a267f214547609_False,TheDrummer/Gemmasutra-9B-v1,21591f6a0140e095f1c6668ac7a267f214547609,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,22.7360970816177,FALSE,IFEval,0.241551306090063,24.1551306090063,BBH,0.588691424836967,41.2003963172606,MATH Level 5,0.0823262839879154,8.23262839879154,GPQA,0.310402684563758,8.05369127516779,MUSR,0.48459375,20.9408854166667,MMLU-PRO,0.404504654255319,33.8338504728132,FALSE,FALSE,FALSE,FALSE,FALSE,2024-07-17,2024-09-19,1,TheDrummer/Gemmasutra-9B-v1 (Merge),"",23,10.159,2.90381874221704 TheDrummer/Gemmasutra-Mini-2B-v1_bfloat16_c1db4c8f975d3848edbdaf851217039c8dfdaeb5_True,TheDrummer/Gemmasutra-Mini-2B-v1,c1db4c8f975d3848edbdaf851217039c8dfdaeb5,bfloat16,chatmodels,Original,Gemma2ForCausalLM,9.02858758674283,TRUE,IFEval,0.254865977827719,25.4865977827719,BBH,0.357501907914718,9.81033614467704,MATH Level 5,0.0317220543806647,3.17220543806647,GPQA,0.270973154362416,2.79642058165548,MUSR,0.348979166666667,1.1890625,MMLU-PRO,0.205452127659574,11.7169030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-03,2024-10-28,0,TheDrummer/Gemmasutra-Mini-2B-v1,other,51,2.614,1.39795467425649 TheDrummer/Ministrations-8B-v1_bfloat16_39b892de64401ec7990ebb816c4455ba4532bafb_False,TheDrummer/Ministrations-8B-v1,39b892de64401ec7990ebb816c4455ba4532bafb,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,21.1519831969903,FALSE,IFEval,0.282193468884781,28.2193468884781,BBH,0.487663126022514,26.9856373362961,MATH Level 5,0.175981873111782,17.5981873111782,GPQA,0.324664429530201,9.95525727069351,MUSR,0.44490625,14.7799479166667,MMLU-PRO,0.36436170212766,29.3735224586288,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-14,0,TheDrummer/Ministrations-8B-v1,other,16,8.02,0.862555890880867 TheDrummer/Rocinante-12B-v1_bfloat16_74a4ae2584d45655298995198d5ab3e660364a1a_True,TheDrummer/Rocinante-12B-v1,74a4ae2584d45655298995198d5ab3e660364a1a,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,23.6084556646878,TRUE,IFEval,0.607649924422754,60.7649924422754,BBH,0.506545208579745,30.0256540656073,MATH Level 5,0.0657099697885197,6.57099697885197,GPQA,0.291107382550336,5.48098434004475,MUSR,0.40171875,11.2815104166667,MMLU-PRO,0.347739361702128,27.5265957446809,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-14,2024-09-03,0,TheDrummer/Rocinante-12B-v1,other,27,12.248,1.86444159508034 TheDrummer/Tiger-Gemma-9B-v1_float16_e95392c07bab3c483937583c711939ab3f5044dd_True,TheDrummer/Tiger-Gemma-9B-v1,e95392c07bab3c483937583c711939ab3f5044dd,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,27.85031932524,TRUE,IFEval,0.728150197032762,72.8150197032762,BBH,0.570368773932957,37.2205460540878,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.338926174496644,11.8568232662192,MUSR,0.416166666666667,10.4875,MMLU-PRO,0.411818484042553,34.6464982269504,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-12,2025-01-07,0,TheDrummer/Tiger-Gemma-9B-v1,"",37,9.242,1.6204273310299 TheDrummer/Tiger-Gemma-9B-v2_float16_9aea74832c16646c9c4948ccc2e76cb812f3c089_True,TheDrummer/Tiger-Gemma-9B-v2,9aea74832c16646c9c4948ccc2e76cb812f3c089,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,26.8790544482852,TRUE,IFEval,0.698599715421748,69.8599715421748,BBH,0.561719111412178,35.4695405651825,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.339765100671141,11.9686800894855,MUSR,0.408416666666667,9.31875,MMLU-PRO,0.41123670212766,34.5818557919622,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2025-01-07,0,TheDrummer/Tiger-Gemma-9B-v2,"",25,9.242,1.6697989796741 -TheDrummer/Tiger-Gemma-9B-v3_float16_fe32c1926e4057f75ebc2a4a57103564168cdbb7_True,TheDrummer/Tiger-Gemma-9B-v3,fe32c1926e4057f75ebc2a4a57103564168cdbb7,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,26.7668303114656,TRUE,IFEval,0.682063591271161,68.2063591271161,BBH,0.581223155785325,38.8360227319598,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.400354166666667,7.7109375,MMLU-PRO,0.405917553191489,33.9908392434988,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-04,2025-01-07,0,TheDrummer/Tiger-Gemma-9B-v3,"",36,9.242,1.57175316413286 +TheDrummer/Tiger-Gemma-9B-v3_float16_fe32c1926e4057f75ebc2a4a57103564168cdbb7_True,TheDrummer/Tiger-Gemma-9B-v3,fe32c1926e4057f75ebc2a4a57103564168cdbb7,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,26.7668303114656,TRUE,IFEval,0.682063591271161,68.2063591271161,BBH,0.581223155785325,38.8360227319598,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.400354166666667,7.7109375,MMLU-PRO,0.405917553191489,33.9908392434988,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-04,2025-01-07,0,TheDrummer/Tiger-Gemma-9B-v3,"",37,9.242,1.57175316413286 TheDrunkenSnail/Son-of-Rhodia_float16_f855ee46e8c6f187e2885bccdb4dd40a4ec27d94_True,TheDrunkenSnail/Son-of-Rhodia,f855ee46e8c6f187e2885bccdb4dd40a4ec27d94,float16,basemergesandmoerges,Original,MistralForCausalLM,27.0525794587411,TRUE,IFEval,0.704644786943089,70.4644786943089,BBH,0.509732764772552,30.2220572521199,MATH Level 5,0.121601208459215,12.1601208459215,GPQA,0.312919463087248,8.38926174496644,MUSR,0.420291666666667,12.103125,MMLU-PRO,0.36078789893617,28.97643321513,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-31,2024-12-31,1,TheDrunkenSnail/Son-of-Rhodia (Merge),other,2,12.248,0.956210019715665 TheHierophant/Underground-Cognitive-V0.3-test_float16_2753b6f9068ad14efe836cde3160747cd208bf9e_False,TheHierophant/Underground-Cognitive-V0.3-test,2753b6f9068ad14efe836cde3160747cd208bf9e,float16,basemergesandmoerges,Original,LlamaForCausalLM,21.5249230693678,FALSE,IFEval,0.480829753941763,48.0829753941763,BBH,0.529013190099805,33.665101982715,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.298657718120805,6.48769574944072,MUSR,0.435114583333333,14.5559895833333,MMLU-PRO,0.331781914893617,25.7535460992908,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-22,2024-11-22,1,TheHierophant/Underground-Cognitive-V0.3-test (Merge),"",0,10.732,0.586581230652599 TheTsar1209/nemo-carpmuscle-v0.1_float16_84d20db8220014958ff157047b2216910637ae39_False,TheTsar1209/nemo-carpmuscle-v0.1,84d20db8220014958ff157047b2216910637ae39,float16,chatmodels,Original,MistralForCausalLM,16.7063721996565,FALSE,IFEval,0.227563974698245,22.7563974698245,BBH,0.508352969710139,30.0349957834341,MATH Level 5,0.0422960725075529,4.22960725075529,GPQA,0.296979865771812,6.26398210290828,MUSR,0.4135,10.2208333333333,MMLU-PRO,0.340591755319149,26.7324172576832,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-15,2024-10-10,1,unsloth/Mistral-Nemo-Base-2407-bnb-4bit,apache-2.0,1,12.248,1.80844038535292 @@ -1171,7 +1174,7 @@ Tijmen2/cosmosage-v3_bfloat16_e6d4b4e6868fcf113ab5261d71c7214a1f7fbb0c_True,Tijm TinyLlama/TinyLlama-1.1B-Chat-v0.1_float16_7abc14e7779eabc3a028bc695342869d0410dea2_False,TinyLlama/TinyLlama-1.1B-Chat-v0.1,7abc14e7779eabc3a028bc695342869d0410dea2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,3.85687240027727,FALSE,IFEval,0.147854359765422,14.7854359765422,BBH,0.308352947486801,3.36301067393934,MATH Level 5,0,0,GPQA,0.229026845637584,0,MUSR,0.359239583333333,3.90494791666667,MMLU-PRO,0.109790558510638,1.08783983451537,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-16,2024-12-02,0,TinyLlama/TinyLlama-1.1B-Chat-v0.1,apache-2.0,53,1.1,0.0910952097470587 TinyLlama/TinyLlama-1.1B-Chat-v0.5_bfloat16_5c9e70dd07f5234bf6bf6a2425fffeecd5a6020b_False,TinyLlama/TinyLlama-1.1B-Chat-v0.5,5c9e70dd07f5234bf6bf6a2425fffeecd5a6020b,bfloat16,chatmodels,Original,LlamaForCausalLM,4.07581143646604,FALSE,IFEval,0.163366534129443,16.3366534129443,BBH,0.31050469159357,3.40769093756971,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.248322147651007,0,MUSR,0.366125,3.565625,MMLU-PRO,0.109624335106383,1.06937056737589,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-20,2024-10-23,0,TinyLlama/TinyLlama-1.1B-Chat-v0.5,apache-2.0,8,1.1,0.0949638317549067 TinyLlama/TinyLlama-1.1B-Chat-v0.6_bfloat16_bf9ae1c8bf026667e6f810768de259bb4a7f4777_True,TinyLlama/TinyLlama-1.1B-Chat-v0.6,bf9ae1c8bf026667e6f810768de259bb4a7f4777,bfloat16,chatmodels,Original,LlamaForCausalLM,4.09286641277805,TRUE,IFEval,0.157421197976923,15.7421197976923,BBH,0.306697665616683,3.39037070951253,MATH Level 5,0.00377643504531722,0.377643504531722,GPQA,0.258389261744966,1.11856823266219,MUSR,0.34221875,2.27734375,MMLU-PRO,0.114860372340426,1.6511524822695,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-20,2024-10-23,0,TinyLlama/TinyLlama-1.1B-Chat-v0.6,apache-2.0,92,1.1,0.430347260938312 -TinyLlama/TinyLlama-1.1B-Chat-v1.0_float16_fe8a4ea1ffedaf415f4da2f062534de366a451e6_False,TinyLlama/TinyLlama-1.1B-Chat-v1.0,fe8a4ea1ffedaf415f4da2f062534de366a451e6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.71815455158305,FALSE,IFEval,0.0595763684800773,5.95763684800773,BBH,0.310356286749101,4.0133968484868,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.25,0,MUSR,0.351520833333333,4.30677083333334,MMLU-PRO,0.110123005319149,1.12477836879433,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-30,2024-08-04,0,TinyLlama/TinyLlama-1.1B-Chat-v1.0,apache-2.0,1115,1.1,0.268441454812413 +TinyLlama/TinyLlama-1.1B-Chat-v1.0_float16_fe8a4ea1ffedaf415f4da2f062534de366a451e6_False,TinyLlama/TinyLlama-1.1B-Chat-v1.0,fe8a4ea1ffedaf415f4da2f062534de366a451e6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.71815455158305,FALSE,IFEval,0.0595763684800773,5.95763684800773,BBH,0.310356286749101,4.0133968484868,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.25,0,MUSR,0.351520833333333,4.30677083333334,MMLU-PRO,0.110123005319149,1.12477836879433,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-30,2024-08-04,0,TinyLlama/TinyLlama-1.1B-Chat-v1.0,apache-2.0,1116,1.1,0.268441454812413 TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T_bfloat16_59f6f375b26bde864a6ca194a9a3044570490064_False,TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T,59f6f375b26bde864a6ca194a9a3044570490064,bfloat16,pretrained,Original,LlamaForCausalLM,5.16737751670247,FALSE,IFEval,0.227663710067066,22.7663710067067,BBH,0.307118843826727,3.54709338950808,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.25251677852349,0.335570469798655,MUSR,0.33803125,2.18723958333333,MMLU-PRO,0.112034574468085,1.33717494089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-28,2024-11-27,0,TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T,apache-2.0,164,1.1,0.165797879432131 TinyLlama/TinyLlama_v1.1_bfloat16_ff3c701f2424c7625fdefb9dd470f45ef18b02d6_False,TinyLlama/TinyLlama_v1.1,ff3c701f2424c7625fdefb9dd470f45ef18b02d6,bfloat16,pretrained,Original,LlamaForCausalLM,4.72384891003899,FALSE,IFEval,0.200061392660363,20.0061392660363,BBH,0.302370180450761,3.21030104971281,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.245805369127517,0,MUSR,0.36996875,3.97942708333333,MMLU-PRO,0.104886968085106,0.542996453900708,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-09,2024-06-12,0,TinyLlama/TinyLlama_v1.1,apache-2.0,80,1.1,0.248928618602363 Trappu/Magnum-Picaro-0.7-v2-12b_bfloat16_2ffc46cde49eb823f5588990bd6b848cd505271e_False,Trappu/Magnum-Picaro-0.7-v2-12b,2ffc46cde49eb823f5588990bd6b848cd505271e,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.4783017974636,FALSE,IFEval,0.300278815764394,30.0278815764394,BBH,0.550666191882885,35.7462331985544,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.322986577181208,9.73154362416107,MUSR,0.47271875,19.5565104166667,MMLU-PRO,0.358045212765957,28.6716903073286,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-11,2024-09-12,1,Trappu/Magnum-Picaro-0.7-v2-12b (Merge),apache-2.0,7,12.248,1.67495885513732 @@ -1246,7 +1249,7 @@ Xclbr7/Arcanum-12b_float16_845ac67d2b527296ae8c06da4453bf8a60f2e59b_False,Xclbr7 Xclbr7/Hyena-12b_bfloat16_9dd5eb77ce8e0e05e260ae4d812631fb980527fa_False,Xclbr7/Hyena-12b,9dd5eb77ce8e0e05e260ae4d812631fb980527fa,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,20.4372430816883,FALSE,IFEval,0.340445573301063,34.0445573301063,BBH,0.545718241546832,34.665648637656,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.297818791946309,6.3758389261745,MUSR,0.398427083333333,11.0700520833333,MMLU-PRO,0.343916223404255,27.1018026004728,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-19,2024-09-19,1,Xclbr7/Arcanum-12b,apache-2.0,1,12.248,1.85989339645317 Xclbr7/caliburn-12b_float16_f76fa67c7ca8bf7e75540baf55972ba52a46630b_False,Xclbr7/caliburn-12b,f76fa67c7ca8bf7e75540baf55972ba52a46630b,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,22.8083953347745,FALSE,IFEval,0.357631085519754,35.7631085519754,BBH,0.551863030023181,35.6368405675633,MATH Level 5,0.104229607250755,10.4229607250755,GPQA,0.336409395973154,11.5212527964206,MUSR,0.4291875,13.7817708333333,MMLU-PRO,0.367519946808511,29.724438534279,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-14,2024-09-14,0,Xclbr7/caliburn-12b,mit,0,12.248,1.85622045538097 Xclbr7/caliburn-v2-12b_float16_fa736b3b852298dd8c047ac6dcc620161df4a79b_False,Xclbr7/caliburn-v2-12b,fa736b3b852298dd8c047ac6dcc620161df4a79b,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,20.9535249528062,FALSE,IFEval,0.296681693462236,29.6681693462236,BBH,0.514142612509764,30.3879669463972,MATH Level 5,0.104229607250755,10.4229607250755,GPQA,0.326342281879195,10.1789709172259,MUSR,0.43703125,14.12890625,MMLU-PRO,0.378407579787234,30.9341755319149,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-16,2024-09-16,0,Xclbr7/caliburn-v2-12b,mit,0,12.248,1.63219374817133 -Xkev/Llama-3.2V-11B-cot_float16_86d718ed524bf79320497bc2029e835af3b9bcc4_False,Xkev/Llama-3.2V-11B-cot,86d718ed524bf79320497bc2029e835af3b9bcc4,float16,multimodal,Original,MllamaForConditionalGeneration,21.7212647920112,FALSE,IFEval,0.415808942494803,41.5808942494803,BBH,0.495871783411897,28.2467615530034,MATH Level 5,0.153323262839879,15.3323262839879,GPQA,0.295302013422819,6.04026845637584,MUSR,0.415854166666667,10.3817708333333,MMLU-PRO,0.358710106382979,28.7455673758865,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-12-26,1,Xkev/Llama-3.2V-11B-cot (Merge),apache-2.0,138,10.67,0.711610361039194 +Xkev/Llama-3.2V-11B-cot_float16_86d718ed524bf79320497bc2029e835af3b9bcc4_False,Xkev/Llama-3.2V-11B-cot,86d718ed524bf79320497bc2029e835af3b9bcc4,float16,multimodal,Original,MllamaForConditionalGeneration,21.7212647920112,FALSE,IFEval,0.415808942494803,41.5808942494803,BBH,0.495871783411897,28.2467615530034,MATH Level 5,0.153323262839879,15.3323262839879,GPQA,0.295302013422819,6.04026845637584,MUSR,0.415854166666667,10.3817708333333,MMLU-PRO,0.358710106382979,28.7455673758865,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-12-26,1,Xkev/Llama-3.2V-11B-cot (Merge),apache-2.0,139,10.67,0.711610361039194 Yash21/TinyYi-7B-Test_float16_7750e5de73fbcf1dcc0832b4cdabaa9713c20475_False,Yash21/TinyYi-7B-Test,7750e5de73fbcf1dcc0832b4cdabaa9713c20475,float16,pretrained,Original,LlamaForCausalLM,4.49516729496769,FALSE,IFEval,0.185648523694907,18.5648523694907,BBH,0.290980078012147,2.26796638883226,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.336447916666667,3.22265625,MMLU-PRO,0.109125664893617,1.01396276595745,TRUE,TRUE,FALSE,FALSE,FALSE,2024-01-06,2024-07-03,0,Yash21/TinyYi-7B-Test,apache-2.0,0,6.061,0.763109094577256 Youlln/1PARAMMYL-8B-ModelStock_bfloat16_4ce556da5ccd1ecac8d0f3e1e94d1982f11b910d_False,Youlln/1PARAMMYL-8B-ModelStock,4ce556da5ccd1ecac8d0f3e1e94d1982f11b910d,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,26.2839753599299,FALSE,IFEval,0.537133694153734,53.7133694153734,BBH,0.521583966355513,31.7999511933277,MATH Level 5,0.147280966767372,14.7280966767372,GPQA,0.323825503355705,9.84340044742729,MUSR,0.4409375,14.2838541666667,MMLU-PRO,0.400016622340426,33.3351802600473,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-20,1,Youlln/1PARAMMYL-8B-ModelStock (Merge),"",0,8.03,0.892521845193913 Youlln/2PRYMMAL-Yi1.5-6B-SLERP_bfloat16_b776bd3ce6784b96ff928b1d5ad51b2991909f2c_False,Youlln/2PRYMMAL-Yi1.5-6B-SLERP,b776bd3ce6784b96ff928b1d5ad51b2991909f2c,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,18.9792231413585,FALSE,IFEval,0.282593518530832,28.2593518530832,BBH,0.466475042917107,24.4956444207091,MATH Level 5,0.112537764350453,11.2537764350453,GPQA,0.307046979865772,7.60626398210291,MUSR,0.475604166666667,18.1505208333333,MMLU-PRO,0.316988031914894,24.1097813238771,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-22,2024-09-23,1,Youlln/2PRYMMAL-Yi1.5-6B-SLERP (Merge),apache-2.0,0,6.061,1.38317707881205 @@ -1314,7 +1317,7 @@ allenai/Llama-3.1-Tulu-3-8B-DPO_bfloat16_002347006131d85678ea3865520bc9caad69869 allenai/Llama-3.1-Tulu-3-8B-RM_bfloat16_76247c00745747f820f1712949b5b37901d0f9c4_True,allenai/Llama-3.1-Tulu-3-8B-RM,76247c00745747f820f1712949b5b37901d0f9c4,bfloat16,chatmodels,Original,LlamaForSequenceClassification,4.23505701818803,TRUE,IFEval,0.167013524116012,16.7013524116012,BBH,0.29500411474705,2.64966998137355,MATH Level 5,0,0,GPQA,0.256711409395973,0.894854586129753,MUSR,0.376416666666667,4.25208333333334,MMLU-PRO,0.108211436170213,0.912381796690307,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-22,1,allenai/Llama-3.1-Tulu-3-8B-RM (Merge),llama3.1,10,8,0.73689906762706 allenai/Llama-3.1-Tulu-3-8B-SFT_bfloat16_4ddd761e6750e04ea3d468175f78463628bba860_True,allenai/Llama-3.1-Tulu-3-8B-SFT,4ddd761e6750e04ea3d468175f78463628bba860,bfloat16,chatmodels,Original,LlamaForCausalLM,22.5339999676641,TRUE,IFEval,0.740340075444266,74.0340075444266,BBH,0.387186327050165,13.9312081682626,MATH Level 5,0.11404833836858,11.404833836858,GPQA,0.277684563758389,3.69127516778523,MUSR,0.426770833333333,12.0130208333333,MMLU-PRO,0.281166888297872,20.1296542553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-18,2024-11-22,1,allenai/Llama-3.1-Tulu-3-8B-SFT (Merge),llama3.1,16,8.03,0.683246279517383 allenai/OLMo-1B-hf_bfloat16_8e995430edd24416ccfa98b5b283fa07b0c9f1a9_False,allenai/OLMo-1B-hf,8e995430edd24416ccfa98b5b283fa07b0c9f1a9,bfloat16,pretrained,Original,OlmoForCausalLM,6.47027844039243,FALSE,IFEval,0.218196607224387,21.8196607224387,BBH,0.305194689884293,3.19654631243032,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.261744966442953,1.56599552572707,MUSR,0.40978125,9.55598958333333,MMLU-PRO,0.117353723404255,1.9281914893617,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-12,2024-06-12,0,allenai/OLMo-1B-hf,apache-2.0,18,1.177,0.248873749951744 -allenai/OLMo-2-1124-7B-Instruct_float16_470b1fba1ae01581f270116362ee4aa1b97f4c84_True,allenai/OLMo-2-1124-7B-Instruct,470b1fba1ae01581f270116362ee4aa1b97f4c84,float16,chatmodels,Original,Olmo2ForCausalLM,20.3256354495595,TRUE,IFEval,0.724403471677372,72.4403471677372,BBH,0.402236024744178,16.3267729495518,MATH Level 5,0.061178247734139,6.1178247734139,GPQA,0.278523489932886,3.80313199105145,MUSR,0.350833333333333,4.6875,MMLU-PRO,0.267204122340426,18.5782358156028,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-18,2025-01-07,1,allenai/OLMo-2-1124-7B-Instruct (Merge),apache-2.0,15,7.299,0.817944946577781 +allenai/OLMo-2-1124-7B-Instruct_float16_470b1fba1ae01581f270116362ee4aa1b97f4c84_True,allenai/OLMo-2-1124-7B-Instruct,470b1fba1ae01581f270116362ee4aa1b97f4c84,float16,chatmodels,Original,Olmo2ForCausalLM,20.3256354495595,TRUE,IFEval,0.724403471677372,72.4403471677372,BBH,0.402236024744178,16.3267729495518,MATH Level 5,0.061178247734139,6.1178247734139,GPQA,0.278523489932886,3.80313199105145,MUSR,0.350833333333333,4.6875,MMLU-PRO,0.267204122340426,18.5782358156028,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-18,2025-01-07,1,allenai/OLMo-2-1124-7B-Instruct (Merge),apache-2.0,17,7.299,0.817944946577781 allenai/OLMo-7B-Instruct-hf_bfloat16_2ea947518df93433aa71219f29b36c72ac63be95_True,allenai/OLMo-7B-Instruct-hf,2ea947518df93433aa71219f29b36c72ac63be95,bfloat16,chatmodels,Original,OlmoForCausalLM,10.7608566037124,TRUE,IFEval,0.347265256186917,34.7265256186917,BBH,0.370646986666272,13.159933415267,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.270973154362416,2.79642058165548,MUSR,0.376479166666667,4.3265625,MMLU-PRO,0.178523936170213,8.72488179669031,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-04,2024-06-27,0,allenai/OLMo-7B-Instruct-hf,apache-2.0,3,7,1.19995072912062 allenai/OLMo-7B-hf_bfloat16_687d934d36a05417048d0fe7482f24f389fef6aa_False,allenai/OLMo-7B-hf,687d934d36a05417048d0fe7482f24f389fef6aa,bfloat16,pretrained,Original,OlmoForCausalLM,6.77615120977129,FALSE,IFEval,0.271927374920766,27.1927374920766,BBH,0.327913165873623,5.76198704108083,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.272651006711409,3.02013422818792,MUSR,0.348666666666667,2.08333333333333,MMLU-PRO,0.117270611702128,1.91895685579196,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-12,2024-06-27,0,allenai/OLMo-7B-hf,apache-2.0,14,6.888,0.590564158425061 allenai/OLMoE-1B-7B-0924_bfloat16_4fa3a6e09ed0e41639962f38bfba0fc532b90075_False,allenai/OLMoE-1B-7B-0924,4fa3a6e09ed0e41639962f38bfba0fc532b90075,bfloat16,pretrained,Original,OlmoeForCausalLM,7.17846378604139,FALSE,IFEval,0.218471433574028,21.8471433574028,BBH,0.339343793117734,8.30810689489578,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.24748322147651,0,MUSR,0.348791666666667,3.565625,MMLU-PRO,0.173952792553192,8.21697695035461,TRUE,FALSE,TRUE,FALSE,TRUE,2024-07-20,2024-09-30,0,allenai/OLMoE-1B-7B-0924,apache-2.0,109,6.919,3.07640711692468 @@ -1427,7 +1430,7 @@ anthracite-org/magnum-v2.5-12b-kto_float16_aee0374e5a43e950c9977b0004dede1c57be2 anthracite-org/magnum-v3-27b-kto_bfloat16_96fbb750b3150e5fe9d6d2fcf757f49310d99a43_True,anthracite-org/magnum-v3-27b-kto,96fbb750b3150e5fe9d6d2fcf757f49310d99a43,bfloat16,chatmodels,Original,Gemma2ForCausalLM,29.0979057982708,TRUE,IFEval,0.567483166886085,56.7483166886085,BBH,0.586040577894583,41.1601029248443,MATH Level 5,0.166918429003021,16.6918429003021,GPQA,0.355704697986577,14.0939597315436,MUSR,0.38546875,9.91692708333333,MMLU-PRO,0.423786569148936,35.9762854609929,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-06,2024-09-15,1,anthracite-org/magnum-v3-27b-kto (Merge),gemma,12,27.227,3.93753396148653 anthracite-org/magnum-v3-34b_bfloat16_3bcd8c3dbb93021a5ce22203c690a1a084cafb73_True,anthracite-org/magnum-v3-34b,3bcd8c3dbb93021a5ce22203c690a1a084cafb73,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,29.6660813345297,TRUE,IFEval,0.511529408635753,51.1529408635753,BBH,0.608782869208523,44.3279034146296,MATH Level 5,0.194864048338369,19.4864048338369,GPQA,0.360738255033557,14.7651006711409,MUSR,0.387239583333333,6.57161458333334,MMLU-PRO,0.475232712765958,41.692523640662,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-22,2024-09-18,0,anthracite-org/magnum-v3-34b,apache-2.0,29,34.389,6.18930955707639 anthracite-org/magnum-v3-9b-chatml_bfloat16_96c2d023c56ef73be095ffbae8cedd7243ebca84_False,anthracite-org/magnum-v3-9b-chatml,96c2d023c56ef73be095ffbae8cedd7243ebca84,bfloat16,chatmodels,Original,Gemma2ForCausalLM,19.4159995515446,FALSE,IFEval,0.127470666719859,12.7470666719859,BBH,0.54276884888871,35.3178754123854,MATH Level 5,0.0641993957703927,6.41993957703927,GPQA,0.345637583892617,12.751677852349,MUSR,0.443229166666667,13.2369791666667,MMLU-PRO,0.424202127659575,36.0224586288416,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-27,2024-09-18,1,IntervitensInc/gemma-2-9b-chatml,gemma,24,9.242,2.88996530498741 -anthracite-org/magnum-v3-9b-customgemma2_bfloat16_9a7cd3d47434bed2bd80e34e45c74e413f8baaa8_False,anthracite-org/magnum-v3-9b-customgemma2,9a7cd3d47434bed2bd80e34e45c74e413f8baaa8,bfloat16,chatmodels,Original,Gemma2ForCausalLM,19.1373265419411,FALSE,IFEval,0.127295575739039,12.7295575739039,BBH,0.534013693691617,34.1167833409438,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.328859060402685,10.5145413870246,MUSR,0.45646875,15.05859375,MMLU-PRO,0.42046210106383,35.6069001182033,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-27,2024-09-18,1,google/gemma-2-9b,gemma,18,9.242,2.90182501706176 +anthracite-org/magnum-v3-9b-customgemma2_bfloat16_9a7cd3d47434bed2bd80e34e45c74e413f8baaa8_False,anthracite-org/magnum-v3-9b-customgemma2,9a7cd3d47434bed2bd80e34e45c74e413f8baaa8,bfloat16,chatmodels,Original,Gemma2ForCausalLM,19.1373265419411,FALSE,IFEval,0.127295575739039,12.7295575739039,BBH,0.534013693691617,34.1167833409438,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.328859060402685,10.5145413870246,MUSR,0.45646875,15.05859375,MMLU-PRO,0.42046210106383,35.6069001182033,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-27,2024-09-18,1,google/gemma-2-9b,gemma,19,9.242,2.90182501706176 anthracite-org/magnum-v4-12b_bfloat16_704f2ccfe662052e415499e56789dd88ec01a113_False,anthracite-org/magnum-v4-12b,704f2ccfe662052e415499e56789dd88ec01a113,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.949135830507,FALSE,IFEval,0.339296400218088,33.9296400218088,BBH,0.517669304659192,30.5039022664848,MATH Level 5,0.0981873111782477,9.81873111782477,GPQA,0.296140939597315,6.15212527964205,MUSR,0.40928125,10.36015625,MMLU-PRO,0.360372340425532,28.9302600472813,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-23,0,anthracite-org/magnum-v4-12b,apache-2.0,37,12.248,1.69901572897805 anthracite-org/magnum-v4-22b_bfloat16_e5239e71d2628269b453a832de98c1ecb79d2557_False,anthracite-org/magnum-v4-22b,e5239e71d2628269b453a832de98c1ecb79d2557,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,27.7159004280105,FALSE,IFEval,0.56286209479736,56.286209479736,BBH,0.548612004937422,35.5491485327735,MATH Level 5,0.191842900302115,19.1842900302115,GPQA,0.328020134228188,10.4026845637584,MUSR,0.44078125,13.4309895833333,MMLU-PRO,0.382978723404255,31.4420803782506,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-23,0,anthracite-org/magnum-v4-22b,other,17,22.247,1.65029003573429 anthracite-org/magnum-v4-27b_bfloat16_50a14716bdeb6a9376b9377df31ab1497864f3f9_False,anthracite-org/magnum-v4-27b,50a14716bdeb6a9376b9377df31ab1497864f3f9,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,26.3308890010956,FALSE,IFEval,0.345416827351428,34.5416827351428,BBH,0.586729810989139,40.9603843335009,MATH Level 5,0.161631419939577,16.1631419939577,GPQA,0.36996644295302,15.9955257270693,MUSR,0.437989583333333,12.8153645833333,MMLU-PRO,0.437583111702128,37.5092346335697,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-23,0,anthracite-org/magnum-v4-27b,gemma,13,27.227,5.73635389356619 @@ -1442,7 +1445,7 @@ arcee-ai/Llama-3.1-SuperNova-Lite_bfloat16_76246ca4448c1a11787daee0958b60ab27f17 arcee-ai/Llama-Spark_bfloat16_6d74a617fbb17a1ada08528f2673c89f84fb062e_True,arcee-ai/Llama-Spark,6d74a617fbb17a1ada08528f2673c89f84fb062e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.9224332761527,TRUE,IFEval,0.791073241222179,79.1073241222179,BBH,0.505350414574998,29.7702537002086,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.299496644295302,6.59955257270694,MUSR,0.359333333333333,2.61666666666667,MMLU-PRO,0.372091090425532,30.2323433806147,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-08-08,0,arcee-ai/Llama-Spark,llama3,27,8.03,0.830714101745732 arcee-ai/SuperNova-Medius_bfloat16_e34fafcac2801be1ae5c7eb744e191a08119f2af_True,arcee-ai/SuperNova-Medius,e34fafcac2801be1ae5c7eb744e191a08119f2af,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,33.8924710529695,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.637728446311571,48.0050146271633,MATH Level 5,0.153323262839879,15.3323262839879,GPQA,0.333053691275168,11.0738255033557,MUSR,0.423270833333333,12.2755208333333,MMLU-PRO,0.503490691489362,44.8322990543735,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-02,2024-10-22,1,arcee-ai/SuperNova-Medius (Merge),apache-2.0,202,14.77,5.86781166745177 arcee-ai/Virtuoso-Small_bfloat16_ca5dec1c6351ba6f2f0c59e609b94628a29c1459_True,arcee-ai/Virtuoso-Small,ca5dec1c6351ba6f2f0c59e609b94628a29c1459,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,39.4283232965703,TRUE,IFEval,0.793521190441362,79.3521190441362,BBH,0.651763312945478,50.3998463118999,MATH Level 5,0.342900302114804,34.2900302114804,GPQA,0.336409395973154,11.5212527964206,MUSR,0.43390625,14.43828125,MMLU-PRO,0.519115691489362,46.5684101654846,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-03,1,arcee-ai/Virtuoso-Small (Merge),apache-2.0,45,14.77,1.51431412160642 -arcee-ai/raspberry-3B_bfloat16_66bf1346c060bbfe1f1b98cd22e7a26ada69cf70_True,arcee-ai/raspberry-3B,66bf1346c060bbfe1f1b98cd22e7a26ada69cf70,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,15.5380031214432,TRUE,IFEval,0.315416428409952,31.5416428409952,BBH,0.42689280188827,19.5282344009925,MATH Level 5,0.0845921450151058,8.45921450151058,GPQA,0.277684563758389,3.69127516778523,MUSR,0.412322916666667,9.40703125,MMLU-PRO,0.285405585106383,20.6006205673759,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-05,2024-10-07,1,Qwen/Qwen2.5-3B,other,37,3.086,1.03652651773508 +arcee-ai/raspberry-3B_bfloat16_66bf1346c060bbfe1f1b98cd22e7a26ada69cf70_True,arcee-ai/raspberry-3B,66bf1346c060bbfe1f1b98cd22e7a26ada69cf70,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,15.5380031214432,TRUE,IFEval,0.315416428409952,31.5416428409952,BBH,0.42689280188827,19.5282344009925,MATH Level 5,0.0845921450151058,8.45921450151058,GPQA,0.277684563758389,3.69127516778523,MUSR,0.412322916666667,9.40703125,MMLU-PRO,0.285405585106383,20.6006205673759,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-05,2024-10-07,1,Qwen/Qwen2.5-3B,other,38,3.086,1.03652651773508 argilla/notus-7b-v1_bfloat16_30172203a2d41cb487bf7e2b92a821080783b2c9_True,argilla/notus-7b-v1,30172203a2d41cb487bf7e2b92a821080783b2c9,bfloat16,chatmodels,Original,MistralForCausalLM,18.4113211888546,TRUE,IFEval,0.508207112683236,50.8207112683236,BBH,0.45118574073815,22.7471119611614,MATH Level 5,0.0279456193353474,2.79456193353474,GPQA,0.289429530201342,5.2572706935123,MUSR,0.336416666666667,6.58541666666667,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-16,2024-06-27,2,mistralai/Mistral-7B-v0.1,mit,122,7.242,0.667908131155709 argilla/notux-8x7b-v1_bfloat16_0b29f9afcbae2ab4c5085638d8f5a7f6d44c6b17_True,argilla/notux-8x7b-v1,0b29f9afcbae2ab4c5085638d8f5a7f6d44c6b17,bfloat16,chatmodels,Original,MixtralForCausalLM,24.4282310956467,TRUE,IFEval,0.542229063329743,54.2229063329743,BBH,0.536330416451635,34.7580616829018,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.308724832214765,7.82997762863535,MUSR,0.41759375,10.5325520833333,MMLU-PRO,0.366023936170213,29.5582151300237,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-12,2024-06-12,2,mistralai/Mixtral-8x7B-v0.1,apache-2.0,165,46.703,21.3908445719779 argilla-warehouse/Llama-3.1-8B-MagPie-Ultra_bfloat16_1e12f20ca5db84f65a6db793a65100433aac0ac6_True,argilla-warehouse/Llama-3.1-8B-MagPie-Ultra,1e12f20ca5db84f65a6db793a65100433aac0ac6,bfloat16,chatmodels,Original,LlamaForCausalLM,19.4587597172733,TRUE,IFEval,0.575651493592557,57.5651493592557,BBH,0.461961346344686,23.5163103648276,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.266778523489933,2.23713646532438,MUSR,0.35425,4.24791666666667,MMLU-PRO,0.314411569148936,23.8235076832151,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-26,2024-09-30,1,meta-llama/Llama-3.1-8B,llama3.1,1,8.03,0.965677051991664 @@ -1496,7 +1499,7 @@ bfuzzy1/acheron-d_float16_337fc6d265062b22b368debdf42deb10af58b25e_False,bfuzzy1 bfuzzy1/llambses-1_float16_73d190c1726f22de8bb1be333d93cfeebb550984_True,bfuzzy1/llambses-1,73d190c1726f22de8bb1be333d93cfeebb550984,float16,basemergesandmoerges,Adapter,?,19.8118967247516,TRUE,IFEval,0.355383715208979,35.5383715208979,BBH,0.504697740517562,31.0778330887394,MATH Level 5,0.0672205438066465,6.72205438066465,GPQA,0.297818791946309,6.3758389261745,MUSR,0.45290625,15.3799479166667,MMLU-PRO,0.313996010638298,23.7773345153664,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-10,2024-10-10,1,bfuzzy1/llambses-1 (Merge),apache-2.0,0,7.242,0.468291696377507 bhuvneshsaini/merged_model_float16_35d045ae54b9bdf334b1c28becd85746cf4e9a38_False,bhuvneshsaini/merged_model,35d045ae54b9bdf334b1c28becd85746cf4e9a38,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,5.79574882820239,FALSE,IFEval,0.181276790028236,18.1276790028236,BBH,0.335977794907124,7.61738688305735,MATH Level 5,0,0,GPQA,0.25,0,MUSR,0.34971875,4.08151041666667,MMLU-PRO,0.14453125,4.94791666666667,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-13,2024-12-17,0,bhuvneshsaini/merged_model,mit,0,4.715,0.358215883478623 bigcode/starcoder2-15b_bfloat16_46d44742909c03ac8cee08eb03fdebce02e193ec_False,bigcode/starcoder2-15b,46d44742909c03ac8cee08eb03fdebce02e193ec,bfloat16,pretrained,Original,Starcoder2ForCausalLM,12.5517635384636,FALSE,IFEval,0.278022314126518,27.8022314126518,BBH,0.444795784123044,20.3735407526785,MATH Level 5,0.0604229607250755,6.04229607250755,GPQA,0.273489932885906,3.13199105145414,MUSR,0.35009375,2.92838541666667,MMLU-PRO,0.235289228723404,15.0321365248227,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-20,2024-06-09,0,bigcode/starcoder2-15b,bigcode-openrail-m,579,15.958,35.0445477497081 -bigcode/starcoder2-3b_bfloat16_733247c55e3f73af49ce8e9c7949bf14af205928_False,bigcode/starcoder2-3b,733247c55e3f73af49ce8e9c7949bf14af205928,bfloat16,pretrained,Original,Starcoder2ForCausalLM,6.53655950956181,FALSE,IFEval,0.203708382646932,20.3708382646932,BBH,0.350871413846018,8.90929942108357,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.244127516778523,0,MUSR,0.343458333333333,1.43229166666667,MMLU-PRO,0.163646941489362,7.07188238770686,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-29,2024-06-09,0,bigcode/starcoder2-3b,bigcode-openrail-m,155,3.03,0.446628918326529 +bigcode/starcoder2-3b_bfloat16_733247c55e3f73af49ce8e9c7949bf14af205928_False,bigcode/starcoder2-3b,733247c55e3f73af49ce8e9c7949bf14af205928,bfloat16,pretrained,Original,Starcoder2ForCausalLM,6.53655950956181,FALSE,IFEval,0.203708382646932,20.3708382646932,BBH,0.350871413846018,8.90929942108357,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.244127516778523,0,MUSR,0.343458333333333,1.43229166666667,MMLU-PRO,0.163646941489362,7.07188238770686,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-29,2024-06-09,0,bigcode/starcoder2-3b,bigcode-openrail-m,156,3.03,0.446628918326529 bigcode/starcoder2-7b_bfloat16_a3d33687b51284b528abeb17830776ffd24892a9_False,bigcode/starcoder2-7b,a3d33687b51284b528abeb17830776ffd24892a9,bfloat16,pretrained,Original,Starcoder2ForCausalLM,8.25567402602663,FALSE,IFEval,0.220919382793211,22.0919382793211,BBH,0.36609857669123,11.3951101065034,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.251677852348993,0.223713646532442,MUSR,0.379333333333333,5.81666666666667,MMLU-PRO,0.164228723404255,7.13652482269503,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-20,2024-06-09,0,bigcode/starcoder2-7b,bigcode-openrail-m,164,7.174,0.506401378527561 bigscience/bloom-1b1_bfloat16_eb3dd7399312f5f94fd13f41d2f318117d3eb1e4_False,bigscience/bloom-1b1,eb3dd7399312f5f94fd13f41d2f318117d3eb1e4,bfloat16,pretrained,Original,BloomForCausalLM,3.96221529197984,FALSE,IFEval,0.137337819208589,13.7337819208589,BBH,0.310727623773704,4.04270526926013,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.259228187919463,1.23042505592841,MUSR,0.37,3.41666666666667,MMLU-PRO,0.11078789893617,1.19865543735224,TRUE,FALSE,FALSE,FALSE,TRUE,2022-05-19,2024-06-13,0,bigscience/bloom-1b1,bigscience-bloom-rail-1.0,62,1.065,0.717021357543704 bigscience/bloom-1b7_bfloat16_cc72a88036c2fb937d65efeacc57a0c2ef5d6fe5_False,bigscience/bloom-1b7,cc72a88036c2fb937d65efeacc57a0c2ef5d6fe5,bfloat16,pretrained,Original,BloomForCausalLM,3.97122577983585,FALSE,IFEval,0.104389686033059,10.4389686033059,BBH,0.314054919904072,4.39745292760164,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.258389261744966,1.11856823266219,MUSR,0.388572916666667,6.83828125,MMLU-PRO,0.108626994680851,0.958554964539006,TRUE,FALSE,FALSE,FALSE,TRUE,2022-05-19,2024-06-13,0,bigscience/bloom-1b7,bigscience-bloom-rail-1.0,120,1.722,0.81835959878956 @@ -1562,7 +1565,7 @@ cloudyu/Yi-34Bx2-MoE-60B-DPO_bfloat16_5c2d31042229ee06246064100b781dd926cb0ffd_T cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-ipo_bfloat16_eb04613997875935cb667a517e518874bb716169_False,cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-ipo,eb04613997875935cb667a517e518874bb716169,bfloat16,chatmodels,Adapter,?,9.74964763156676,FALSE,IFEval,0.132666879435454,13.2666879435454,BBH,0.380021930319135,12.6694782230036,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.263422818791946,1.78970917225951,MUSR,0.43321875,12.4190104166667,MMLU-PRO,0.259059175531915,17.6732417257683,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-14,2024-11-15,1,cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-ipo (Merge),apache-2.0,0,8.03,0.719830889824629 cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-sigmoid_bfloat16_2c8b52e8db11a6ff57cccf890ee26688e858f9fb_False,cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-sigmoid,2c8b52e8db11a6ff57cccf890ee26688e858f9fb,bfloat16,chatmodels,Adapter,?,9.74340804431023,FALSE,IFEval,0.13184240038653,13.184240038653,BBH,0.378890160329037,12.7573252061306,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.268456375838926,2.46085011185682,MUSR,0.430552083333333,12.0190104166667,MMLU-PRO,0.256233377659575,17.3592641843972,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-15,2024-11-15,1,cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-sigmoid (Merge),apache-2.0,0,8.03,0.723560164735406 cluebbers/Llama-3.1-8B-paraphrase-type-generation-etpc_bfloat16_a003a227aed5c1ad67cd4a653b13a0dd7acb7ed5_False,cluebbers/Llama-3.1-8B-paraphrase-type-generation-etpc,a003a227aed5c1ad67cd4a653b13a0dd7acb7ed5,bfloat16,chatmodels,Adapter,?,9.43002583868446,FALSE,IFEval,0.120851562742412,12.0851562742412,BBH,0.378081141522332,12.6945791177963,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.26510067114094,2.01342281879195,MUSR,0.431854166666667,12.0484375,MMLU-PRO,0.255568484042553,17.2853871158392,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-04,2024-11-15,1,cluebbers/Llama-3.1-8B-paraphrase-type-generation-etpc (Merge),apache-2.0,0,8.03,0.741527168067679 -cognitivecomputations/Dolphin3.0-Llama3.1-8B_float16_0bf45a981ba100596ee0c3e7d27e7849b0206632_True,cognitivecomputations/Dolphin3.0-Llama3.1-8B,0bf45a981ba100596ee0c3e7d27e7849b0206632,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.9677291381145,TRUE,IFEval,0.762122279994858,76.2122279994858,BBH,0.49163663539212,27.6317028058839,MATH Level 5,0.104984894259819,10.4984894259819,GPQA,0.282718120805369,4.36241610738255,MUSR,0.36534375,8.96796875,MMLU-PRO,0.299202127659575,22.1335697399527,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-29,2025-01-05,1,cognitivecomputations/Dolphin3.0-Llama3.1-8B (Merge),llama3.1,107,8.03,0.619325263299384 +cognitivecomputations/Dolphin3.0-Llama3.1-8B_float16_0bf45a981ba100596ee0c3e7d27e7849b0206632_True,cognitivecomputations/Dolphin3.0-Llama3.1-8B,0bf45a981ba100596ee0c3e7d27e7849b0206632,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.9677291381145,TRUE,IFEval,0.762122279994858,76.2122279994858,BBH,0.49163663539212,27.6317028058839,MATH Level 5,0.104984894259819,10.4984894259819,GPQA,0.282718120805369,4.36241610738255,MUSR,0.36534375,8.96796875,MMLU-PRO,0.299202127659575,22.1335697399527,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-29,2025-01-05,1,cognitivecomputations/Dolphin3.0-Llama3.1-8B (Merge),llama3.1,109,8.03,0.619325263299384 cognitivecomputations/dolphin-2.9-llama3-8b_bfloat16_5aeb036f9215c558b483a654a8c6e1cc22e841bf_True,cognitivecomputations/dolphin-2.9-llama3-8b,5aeb036f9215c558b483a654a8c6e1cc22e841bf,bfloat16,chatmodels,Original,LlamaForCausalLM,18.3902850051619,TRUE,IFEval,0.385033932188815,38.5033932188815,BBH,0.494992201666092,27.8589292609051,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.286912751677852,4.92170022371365,MUSR,0.43753125,13.79140625,MMLU-PRO,0.277094414893617,19.6771572104019,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-20,2024-06-12,1,meta-llama/Meta-Llama-3-8B,other,428,8.03,0.73912013993247 cognitivecomputations/dolphin-2.9.1-llama-3-70b_bfloat16_31adf616c3c9176d147e0a62e9fedb7bf97678ac_True,cognitivecomputations/dolphin-2.9.1-llama-3-70b,31adf616c3c9176d147e0a62e9fedb7bf97678ac,bfloat16,chatmodels,Original,LlamaForCausalLM,23.4447587222945,TRUE,IFEval,0.376016746676596,37.6016746676596,BBH,0.520491931282147,31.1011518725692,MATH Level 5,0.0566465256797583,5.66465256797583,GPQA,0.308724832214765,7.82997762863535,MUSR,0.4975625,23.6953125,MMLU-PRO,0.41298204787234,34.7757830969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-27,1,meta-llama/Meta-Llama-3-70B,llama3,40,70.554,12.1490880696042 cognitivecomputations/dolphin-2.9.1-yi-1.5-34b_bfloat16_1ec522298a6935c881df6dc29d3669833bd8672d_True,cognitivecomputations/dolphin-2.9.1-yi-1.5-34b,1ec522298a6935c881df6dc29d3669833bd8672d,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,27.9043843077483,TRUE,IFEval,0.385258890854045,38.5258890854045,BBH,0.607622560062686,44.1740887427727,MATH Level 5,0.16238670694864,16.238670694864,GPQA,0.343120805369128,12.4161073825503,MUSR,0.459791666666667,16.9739583333333,MMLU-PRO,0.451878324468085,39.097591607565,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-18,2024-07-27,1,01-ai/Yi-1.5-34B,apache-2.0,34,34.389,2.99265335000313 @@ -1599,7 +1602,7 @@ deepseek-ai/deepseek-llm-67b-chat_bfloat16_79648bef7658bb824e4630740f6e1484c1b06 deepseek-ai/deepseek-llm-7b-base_bfloat16_7683fea62db869066ddaff6a41d032262c490d4f_False,deepseek-ai/deepseek-llm-7b-base,7683fea62db869066ddaff6a41d032262c490d4f,bfloat16,pretrained,Original,LlamaForCausalLM,8.1389816171466,FALSE,IFEval,0.217871913190335,21.7871913190335,BBH,0.350303158292995,9.76792479590425,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.273489932885906,3.13199105145414,MUSR,0.37378125,3.75598958333333,MMLU-PRO,0.180601728723404,8.9557476359338,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-29,2024-06-12,0,deepseek-ai/deepseek-llm-7b-base,other,40,7,0.822535589447325 deepseek-ai/deepseek-llm-7b-chat_bfloat16_afbda8b347ec881666061fa67447046fc5164ec8_True,deepseek-ai/deepseek-llm-7b-chat,afbda8b347ec881666061fa67447046fc5164ec8,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7853925002332,TRUE,IFEval,0.417082230703423,41.7082230703422,BBH,0.363207976010867,11.2589493715017,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.265939597315436,2.12527964205817,MUSR,0.466770833333333,19.2130208333333,MMLU-PRO,0.213347739361702,12.5941932624113,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-29,2024-06-12,0,deepseek-ai/deepseek-llm-7b-chat,other,79,7,0.77448254761568 deepseek-ai/deepseek-moe-16b-base_bfloat16_521d2bc4fb69a3f3ae565310fcc3b65f97af2580_False,deepseek-ai/deepseek-moe-16b-base,521d2bc4fb69a3f3ae565310fcc3b65f97af2580,bfloat16,pretrained,Original,DeepseekForCausalLM,7.39080509075389,FALSE,IFEval,0.244974445582166,24.4974445582166,BBH,0.34094610552464,8.35555577938938,MATH Level 5,0.0196374622356496,1.96374622356496,GPQA,0.254194630872483,0.559284116331097,MUSR,0.36578125,3.35598958333333,MMLU-PRO,0.150515292553192,5.61281028368794,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-08,2024-06-12,0,deepseek-ai/deepseek-moe-16b-base,other,87,16.376,7.00246543090385 -deepseek-ai/deepseek-moe-16b-chat_bfloat16_eefd8ac7e8dc90e095129fe1a537d5e236b2e57c_True,deepseek-ai/deepseek-moe-16b-chat,eefd8ac7e8dc90e095129fe1a537d5e236b2e57c,bfloat16,chatmodels,Original,DeepseekForCausalLM,10.1773221729739,TRUE,IFEval,0.366299197241098,36.6299197241098,BBH,0.327495302644824,6.57374902689064,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.224832214765101,0,MUSR,0.380760416666667,5.26171875,MMLU-PRO,0.19639295212766,10.7103280141844,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-09,2024-06-12,0,deepseek-ai/deepseek-moe-16b-chat,other,117,16.376,4.59347807294513 +deepseek-ai/deepseek-moe-16b-chat_bfloat16_eefd8ac7e8dc90e095129fe1a537d5e236b2e57c_True,deepseek-ai/deepseek-moe-16b-chat,eefd8ac7e8dc90e095129fe1a537d5e236b2e57c,bfloat16,chatmodels,Original,DeepseekForCausalLM,10.1773221729739,TRUE,IFEval,0.366299197241098,36.6299197241098,BBH,0.327495302644824,6.57374902689064,MATH Level 5,0.0188821752265861,1.88821752265861,GPQA,0.224832214765101,0,MUSR,0.380760416666667,5.26171875,MMLU-PRO,0.19639295212766,10.7103280141844,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-09,2024-06-12,0,deepseek-ai/deepseek-moe-16b-chat,other,118,16.376,4.59347807294513 dfurman/CalmeRys-78B-Orpo-v0.1_bfloat16_7988deb48419c3f56bb24c139c23e5c476ec03f8_True,dfurman/CalmeRys-78B-Orpo-v0.1,7988deb48419c3f56bb24c139c23e5c476ec03f8,bfloat16,chatmodels,Original,Qwen2ForCausalLM,51.2439111928447,TRUE,IFEval,0.816327344778521,81.6327344778521,BBH,0.726228279224993,61.9247637925916,MATH Level 5,0.407099697885196,40.7099697885197,GPQA,0.400167785234899,20.0223713646532,MUSR,0.590177083333333,36.3721354166667,MMLU-PRO,0.701213430851064,66.8014923167849,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-24,2024-09-24,1,dfurman/CalmeRys-78B-Orpo-v0.1 (Merge),mit,64,77.965,12.9967673780368 dfurman/Llama-3-70B-Orpo-v0.1_float16_6bf3be5f7f427164c879f7a4ec9ccb6b22aa6631_True,dfurman/Llama-3-70B-Orpo-v0.1,6bf3be5f7f427164c879f7a4ec9ccb6b22aa6631,float16,chatmodels,Adapter,?,18.1741803011836,TRUE,IFEval,0.204907423414318,20.4907423414319,BBH,0.465523763470155,24.0938165463604,MATH Level 5,0.150302114803625,15.0302114803625,GPQA,0.25755033557047,1.00671140939597,MUSR,0.4534375,16.2796875,MMLU-PRO,0.389295212765957,32.1439125295508,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-26,2024-08-30,1,dfurman/Llama-3-70B-Orpo-v0.1 (Merge),llama3,2,70.554,14.4403427170369 dfurman/Llama-3-8B-Orpo-v0.1_float16_f02aef830e12a50892ac065826d5eb3dfc7675d1_True,dfurman/Llama-3-8B-Orpo-v0.1,f02aef830e12a50892ac065826d5eb3dfc7675d1,float16,chatmodels,Adapter,?,10.7560111427627,TRUE,IFEval,0.283517732948576,28.3517732948576,BBH,0.384242091989804,13.6807457474698,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.260906040268456,1.45413870246085,MUSR,0.356635416666667,2.24609375,MMLU-PRO,0.229803856382979,14.4226507092199,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-26,2024-08-30,1,dfurman/Llama-3-8B-Orpo-v0.1 (Merge),llama3,1,8.03,0.928079390858446 @@ -1743,17 +1746,17 @@ google/gemma-2-27b_bfloat16_938270f5272feb02779b55c2bb2fffdd0f53ff0c_False,googl google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,495,27.227,4.82621118669274 google/gemma-2-2b_bfloat16_4d05c88d00441bf62bf87dcfd29e204c05089f36_True,google/gemma-2-2b,4d05c88d00441bf62bf87dcfd29e204c05089f36,bfloat16,pretrained,Original,InternLM2ForCausalLM,10.1294631550552,TRUE,IFEval,0.199312269223438,19.9312269223438,BBH,0.365596699642259,11.7558075322361,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.26258389261745,1.67785234899329,MUSR,0.423177083333333,11.43046875,MMLU-PRO,0.218001994680851,13.1113327423168,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,0,google/gemma-2-2b,gemma,476,2.614,1.51879572271398 google/gemma-2-2b_float16_0738188b3055bc98daf0fe7211f0091357e5b979_False,google/gemma-2-2b,0738188b3055bc98daf0fe7211f0091357e5b979,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,10.3344393348315,FALSE,IFEval,0.201760218442621,20.1760218442621,BBH,0.370867461247026,12.4973062285736,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.26258389261745,1.67785234899329,MUSR,0.421875,11.2677083333333,MMLU-PRO,0.221658909574468,13.5176566193853,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-04,0,google/gemma-2-2b,gemma,476,2.614,1.41825735113158 -google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,860,2.614,1.23474327420585 +google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,862,2.614,1.23474327420585 google/gemma-2-2b-jpn-it_float16_6b046bbc091084a1ec89fe03e58871fde10868eb_False,google/gemma-2-2b-jpn-it,6b046bbc091084a1ec89fe03e58871fde10868eb,float16,pretrained,Original,Gemma2ForCausalLM,17.1154057059385,FALSE,IFEval,0.507782683280363,50.7782683280363,BBH,0.422556989006581,18.5256264498327,MATH Level 5,0.0347432024169184,3.47432024169184,GPQA,0.285234899328859,4.6979865771812,MUSR,0.396385416666667,7.68151041666667,MMLU-PRO,0.2578125,17.5347222222222,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-25,2024-10-11,2,google/gemma-2-2b,gemma,151,2.614,1.01143721051409 google/gemma-2-2b-jpn-it_bfloat16_6b046bbc091084a1ec89fe03e58871fde10868eb_True,google/gemma-2-2b-jpn-it,6b046bbc091084a1ec89fe03e58871fde10868eb,bfloat16,chatmodels,Original,Gemma2ForCausalLM,15.8855787074056,TRUE,IFEval,0.528840144150853,52.8840144150853,BBH,0.417844022621712,17.848086390818,MATH Level 5,0,0,GPQA,0.275167785234899,3.35570469798658,MUSR,0.372760416666667,4.92838541666667,MMLU-PRO,0.246675531914894,16.2972813238771,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-25,2024-10-14,2,google/gemma-2-2b,gemma,151,2.614,0.854400249040011 google/gemma-2-9b_bfloat16_beb0c08e9eeb0548f3aca2ac870792825c357b7d_False,google/gemma-2-9b,beb0c08e9eeb0548f3aca2ac870792825c357b7d,bfloat16,pretrained,Original,Gemma2ForCausalLM,21.1549343088298,FALSE,IFEval,0.203983208996574,20.3983208996574,BBH,0.537737339762188,34.0968185358978,MATH Level 5,0.131419939577039,13.1419939577039,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446114583333333,14.29765625,MMLU-PRO,0.410322473404255,34.480274822695,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,0,google/gemma-2-9b,gemma,627,9,5.6631856917904 -google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,616,9,5.01449702077493 +google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,617,9,5.01449702077493 google/gemma-2b_bfloat16_2ac59a5d7bf4e1425010f0d457dde7d146658953_False,google/gemma-2b,2ac59a5d7bf4e1425010f0d457dde7d146658953,bfloat16,pretrained,Original,GemmaForCausalLM,7.35870138352179,FALSE,IFEval,0.203758250331343,20.3758250331343,BBH,0.338099397582924,8.46671286484037,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.25503355704698,0.671140939597318,MUSR,0.39778125,7.55598958333334,MMLU-PRO,0.136552526595745,4.06139184397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b,gemma,941,2.506,1.23625082450337 -google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,692,2.506,0.352950331047759 -google/gemma-7b_bfloat16_a0eac5b80dba224e6ed79d306df50b1e92c2125d_False,google/gemma-7b,a0eac5b80dba224e6ed79d306df50b1e92c2125d,bfloat16,pretrained,Original,GemmaForCausalLM,15.45540668709,FALSE,IFEval,0.265932171083835,26.5932171083835,BBH,0.436152852392864,21.1160993232917,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.286912751677852,4.92170022371365,MUSR,0.406239583333333,10.9799479166667,MMLU-PRO,0.294797207446809,21.6441341607565,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-08,0,google/gemma-7b,gemma,3088,8.538,1.25491405781993 +google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,693,2.506,0.352950331047759 +google/gemma-7b_bfloat16_a0eac5b80dba224e6ed79d306df50b1e92c2125d_False,google/gemma-7b,a0eac5b80dba224e6ed79d306df50b1e92c2125d,bfloat16,pretrained,Original,GemmaForCausalLM,15.45540668709,FALSE,IFEval,0.265932171083835,26.5932171083835,BBH,0.436152852392864,21.1160993232917,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.286912751677852,4.92170022371365,MUSR,0.406239583333333,10.9799479166667,MMLU-PRO,0.294797207446809,21.6441341607565,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-08,0,google/gemma-7b,gemma,3090,8.538,1.25491405781993 google/gemma-7b-it_bfloat16_18329f019fb74ca4b24f97371785268543d687d2_True,google/gemma-7b-it,18329f019fb74ca4b24f97371785268543d687d2,bfloat16,chatmodels,Original,GemmaForCausalLM,12.8681419014102,TRUE,IFEval,0.386832493339894,38.6832493339894,BBH,0.364558292227017,11.8800913445494,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.284395973154362,4.58612975391499,MUSR,0.427427083333333,12.5283854166667,MMLU-PRO,0.169464760638298,7.71830673758865,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-13,2024-06-12,1,google/gemma-7b,gemma,1148,8.538,1.0999544452693 google/mt5-base_float16_2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f_False,google/mt5-base,2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,3.56528212264935,FALSE,IFEval,0.164515707212419,16.4515707212419,BBH,0.288316002284888,1.29855138817669,MATH Level 5,0,0,GPQA,0.239093959731544,0,MUSR,0.367208333333333,2.86770833333333,MMLU-PRO,0.106964760638298,0.773862293144208,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-base,apache-2.0,207,0.39,0.200039818164465 -google/mt5-small_float16_73fb5dbe4756edadc8fbe8c769b0a109493acf7a_False,google/mt5-small,73fb5dbe4756edadc8fbe8c769b0a109493acf7a,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,4.25592817327735,FALSE,IFEval,0.171809687185557,17.1809687185557,BBH,0.276584202992908,1.07097147950089,MATH Level 5,0,0,GPQA,0.24244966442953,0,MUSR,0.38575,5.91875,MMLU-PRO,0.112283909574468,1.36487884160756,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-small,apache-2.0,118,0.17,0.180493674360773 +google/mt5-small_float16_73fb5dbe4756edadc8fbe8c769b0a109493acf7a_False,google/mt5-small,73fb5dbe4756edadc8fbe8c769b0a109493acf7a,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,4.25592817327735,FALSE,IFEval,0.171809687185557,17.1809687185557,BBH,0.276584202992908,1.07097147950089,MATH Level 5,0,0,GPQA,0.24244966442953,0,MUSR,0.38575,5.91875,MMLU-PRO,0.112283909574468,1.36487884160756,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-small,apache-2.0,119,0.17,0.180493674360773 google/mt5-xl_float16_63fc6450d80515b48e026b69ef2fbbd426433e84_False,google/mt5-xl,63fc6450d80515b48e026b69ef2fbbd426433e84,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,5.19142015303163,FALSE,IFEval,0.195964485343333,19.5964485343333,BBH,0.304735837080435,3.2824619143354,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.379520833333333,5.04010416666667,MMLU-PRO,0.111951462765957,1.32794030732861,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-xl,apache-2.0,23,3.23,0.903767224577182 google/mt5-xxl_float16_e07c395916dfbc315d4e5e48b4a54a1e8821b5c0_False,google/mt5-xxl,e07c395916dfbc315d4e5e48b4a54a1e8821b5c0,float16,fine-tunedondomain-specificdatasets,Original,T5ForConditionalGeneration,5.10307678308611,FALSE,IFEval,0.23575668116154,23.575668116154,BBH,0.295934415911691,2.50471080044775,MATH Level 5,0,0,GPQA,0.241610738255034,0,MUSR,0.368947916666667,3.55182291666667,MMLU-PRO,0.108876329787234,0.986258865248226,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-xxl,apache-2.0,68,11.9,2.28193850262229 google/recurrentgemma-2b_bfloat16_195f13c55b371fc721eda0662c00c64642c70e17_False,google/recurrentgemma-2b,195f13c55b371fc721eda0662c00c64642c70e17,bfloat16,pretrained,Original,RecurrentGemmaForCausalLM,6.95218641290216,FALSE,IFEval,0.301702815197011,30.1702815197011,BBH,0.319735828300845,4.82036223103474,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.245805369127517,0,MUSR,0.344572916666667,3.10494791666667,MMLU-PRO,0.117603058510638,1.95589539007092,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-06,2024-06-13,0,google/recurrentgemma-2b,gemma,91,2.683,3.69265287156138 @@ -1763,8 +1766,8 @@ google/recurrentgemma-9b-it_bfloat16_43e62f98c3d496a5469ef4b18c1b11e417d68d1d_Tr google/switch-base-8_float16_92fe2d22b024d9937146fe097ba3d3a7ba146e1b_False,google/switch-base-8,92fe2d22b024d9937146fe097ba3d3a7ba146e1b,float16,fine-tunedondomain-specificdatasets,Original,SwitchTransformersForConditionalGeneration,3.29595026839661,FALSE,IFEval,0.158520503375488,15.8520503375488,BBH,0.287631327306693,1.70247810498213,MATH Level 5,0,0,GPQA,0.25,0,MUSR,0.351739583333333,1.13333333333333,MMLU-PRO,0.109790558510638,1.08783983451537,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-24,2024-09-06,0,google/switch-base-8,apache-2.0,16,0.62,0.146702933877402 google/umt5-base_float16_0de9394d54f8975e71838d309de1cb496c894ab9_False,google/umt5-base,0de9394d54f8975e71838d309de1cb496c894ab9,float16,fine-tunedondomain-specificdatasets,Original,UMT5ForConditionalGeneration,3.44104602550114,FALSE,IFEval,0.174632198123202,17.4632198123202,BBH,0.278772623289455,0.813553178847296,MATH Level 5,0,0,GPQA,0.254194630872483,0.559284116331097,MUSR,0.33821875,0.944010416666666,MMLU-PRO,0.107795877659574,0.866208628841606,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-02,2024-09-06,0,google/umt5-base,apache-2.0,13,-1,0.668046044558199 goulue5/merging_LLM_float16_587115b34d72ef957fee2d8348b3ade3ae06d4a8_False,goulue5/merging_LLM,587115b34d72ef957fee2d8348b3ade3ae06d4a8,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,16.4099852745745,FALSE,IFEval,0.323260061082373,32.3260061082373,BBH,0.42164986115901,18.282830291312,MATH Level 5,0.0785498489425982,7.85498489425982,GPQA,0.291107382550336,5.48098434004475,MUSR,0.43328125,12.76015625,MMLU-PRO,0.29579454787234,21.7549497635934,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-22,0,goulue5/merging_LLM,"",0,1.544,0.551465090928402 -gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.39102973137443,FALSE,IFEval,0.193416800755329,19.3416800755329,BBH,0.303638540151673,2.71429784738774,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26006711409396,1.34228187919463,MUSR,0.432416666666667,12.9854166666667,MMLU-PRO,0.114943484042553,1.66038711583924,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2495,0.137,0.323928012416449 -gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,5.97773692810457,FALSE,IFEval,0.0833333333333333,8.33333333333333,BBH,0.308333333333333,9.19975490196079,MATH Level 5,0,0,GPQA,0.233333333333333,0,MUSR,0.433333333333333,18.3333333333333,MMLU-PRO,0.1,0,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2495,0.137,0.0392451730685468 +gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.39102973137443,FALSE,IFEval,0.193416800755329,19.3416800755329,BBH,0.303638540151673,2.71429784738774,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26006711409396,1.34228187919463,MUSR,0.432416666666667,12.9854166666667,MMLU-PRO,0.114943484042553,1.66038711583924,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2497,0.137,0.323928012416449 +gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,5.97773692810457,FALSE,IFEval,0.0833333333333333,8.33333333333333,BBH,0.308333333333333,9.19975490196079,MATH Level 5,0,0,GPQA,0.233333333333333,0,MUSR,0.433333333333333,18.3333333333333,MMLU-PRO,0.1,0,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2497,0.137,0.0392451730685468 gradientai/Llama-3-8B-Instruct-Gradient-1048k_bfloat16_8697fb25cb77c852311e03b4464b8467471d56a4_True,gradientai/Llama-3-8B-Instruct-Gradient-1048k,8697fb25cb77c852311e03b4464b8467471d56a4,bfloat16,chatmodels,Original,LlamaForCausalLM,18.2455696265917,TRUE,IFEval,0.44555889484346,44.555889484346,BBH,0.434590310706957,21.0105289871587,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.277684563758389,3.69127516778523,MUSR,0.42975,13.51875,MMLU-PRO,0.29404920212766,21.5610224586288,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-29,2024-06-12,0,gradientai/Llama-3-8B-Instruct-Gradient-1048k,llama3,680,8.03,0.887164486766284 grimjim/Gigantes-v1-gemma2-9b-it_bfloat16_f912b7cf7f07a593d0a4262f9f20a7adb0a93f9d_False,grimjim/Gigantes-v1-gemma2-9b-it,f912b7cf7f07a593d0a4262f9f20a7adb0a93f9d,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,30.707216841069,FALSE,IFEval,0.692454908531585,69.2454908531585,BBH,0.597792552822268,42.7978769655041,MATH Level 5,0.0626888217522659,6.26888217522659,GPQA,0.353187919463087,13.758389261745,MUSR,0.455479166666667,16.3348958333333,MMLU-PRO,0.422539893617021,35.8377659574468,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-28,2024-12-28,1,grimjim/Gigantes-v1-gemma2-9b-it (Merge),gemma,1,9.242,1.49782432731621 grimjim/Gigantes-v2-gemma2-9b-it_bfloat16_5c410fbc679de69de48b25d18bb7e374f4a3471f_False,grimjim/Gigantes-v2-gemma2-9b-it,5c410fbc679de69de48b25d18bb7e374f4a3471f,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.3088099444497,FALSE,IFEval,0.735069615287437,73.5069615287437,BBH,0.5986559388304,42.701632598503,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.351510067114094,13.5346756152125,MUSR,0.459479166666667,17.1348958333333,MMLU-PRO,0.425947473404255,36.2163859338062,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-29,2024-12-29,1,grimjim/Gigantes-v2-gemma2-9b-it (Merge),gemma,0,9.242,1.51886584161689 @@ -1852,11 +1855,11 @@ ibm-granite/granite-3.0-8b-instruct_bfloat16_e0a466fb25b9e07e9c2dc93380a36018970 ibm-granite/granite-3.1-1b-a400m-base_bfloat16_6bbcb9db44432d0a5d4cf13cdc082324b7ee9e7b_False,ibm-granite/granite-3.1-1b-a400m-base,6bbcb9db44432d0a5d4cf13cdc082324b7ee9e7b,bfloat16,pretrained,Original,GraniteMoeForCausalLM,6.22427469055773,FALSE,IFEval,0.251943731521253,25.1943731521253,BBH,0.329869954650672,6.42984500540235,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.251677852348993,0.223713646532442,MUSR,0.3500625,1.7578125,MMLU-PRO,0.113946143617021,1.54957151300236,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-1b-a400m-base,apache-2.0,3,1.335,1.12341183736504 ibm-granite/granite-3.1-1b-a400m-instruct_float16_c4f8e0dd19f0ce00bca6c9742751d1827e8fa03a_True,ibm-granite/granite-3.1-1b-a400m-instruct,c4f8e0dd19f0ce00bca6c9742751d1827e8fa03a,float16,chatmodels,Original,GraniteMoeForCausalLM,10.0517271754769,TRUE,IFEval,0.46863987553026,46.863987553026,BBH,0.327983438537518,6.17818321590479,MATH Level 5,0.040785498489426,4.0785498489426,GPQA,0.23993288590604,0,MUSR,0.33025,0.78125,MMLU-PRO,0.121675531914894,2.40839243498818,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-1b-a400m-instruct (Merge),apache-2.0,10,1.335,1.04808410688418 ibm-granite/granite-3.1-2b-base_bfloat16_31f1cf9bd26ca0c69bfaf86824ee6dc4268b8b73_False,ibm-granite/granite-3.1-2b-base,31f1cf9bd26ca0c69bfaf86824ee6dc4268b8b73,bfloat16,pretrained,Original,GraniteForCausalLM,13.1902381427805,FALSE,IFEval,0.352161154625283,35.2161154625283,BBH,0.404718802891887,16.8436898468885,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.277684563758389,3.69127516778523,MUSR,0.348572916666667,3.90494791666667,MMLU-PRO,0.225066489361702,13.8962765957447,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-2b-base,apache-2.0,6,2.534,0.494221356581282 -ibm-granite/granite-3.1-2b-instruct_float16_8f683a244be9034aeea43dd2a80b7b4fe01d376f_True,ibm-granite/granite-3.1-2b-instruct,8f683a244be9034aeea43dd2a80b7b4fe01d376f,float16,chatmodels,Original,GraniteForCausalLM,21.0576307475066,TRUE,IFEval,0.628557782240012,62.8557782240012,BBH,0.440898585580565,21.8229561407945,MATH Level 5,0.113293051359517,11.3293051359517,GPQA,0.289429530201342,5.2572706935123,MUSR,0.360541666666667,4.86770833333334,MMLU-PRO,0.281914893617021,20.2127659574468,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-2b-instruct (Merge),apache-2.0,20,2.534,0.505641903795969 -ibm-granite/granite-3.1-3b-a800m-base_bfloat16_e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3_False,ibm-granite/granite-3.1-3b-a800m-base,e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3,bfloat16,pretrained,Original,GraniteMoeForCausalLM,9.91293476951527,FALSE,IFEval,0.29962942769629,29.962942769629,BBH,0.362822992347764,11.9056051994898,MATH Level 5,0.0400302114803625,4.00302114803625,GPQA,0.277684563758389,3.69127516778523,MUSR,0.327520833333333,1.10677083333333,MMLU-PRO,0.179271941489362,8.80799349881797,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-3b-a800m-base,apache-2.0,3,3.299,1.62281050352824 -ibm-granite/granite-3.1-3b-a800m-instruct_float16_503b5f483d33443ba85a876d3c25f8b85779c9cc_True,ibm-granite/granite-3.1-3b-a800m-instruct,503b5f483d33443ba85a876d3c25f8b85779c9cc,float16,chatmodels,Original,GraniteMoeForCausalLM,17.1014424266068,TRUE,IFEval,0.551646298488012,55.1646298488012,BBH,0.400949452194719,16.6872363666604,MATH Level 5,0.103474320241692,10.3474320241692,GPQA,0.288590604026846,5.14541387024609,MUSR,0.348635416666667,2.51276041666667,MMLU-PRO,0.214760638297872,12.7511820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-3b-a800m-instruct (Merge),apache-2.0,16,3.299,1.63636360410558 +ibm-granite/granite-3.1-2b-instruct_float16_8f683a244be9034aeea43dd2a80b7b4fe01d376f_True,ibm-granite/granite-3.1-2b-instruct,8f683a244be9034aeea43dd2a80b7b4fe01d376f,float16,chatmodels,Original,GraniteForCausalLM,21.0576307475066,TRUE,IFEval,0.628557782240012,62.8557782240012,BBH,0.440898585580565,21.8229561407945,MATH Level 5,0.113293051359517,11.3293051359517,GPQA,0.289429530201342,5.2572706935123,MUSR,0.360541666666667,4.86770833333334,MMLU-PRO,0.281914893617021,20.2127659574468,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-2b-instruct (Merge),apache-2.0,21,2.534,0.505641903795969 +ibm-granite/granite-3.1-3b-a800m-base_bfloat16_e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3_False,ibm-granite/granite-3.1-3b-a800m-base,e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3,bfloat16,pretrained,Original,GraniteMoeForCausalLM,9.91293476951527,FALSE,IFEval,0.29962942769629,29.962942769629,BBH,0.362822992347764,11.9056051994898,MATH Level 5,0.0400302114803625,4.00302114803625,GPQA,0.277684563758389,3.69127516778523,MUSR,0.327520833333333,1.10677083333333,MMLU-PRO,0.179271941489362,8.80799349881797,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-3b-a800m-base,apache-2.0,4,3.299,1.62281050352824 +ibm-granite/granite-3.1-3b-a800m-instruct_float16_503b5f483d33443ba85a876d3c25f8b85779c9cc_True,ibm-granite/granite-3.1-3b-a800m-instruct,503b5f483d33443ba85a876d3c25f8b85779c9cc,float16,chatmodels,Original,GraniteMoeForCausalLM,17.1014424266068,TRUE,IFEval,0.551646298488012,55.1646298488012,BBH,0.400949452194719,16.6872363666604,MATH Level 5,0.103474320241692,10.3474320241692,GPQA,0.288590604026846,5.14541387024609,MUSR,0.348635416666667,2.51276041666667,MMLU-PRO,0.214760638297872,12.7511820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-3b-a800m-instruct (Merge),apache-2.0,17,3.299,1.63636360410558 ibm-granite/granite-3.1-8b-base_float16_174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4_False,ibm-granite/granite-3.1-8b-base,174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4,float16,pretrained,Original,GraniteForCausalLM,20.0697880358223,FALSE,IFEval,0.422103352438197,42.2103352438197,BBH,0.477695667711164,26.0195886710118,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.321308724832215,9.50782997762864,MUSR,0.392229166666667,8.36197916666667,MMLU-PRO,0.323221409574468,24.8023788416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-8b-base,apache-2.0,15,8.171,0.598692557378878 -ibm-granite/granite-3.1-8b-instruct_float16_f6749f3946b2dc9983b870317a71ddf7a65c0806_True,ibm-granite/granite-3.1-8b-instruct,f6749f3946b2dc9983b870317a71ddf7a65c0806,float16,chatmodels,Original,GraniteForCausalLM,30.5526905408918,TRUE,IFEval,0.720756481690803,72.0756481690803,BBH,0.536446043381602,34.0896552994141,MATH Level 5,0.216767371601208,21.6767371601209,GPQA,0.312080536912752,8.27740492170022,MUSR,0.470708333333333,19.0052083333333,MMLU-PRO,0.353723404255319,28.1914893617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-8b-instruct (Merge),apache-2.0,120,8.171,0.61783334381855 +ibm-granite/granite-3.1-8b-instruct_float16_f6749f3946b2dc9983b870317a71ddf7a65c0806_True,ibm-granite/granite-3.1-8b-instruct,f6749f3946b2dc9983b870317a71ddf7a65c0806,float16,chatmodels,Original,GraniteForCausalLM,30.5526905408918,TRUE,IFEval,0.720756481690803,72.0756481690803,BBH,0.536446043381602,34.0896552994141,MATH Level 5,0.216767371601208,21.6767371601209,GPQA,0.312080536912752,8.27740492170022,MUSR,0.470708333333333,19.0052083333333,MMLU-PRO,0.353723404255319,28.1914893617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-8b-instruct (Merge),apache-2.0,121,8.171,0.61783334381855 ibm-granite/granite-7b-base_bfloat16_23fcb4cb5b69f8a122fb944491e9f1ad664ba37b_False,ibm-granite/granite-7b-base,23fcb4cb5b69f8a122fb944491e9f1ad664ba37b,bfloat16,pretrained,Original,LlamaForCausalLM,7.75764452802273,FALSE,IFEval,0.241427190964419,24.1427190964419,BBH,0.348043727161062,9.0508000028991,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.245805369127517,0,MUSR,0.355489583333333,3.40286458333333,MMLU-PRO,0.183427526595745,9.26972517730496,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-19,2024-06-12,0,ibm-granite/granite-7b-base,apache-2.0,27,6.738,0.652623838561169 ibm-granite/granite-7b-instruct_bfloat16_c6d1adfa5cdba2c8344e055bb7de87b7935250a8_True,ibm-granite/granite-7b-instruct,c6d1adfa5cdba2c8344e055bb7de87b7935250a8,bfloat16,chatmodels,Original,LlamaForCausalLM,11.8083734516443,TRUE,IFEval,0.297231346161518,29.7231346161518,BBH,0.372295296032695,12.6393287024653,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.285234899328859,4.6979865771812,MUSR,0.402,8.81666666666667,MMLU-PRO,0.228640292553192,14.2933658392435,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-19,2024-10-02,1,ibm/granite-7b-base,apache-2.0,6,6.738,0.711451918965055 icefog72/Ice0.15-02.10-RP_bfloat16_ab67a8b63836ec7c8e6729d79d9dfd2708b20eb3_False,icefog72/Ice0.15-02.10-RP,ab67a8b63836ec7c8e6729d79d9dfd2708b20eb3,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.4913274610034,FALSE,IFEval,0.534335562972912,53.4335562972912,BBH,0.49763847361884,30.1301040710686,MATH Level 5,0.0574018126888218,5.74018126888218,GPQA,0.277684563758389,3.69127516778523,MUSR,0.431979166666667,12.9973958333333,MMLU-PRO,0.306599069148936,22.9554521276596,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-02,2024-10-02,0,icefog72/Ice0.15-02.10-RP,cc-by-nc-4.0,7,7.242,0.592822160421274 @@ -1890,7 +1893,7 @@ icefog72/IceSakeV6RP-7b_float16_6838e68d35d037b0ef9b04a9de1ebc8ab508cd45_False,i icefog72/IceSakeV8RP-7b_float16_0f8f73fe356583e561479c689aa6597435327f4e_True,icefog72/IceSakeV8RP-7b,0f8f73fe356583e561479c689aa6597435327f4e,float16,basemergesandmoerges,Original,MistralForCausalLM,21.7650153990159,TRUE,IFEval,0.608574138840499,60.8574138840499,BBH,0.488471413379602,28.9662582332666,MATH Level 5,0.0641993957703928,6.41993957703928,GPQA,0.276006711409396,3.4675615212528,MUSR,0.399270833333333,8.5421875,MMLU-PRO,0.301030585106383,22.336731678487,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-26,2024-06-26,0,icefog72/IceSakeV8RP-7b,cc-by-nc-4.0,1,7.242,0.648285409734146 icefog72/IceTea21EnergyDrinkRPV13-DPOv3_bfloat16_2d4b4fd596ff0f6706a5752198e59da6ffc08067_False,icefog72/IceTea21EnergyDrinkRPV13-DPOv3,2d4b4fd596ff0f6706a5752198e59da6ffc08067,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.6842587279325,FALSE,IFEval,0.52634232724726,52.634232724726,BBH,0.501958758423263,30.6127340167025,MATH Level 5,0.0589123867069487,5.89123867069487,GPQA,0.283557046979866,4.47427293064877,MUSR,0.4371875,13.6484375,MMLU-PRO,0.305601728723404,22.8446365248227,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-05,2024-09-06,1,icefog72/IceTea21EnergyDrinkRPV13-DPOv3 (Merge),"",2,7.242,0.57994204720106 icefog72/IceTea21EnergyDrinkRPV13-DPOv3.5_bfloat16_0b0b0864347c3fad2b4d3e102f2f9839d20e296c_False,icefog72/IceTea21EnergyDrinkRPV13-DPOv3.5,0b0b0864347c3fad2b4d3e102f2f9839d20e296c,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,17.3087994924629,FALSE,IFEval,0.487099784128335,48.7099784128335,BBH,0.439966001310903,22.5732257792367,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.284395973154362,4.58612975391499,MUSR,0.396416666666667,7.78541666666667,MMLU-PRO,0.249833776595745,16.6481973995272,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-25,0,Removed,"",0,7.242,0.500728699428476 -ifable/gemma-2-Ifable-9B_bfloat16_d3dbde4efb93ea0a4f247de82541479de6b03160_False,ifable/gemma-2-Ifable-9B,d3dbde4efb93ea0a4f247de82541479de6b03160,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,22.8886905557519,FALSE,IFEval,0.29842927875814,29.842927875814,BBH,0.586611555669324,41.0326446462653,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.341442953020134,12.1923937360179,MUSR,0.40525,8.52291666666667,MMLU-PRO,0.422623005319149,35.8470005910166,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-10,2024-09-25,0,ifable/gemma-2-Ifable-9B,gemma,45,9.242,4.31760442146203 +ifable/gemma-2-Ifable-9B_bfloat16_d3dbde4efb93ea0a4f247de82541479de6b03160_False,ifable/gemma-2-Ifable-9B,d3dbde4efb93ea0a4f247de82541479de6b03160,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,22.8886905557519,FALSE,IFEval,0.29842927875814,29.842927875814,BBH,0.586611555669324,41.0326446462653,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.341442953020134,12.1923937360179,MUSR,0.40525,8.52291666666667,MMLU-PRO,0.422623005319149,35.8470005910166,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-10,2024-09-25,0,ifable/gemma-2-Ifable-9B,gemma,46,9.242,4.31760442146203 inflatebot/MN-12B-Mag-Mell-R1_bfloat16_170cea841f08b4dc047363cb71e903fc34c3258d_False,inflatebot/MN-12B-Mag-Mell-R1,170cea841f08b4dc047363cb71e903fc34c3258d,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.5677702399141,FALSE,IFEval,0.461296027872711,46.1296027872711,BBH,0.530385497543498,32.5358328330796,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.316275167785235,8.83668903803132,MUSR,0.400229166666667,11.2953125,MMLU-PRO,0.343833111702128,27.0925679669031,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-16,2025-01-04,1,inflatebot/MN-12B-Mag-Mell-R1 (Merge),"",86,12.248,1.11755563267615 informatiker/Qwen2-7B-Instruct-abliterated_bfloat16_7577d60acfe4544d5ab303f0a4d69a9fcb9cf1aa_True,informatiker/Qwen2-7B-Instruct-abliterated,7577d60acfe4544d5ab303f0a4d69a9fcb9cf1aa,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,25.1216036134891,TRUE,IFEval,0.582170862201182,58.2170862201182,BBH,0.553426551593674,37.7957234413659,MATH Level 5,0.0913897280966767,9.13897280966767,GPQA,0.301174496644295,6.82326621923937,MUSR,0.388791666666667,6.83229166666667,MMLU-PRO,0.387300531914894,31.9222813238771,FALSE,FALSE,FALSE,FALSE,FALSE,2024-07-10,2024-09-15,0,informatiker/Qwen2-7B-Instruct-abliterated,"",6,7.616,1.06060504568381 instruction-pretrain/InstructLM-500M_float16_e9d33823c76303dfaff6a8397a8b70d0118ea350_False,instruction-pretrain/InstructLM-500M,e9d33823c76303dfaff6a8397a8b70d0118ea350,float16,pretrained,Original,MistralForCausalLM,2.85435031976667,FALSE,IFEval,0.1027662158628,10.27662158628,BBH,0.294087178725297,2.31705371604848,MATH Level 5,0,0,GPQA,0.256711409395973,0.894854586129753,MUSR,0.352822916666667,2.06953125,MMLU-PRO,0.114112367021277,1.56804078014184,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-18,2024-06-27,0,instruction-pretrain/InstructLM-500M,apache-2.0,34,0.5,0.245792145066826 @@ -2081,11 +2084,11 @@ lalainy/ECE-PRYMMAL-YL-6B-SLERP-V2_bfloat16_18d282d0206ae8f878a9cfa80ce4eaf04205 langgptai/Qwen-las-v0.1_bfloat16_a7a4d4945d28bac955554c9abd2f74a71ebbf22f_True,langgptai/Qwen-las-v0.1,a7a4d4945d28bac955554c9abd2f74a71ebbf22f,bfloat16,chatmodels,Adapter,?,11.3940042774707,TRUE,IFEval,0.33010412372505,33.010412372505,BBH,0.389255256299562,14.6986398981074,MATH Level 5,0.0226586102719033,2.26586102719033,GPQA,0.246644295302013,0,MUSR,0.37009375,3.66171875,MMLU-PRO,0.232546542553192,14.7273936170213,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-26,2024-06-27,1,Qwen/Qwen1.5-4B-Chat,other,0,7.901,1.79809641527475 langgptai/qwen1.5-7b-chat-sa-v0.1_bfloat16_5f4f5e69ac7f1d508f8369e977de208b4803444b_True,langgptai/qwen1.5-7b-chat-sa-v0.1,5f4f5e69ac7f1d508f8369e977de208b4803444b,bfloat16,chatmodels,Adapter,?,16.5801707526462,TRUE,IFEval,0.426774292211333,42.6774292211333,BBH,0.432526799287866,20.3023421299341,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.312080536912752,8.27740492170022,MUSR,0.355145833333333,3.05989583333333,MMLU-PRO,0.299285239361702,22.1428043735225,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-30,2024-06-27,1,Qwen/Qwen1.5-7B-Chat,other,0,15.443,1.46432108342615 leafspark/Llama-3.1-8B-MultiReflection-Instruct_float16_b748441154efdbd7690d773b0194197bfc136ed0_True,leafspark/Llama-3.1-8B-MultiReflection-Instruct,b748441154efdbd7690d773b0194197bfc136ed0,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,26.3118813526605,TRUE,IFEval,0.71253828729992,71.253828729992,BBH,0.500908826149571,28.4480450371186,MATH Level 5,0.136706948640483,13.6706948640483,GPQA,0.292785234899329,5.70469798657718,MUSR,0.368197916666667,8.52473958333334,MMLU-PRO,0.372423537234043,30.2692819148936,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-15,2024-09-15,1,leafspark/Llama-3.1-8B-MultiReflection-Instruct (Merge),llama3.1,5,8.03,0.848446832752584 -lemon07r/Gemma-2-Ataraxy-9B_bfloat16_fb22193268c7a6c3b4598255999ce2de3af8c256_False,lemon07r/Gemma-2-Ataraxy-9B,fb22193268c7a6c3b4598255999ce2de3af8c256,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,22.4652844939409,FALSE,IFEval,0.300877227977322,30.0877227977322,BBH,0.593129841772577,42.0319905289865,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.334731543624161,11.2975391498881,MUSR,0.442427083333333,14.4700520833333,MMLU-PRO,0.422623005319149,35.8470005910166,TRUE,TRUE,FALSE,FALSE,FALSE,2024-08-14,2024-08-27,1,lemon07r/Gemma-2-Ataraxy-9B (Merge),gemma,66,10.159,2.91068818043067 +lemon07r/Gemma-2-Ataraxy-9B_bfloat16_fb22193268c7a6c3b4598255999ce2de3af8c256_False,lemon07r/Gemma-2-Ataraxy-9B,fb22193268c7a6c3b4598255999ce2de3af8c256,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,22.4652844939409,FALSE,IFEval,0.300877227977322,30.0877227977322,BBH,0.593129841772577,42.0319905289865,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.334731543624161,11.2975391498881,MUSR,0.442427083333333,14.4700520833333,MMLU-PRO,0.422623005319149,35.8470005910166,TRUE,TRUE,FALSE,FALSE,FALSE,2024-08-14,2024-08-27,1,lemon07r/Gemma-2-Ataraxy-9B (Merge),gemma,67,10.159,2.91068818043067 lemon07r/Gemma-2-Ataraxy-Advanced-9B_bfloat16_960654f5780f0b458367a6b591ad8440892c2aad_False,lemon07r/Gemma-2-Ataraxy-Advanced-9B,960654f5780f0b458367a6b591ad8440892c2aad,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,25.1096938653496,FALSE,IFEval,0.551596430803601,55.1596430803601,BBH,0.588906726318496,41.1614381547368,MATH Level 5,0.00377643504531722,0.377643504531722,GPQA,0.335570469798658,11.4093959731544,MUSR,0.376072916666667,6.50911458333333,MMLU-PRO,0.42436835106383,36.0409278959811,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-09-30,1,lemon07r/Gemma-2-Ataraxy-Advanced-9B (Merge),"",3,10.159,3.22727724523601 lemon07r/Gemma-2-Ataraxy-Remix-9B_bfloat16_f917a9be9f86d58fe122d58ba84cf4b08e4a975e_False,lemon07r/Gemma-2-Ataraxy-Remix-9B,f917a9be9f86d58fe122d58ba84cf4b08e4a975e,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,29.2616712539704,FALSE,IFEval,0.708341644614069,70.8341644614069,BBH,0.589202101504685,41.5923128159338,MATH Level 5,0.0158610271903323,1.58610271903323,GPQA,0.338926174496644,11.8568232662192,MUSR,0.4371875,13.7151041666667,MMLU-PRO,0.423869680851064,35.9855200945627,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-09-30,1,lemon07r/Gemma-2-Ataraxy-Remix-9B (Merge),"",4,10.159,2.15744090409982 lemon07r/Gemma-2-Ataraxy-v2-9B_bfloat16_77aca48ac25eb2cbe8c0751a4ef77e5face34d80_False,lemon07r/Gemma-2-Ataraxy-v2-9B,77aca48ac25eb2cbe8c0751a4ef77e5face34d80,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,19.1738302064348,FALSE,IFEval,0.213624294649308,21.3624294649308,BBH,0.576583581562531,39.7968535972527,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.342281879194631,12.3042505592841,MUSR,0.348385416666667,4.88151041666667,MMLU-PRO,0.422124335106383,35.7915927895981,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-28,2024-09-28,1,lemon07r/Gemma-2-Ataraxy-v2-9B (Merge),"",14,10.159,2.99624189404415 -lemon07r/Gemma-2-Ataraxy-v2a-9B_bfloat16_899fb093d80569fc919f53217e3acf031dde89a5_False,lemon07r/Gemma-2-Ataraxy-v2a-9B,899fb093d80569fc919f53217e3acf031dde89a5,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,15.0193613837601,FALSE,IFEval,0.159469097550056,15.9469097550056,BBH,0.518248966271832,31.198528369417,MATH Level 5,0,0,GPQA,0.339765100671141,11.9686800894855,MUSR,0.316479166666667,3.05989583333333,MMLU-PRO,0.351479388297872,27.9421542553192,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-29,2024-09-29,1,lemon07r/Gemma-2-Ataraxy-v2a-9B (Merge),"",1,10.159,2.98139623564809 +lemon07r/Gemma-2-Ataraxy-v2a-9B_bfloat16_899fb093d80569fc919f53217e3acf031dde89a5_False,lemon07r/Gemma-2-Ataraxy-v2a-9B,899fb093d80569fc919f53217e3acf031dde89a5,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,15.0193613837601,FALSE,IFEval,0.159469097550056,15.9469097550056,BBH,0.518248966271832,31.198528369417,MATH Level 5,0,0,GPQA,0.339765100671141,11.9686800894855,MUSR,0.316479166666667,3.05989583333333,MMLU-PRO,0.351479388297872,27.9421542553192,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-29,2024-09-29,1,lemon07r/Gemma-2-Ataraxy-v2a-9B (Merge),"",2,10.159,2.98139623564809 lemon07r/Gemma-2-Ataraxy-v2f-9B_bfloat16_44da9d6a9bc7be5a9af24fb0951047849d5f717d_False,lemon07r/Gemma-2-Ataraxy-v2f-9B,44da9d6a9bc7be5a9af24fb0951047849d5f717d,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,18.7659444016726,FALSE,IFEval,0.379114083963882,37.9114083963882,BBH,0.519284546796177,31.4213361954188,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.323145833333333,3.59322916666667,MMLU-PRO,0.350315824468085,27.8128693853428,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-09-30,1,lemon07r/Gemma-2-Ataraxy-v2f-9B (Merge),"",1,10.159,3.39859555497881 lemon07r/Gemma-2-Ataraxy-v3-Advanced-9B_bfloat16_318afe2b44a150780e44483a0f90a499e81f946f_False,lemon07r/Gemma-2-Ataraxy-v3-Advanced-9B,318afe2b44a150780e44483a0f90a499e81f946f,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,28.333876970643,FALSE,IFEval,0.660181651351747,66.0181651351747,BBH,0.593514685373779,42.2104722912777,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.336409395973154,11.5212527964206,MUSR,0.44496875,14.5877604166667,MMLU-PRO,0.419630984042553,35.5145537825059,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-09,2024-10-09,1,lemon07r/Gemma-2-Ataraxy-v3-Advanced-9B (Merge),"",3,10.159,2.78799597948833 lemon07r/Gemma-2-Ataraxy-v3b-9B_bfloat16_de8bbacddabf22dad89658d3b3d358b3eccbd59c_False,lemon07r/Gemma-2-Ataraxy-v3b-9B,de8bbacddabf22dad89658d3b3d358b3eccbd59c,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,29.0163291770684,FALSE,IFEval,0.680914418188185,68.0914418188185,BBH,0.590769816289816,41.6239854921233,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.333053691275168,11.0738255033557,MUSR,0.448875,15.209375,MMLU-PRO,0.42046210106383,35.6069001182033,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-08,2024-10-08,1,lemon07r/Gemma-2-Ataraxy-v3b-9B (Merge),"",1,9.242,2.30372776599022 @@ -2120,7 +2123,7 @@ llnYou/ECE-PRYMMAL-YL-3B-SLERP-V2_bfloat16_c3d4fbef1a10ef2746c47c0379b4247c78475 llnYou/ECE-PRYMMAL-YL-3B-SLERP-V3_bfloat16_90648507743059de96334fdc97309b6f2af3d01d_False,llnYou/ECE-PRYMMAL-YL-3B-SLERP-V3,90648507743059de96334fdc97309b6f2af3d01d,bfloat16,basemergesandmoerges,Original,Phi3ForCausalLM,22.9107419271518,FALSE,IFEval,0.358081002850215,35.8081002850215,BBH,0.547312191805515,36.6257563245135,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.304530201342282,7.27069351230425,MUSR,0.436135416666667,14.0502604166667,MMLU-PRO,0.404338430851064,33.8153812056738,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-13,2024-11-13,0,llnYou/ECE-PRYMMAL-YL-3B-SLERP-V3,apache-2.0,0,3.821,0.543325489591988 lmsys/vicuna-13b-v1.3_float16_6566e9cb1787585d1147dcf4f9bc48f29e1328d2_True,lmsys/vicuna-13b-v1.3,6566e9cb1787585d1147dcf4f9bc48f29e1328d2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,10.284476273841,TRUE,IFEval,0.334350634095312,33.4350634095312,BBH,0.338439931277757,7.48978931162921,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.26761744966443,2.3489932885906,MUSR,0.372729166666667,4.09114583333333,MMLU-PRO,0.224318484042553,13.813164893617,TRUE,FALSE,FALSE,FALSE,TRUE,2023-06-18,2024-06-28,0,lmsys/vicuna-13b-v1.3,"",197,13,1.09423290568838 lmsys/vicuna-7b-v1.3_float16_236eeeab96f0dc2e463f2bebb7bb49809279c6d6_True,lmsys/vicuna-7b-v1.3,236eeeab96f0dc2e463f2bebb7bb49809279c6d6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.31181120581355,TRUE,IFEval,0.290861580606125,29.0861580606125,BBH,0.329841000659292,6.4613787960182,MATH Level 5,0,0,GPQA,0.24244966442953,0,MUSR,0.379333333333333,5.01666666666667,MMLU-PRO,0.183759973404255,9.30666371158392,TRUE,FALSE,FALSE,FALSE,TRUE,2023-06-18,2024-06-28,0,lmsys/vicuna-7b-v1.3,"",129,7,0.563378203120384 -lmsys/vicuna-7b-v1.5_float16_3321f76e3f527bd14065daf69dad9344000a201d_False,lmsys/vicuna-7b-v1.5,3321f76e3f527bd14065daf69dad9344000a201d,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,10.7844473803135,FALSE,IFEval,0.235157160777847,23.5157160777847,BBH,0.394704368422338,15.1525093128437,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.258389261744966,1.11856823266219,MUSR,0.423114583333333,11.42265625,MMLU-PRO,0.214677526595745,12.7419473995272,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-29,2024-06-12,0,lmsys/vicuna-7b-v1.5,llama2,321,7,0.602718105132222 +lmsys/vicuna-7b-v1.5_float16_3321f76e3f527bd14065daf69dad9344000a201d_False,lmsys/vicuna-7b-v1.5,3321f76e3f527bd14065daf69dad9344000a201d,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,10.7844473803135,FALSE,IFEval,0.235157160777847,23.5157160777847,BBH,0.394704368422338,15.1525093128437,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.258389261744966,1.11856823266219,MUSR,0.423114583333333,11.42265625,MMLU-PRO,0.214677526595745,12.7419473995272,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-29,2024-06-12,0,lmsys/vicuna-7b-v1.5,llama2,322,7,0.602718105132222 lodrick-the-lafted/llama-3.1-8b-instruct-ortho-v7_bfloat16_6b7673cd78398c3a8c92f8e759aaae6409e96978_False,lodrick-the-lafted/llama-3.1-8b-instruct-ortho-v7,6b7673cd78398c3a8c92f8e759aaae6409e96978,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.6617619528325,FALSE,IFEval,0.351461898872769,35.1461898872769,BBH,0.390691402613629,14.4378630794236,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.272651006711409,3.02013422818792,MUSR,0.36159375,4.73255208333333,MMLU-PRO,0.197390292553192,10.8211436170213,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-25,2024-07-30,0,lodrick-the-lafted/llama-3.1-8b-instruct-ortho-v7,wtfpl,0,8.03,0.931573857187958 lordjia/Llama-3-Cantonese-8B-Instruct_bfloat16_ea98e9b1ab3ea0d66e5270816e43d7a70aaaa151_True,lordjia/Llama-3-Cantonese-8B-Instruct,ea98e9b1ab3ea0d66e5270816e43d7a70aaaa151,bfloat16,chatmodels,Original,LlamaForCausalLM,24.2591207678994,TRUE,IFEval,0.666925978625602,66.6925978625602,BBH,0.481414801895404,26.7910388402978,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.293624161073826,5.8165548098434,MUSR,0.404604166666667,9.47552083333334,MMLU-PRO,0.351479388297872,27.9421542553192,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-08-03,0,lordjia/Llama-3-Cantonese-8B-Instruct,llama3,5,8.03,0.76770296284449 lordjia/Qwen2-Cantonese-7B-Instruct_bfloat16_eb8b0faee749d167fd70e74f5e579094c4cfe7fb_True,lordjia/Qwen2-Cantonese-7B-Instruct,eb8b0faee749d167fd70e74f5e579094c4cfe7fb,bfloat16,chatmodels,Original,Qwen2ForCausalLM,23.640515390226,TRUE,IFEval,0.54352783946595,54.352783946595,BBH,0.521531134622122,32.453216657913,MATH Level 5,0.0959214501510574,9.59214501510574,GPQA,0.295302013422819,6.04026845637584,MUSR,0.400385416666667,7.81484375,MMLU-PRO,0.384308510638298,31.5898345153664,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-13,2024-08-03,0,lordjia/Qwen2-Cantonese-7B-Instruct,apache-2.0,3,7.616,1.01600679589683 @@ -2169,23 +2172,23 @@ meta-llama/Llama-2-13b-chat-hf_float16_a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8_ meta-llama/Llama-2-13b-hf_float16_5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1_False,meta-llama/Llama-2-13b-hf,5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1,float16,pretrained,Original,LlamaForCausalLM,11.0148335140031,FALSE,IFEval,0.248246873850273,24.8246873850273,BBH,0.412562422338351,17.2225598250581,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.281040268456376,4.13870246085012,MUSR,0.35375,3.38541666666667,MMLU-PRO,0.237782579787234,15.3091755319149,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-13b-hf,llama2,581,13.016,1.11238015630798 meta-llama/Llama-2-70b-chat-hf_float16_e9149a12809580e8602995856f8098ce973d1080_True,meta-llama/Llama-2-70b-chat-hf,e9149a12809580e8602995856f8098ce973d1080,float16,chatmodels,Original,LlamaForCausalLM,12.7464047385667,TRUE,IFEval,0.495792275606502,49.5792275606502,BBH,0.304247414616427,4.61376708259061,MATH Level 5,0.00981873111782478,0.981873111782478,GPQA,0.264261744966443,1.90156599552573,MUSR,0.368666666666667,3.48333333333334,MMLU-PRO,0.24326795212766,15.9186613475177,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-14,2024-06-12,0,meta-llama/Llama-2-70b-chat-hf,llama2,2172,68.977,22.8984550552606 meta-llama/Llama-2-70b-hf_float16_3aba440b59558f995867ba6e1f58f21d0336b5bb_False,meta-llama/Llama-2-70b-hf,3aba440b59558f995867ba6e1f58f21d0336b5bb,float16,pretrained,Original,LlamaForCausalLM,18.3096580216144,FALSE,IFEval,0.240678067527494,24.0678067527494,BBH,0.547259119044934,35.9000618637217,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.302852348993289,7.04697986577182,MUSR,0.412354166666667,9.77760416666667,MMLU-PRO,0.371758643617021,30.1954048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-11,2024-06-12,0,meta-llama/Llama-2-70b-hf,llama2,844,68.977,29.6212466171519 -meta-llama/Llama-2-7b-chat-hf_float16_f5db02db724555f92da89c216ac04704f23d4590_True,meta-llama/Llama-2-7b-chat-hf,f5db02db724555f92da89c216ac04704f23d4590,float16,pretrained,Original,LlamaForCausalLM,9.39548527825095,TRUE,IFEval,0.398647810032935,39.8647810032935,BBH,0.311354635500219,4.45917164595948,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.253355704697987,0.447427293064876,MUSR,0.367552083333333,3.27734375,MMLU-PRO,0.168799867021277,7.64442966903073,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-08-30,0,meta-llama/Llama-2-7b-chat-hf,llama2,4134,6.738,1.15687903615516 -meta-llama/Llama-2-7b-hf_float16_01c7f73d771dfac7d292323805ebc428287df4f9_False,meta-llama/Llama-2-7b-hf,01c7f73d771dfac7d292323805ebc428287df4f9,float16,pretrained,Original,LlamaForCausalLM,8.73082889563367,FALSE,IFEval,0.251893863836842,25.1893863836842,BBH,0.349619581998218,10.351416657849,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.3700625,3.7578125,MMLU-PRO,0.18608710106383,9.56523345153664,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-7b-hf,llama2,1891,6.738,0.563094562772064 -meta-llama/Llama-3.1-8B_float16_d04e592bb4f6aa9cfee91e2e20afa771667e1d4b_False,meta-llama/Llama-3.1-8B,d04e592bb4f6aa9cfee91e2e20afa771667e1d4b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2194553235834,FALSE,IFEval,0.124598288097803,12.4598288097803,BBH,0.465959054460073,25.3044706347549,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.310402684563758,8.05369127516779,MUSR,0.3811875,8.71510416666667,MMLU-PRO,0.328789893617021,25.4210992907801,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-12-07,0,meta-llama/Llama-3.1-8B,llama3.1,1263,8.03,0.713243580943846 -meta-llama/Llama-3.2-1B_bfloat16_a7c18587d7f473bfea02aa5639aa349403307b54_False,meta-llama/Llama-3.2-1B,a7c18587d7f473bfea02aa5639aa349403307b54,bfloat16,pretrained,Original,LlamaForCausalLM,4.03149449541509,FALSE,IFEval,0.147779004153424,14.7779004153424,BBH,0.311495409646081,4.36602965655676,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.228187919463087,0,MUSR,0.344729166666667,2.5578125,MMLU-PRO,0.120345744680851,2.26063829787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B,llama3.2,1431,1.24,0.41912851784102 -meta-llama/Llama-3.2-1B-Instruct_bfloat16_d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0_True,meta-llama/Llama-3.2-1B-Instruct,d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0,bfloat16,chatmodels,Original,LlamaForCausalLM,13.8137204928249,TRUE,IFEval,0.569831380736446,56.9831380736446,BBH,0.349684980617683,8.74252131230305,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.275167785234899,3.35570469798658,MUSR,0.332854166666667,2.9734375,MMLU-PRO,0.168218085106383,7.57978723404255,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B-Instruct,llama3.2,690,1.24,0.404904524907622 -meta-llama/Llama-3.2-3B_bfloat16_95c102307f55fbd6d18ddf28bfbcb537ffdc2806_False,meta-llama/Llama-3.2-3B,95c102307f55fbd6d18ddf28bfbcb537ffdc2806,bfloat16,pretrained,Original,LlamaForCausalLM,8.5845296652033,FALSE,IFEval,0.133740696906431,13.374069690643,BBH,0.390511711699106,14.2326648843641,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.26761744966443,2.3489932885906,MUSR,0.35771875,3.81484375,MMLU-PRO,0.248753324468085,16.5281471631206,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B,llama3.2,450,3.213,1.33181264899492 -meta-llama/Llama-3.2-3B-Instruct_bfloat16_276b29ce8303c9b88966a9b32fc75692dce4d8e1_True,meta-llama/Llama-3.2-3B-Instruct,276b29ce8303c9b88966a9b32fc75692dce4d8e1,bfloat16,chatmodels,Original,LlamaForCausalLM,24.1165339900694,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.461007023946607,24.0591864468855,MATH Level 5,0.171450151057402,17.1450151057402,GPQA,0.278523489932886,3.80313199105145,MUSR,0.352854166666667,1.3734375,MMLU-PRO,0.319481382978723,24.3868203309693,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B-Instruct,llama3.2,872,3.213,1.27120351986613 -meta-llama/Llama-3.3-70B-Instruct_bfloat16__True,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,chatmodels,Original,LlamaForCausalLM,36.8288410384085,TRUE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-03,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1579,70.554,38.2795370537265 -meta-llama/Meta-Llama-3-70B_bfloat16_b4d08b7db49d488da3ac49adf25a6b9ac01ae338_False,meta-llama/Meta-Llama-3-70B,b4d08b7db49d488da3ac49adf25a6b9ac01ae338,bfloat16,pretrained,Original,LlamaForCausalLM,26.6675858211602,FALSE,IFEval,0.160319064526567,16.0319064526567,BBH,0.646107459990447,48.7098126475059,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.397651006711409,19.6868008948546,MUSR,0.451822916666667,16.0111979166667,MMLU-PRO,0.470910904255319,41.2123226950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-70B,llama3,841,70.554,23.4071857793614 +meta-llama/Llama-2-7b-chat-hf_float16_f5db02db724555f92da89c216ac04704f23d4590_True,meta-llama/Llama-2-7b-chat-hf,f5db02db724555f92da89c216ac04704f23d4590,float16,pretrained,Original,LlamaForCausalLM,9.39548527825095,TRUE,IFEval,0.398647810032935,39.8647810032935,BBH,0.311354635500219,4.45917164595948,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.253355704697987,0.447427293064876,MUSR,0.367552083333333,3.27734375,MMLU-PRO,0.168799867021277,7.64442966903073,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-08-30,0,meta-llama/Llama-2-7b-chat-hf,llama2,4136,6.738,1.15687903615516 +meta-llama/Llama-2-7b-hf_float16_01c7f73d771dfac7d292323805ebc428287df4f9_False,meta-llama/Llama-2-7b-hf,01c7f73d771dfac7d292323805ebc428287df4f9,float16,pretrained,Original,LlamaForCausalLM,8.73082889563367,FALSE,IFEval,0.251893863836842,25.1893863836842,BBH,0.349619581998218,10.351416657849,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.3700625,3.7578125,MMLU-PRO,0.18608710106383,9.56523345153664,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-7b-hf,llama2,1892,6.738,0.563094562772064 +meta-llama/Llama-3.1-8B_float16_d04e592bb4f6aa9cfee91e2e20afa771667e1d4b_False,meta-llama/Llama-3.1-8B,d04e592bb4f6aa9cfee91e2e20afa771667e1d4b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2194553235834,FALSE,IFEval,0.124598288097803,12.4598288097803,BBH,0.465959054460073,25.3044706347549,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.310402684563758,8.05369127516779,MUSR,0.3811875,8.71510416666667,MMLU-PRO,0.328789893617021,25.4210992907801,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-12-07,0,meta-llama/Llama-3.1-8B,llama3.1,1265,8.03,0.713243580943846 +meta-llama/Llama-3.2-1B_bfloat16_a7c18587d7f473bfea02aa5639aa349403307b54_False,meta-llama/Llama-3.2-1B,a7c18587d7f473bfea02aa5639aa349403307b54,bfloat16,pretrained,Original,LlamaForCausalLM,4.03149449541509,FALSE,IFEval,0.147779004153424,14.7779004153424,BBH,0.311495409646081,4.36602965655676,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.228187919463087,0,MUSR,0.344729166666667,2.5578125,MMLU-PRO,0.120345744680851,2.26063829787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B,llama3.2,1436,1.24,0.41912851784102 +meta-llama/Llama-3.2-1B-Instruct_bfloat16_d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0_True,meta-llama/Llama-3.2-1B-Instruct,d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0,bfloat16,chatmodels,Original,LlamaForCausalLM,13.8137204928249,TRUE,IFEval,0.569831380736446,56.9831380736446,BBH,0.349684980617683,8.74252131230305,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.275167785234899,3.35570469798658,MUSR,0.332854166666667,2.9734375,MMLU-PRO,0.168218085106383,7.57978723404255,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B-Instruct,llama3.2,691,1.24,0.404904524907622 +meta-llama/Llama-3.2-3B_bfloat16_95c102307f55fbd6d18ddf28bfbcb537ffdc2806_False,meta-llama/Llama-3.2-3B,95c102307f55fbd6d18ddf28bfbcb537ffdc2806,bfloat16,pretrained,Original,LlamaForCausalLM,8.5845296652033,FALSE,IFEval,0.133740696906431,13.374069690643,BBH,0.390511711699106,14.2326648843641,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.26761744966443,2.3489932885906,MUSR,0.35771875,3.81484375,MMLU-PRO,0.248753324468085,16.5281471631206,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B,llama3.2,451,3.213,1.33181264899492 +meta-llama/Llama-3.2-3B-Instruct_bfloat16_276b29ce8303c9b88966a9b32fc75692dce4d8e1_True,meta-llama/Llama-3.2-3B-Instruct,276b29ce8303c9b88966a9b32fc75692dce4d8e1,bfloat16,chatmodels,Original,LlamaForCausalLM,24.1165339900694,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.461007023946607,24.0591864468855,MATH Level 5,0.171450151057402,17.1450151057402,GPQA,0.278523489932886,3.80313199105145,MUSR,0.352854166666667,1.3734375,MMLU-PRO,0.319481382978723,24.3868203309693,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B-Instruct,llama3.2,878,3.213,1.27120351986613 +meta-llama/Llama-3.3-70B-Instruct_bfloat16__True,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,chatmodels,Original,LlamaForCausalLM,36.8288410384085,TRUE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-03,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1592,70.554,38.2795370537265 +meta-llama/Meta-Llama-3-70B_bfloat16_b4d08b7db49d488da3ac49adf25a6b9ac01ae338_False,meta-llama/Meta-Llama-3-70B,b4d08b7db49d488da3ac49adf25a6b9ac01ae338,bfloat16,pretrained,Original,LlamaForCausalLM,26.6675858211602,FALSE,IFEval,0.160319064526567,16.0319064526567,BBH,0.646107459990447,48.7098126475059,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.397651006711409,19.6868008948546,MUSR,0.451822916666667,16.0111979166667,MMLU-PRO,0.470910904255319,41.2123226950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-70B,llama3,842,70.554,23.4071857793614 meta-llama/Meta-Llama-3-70B-Instruct_bfloat16_7129260dd854a80eb10ace5f61c20324b472b31c_True,meta-llama/Meta-Llama-3-70B-Instruct,7129260dd854a80eb10ace5f61c20324b472b31c,bfloat16,chatmodels,Original,LlamaForCausalLM,36.5106934142651,TRUE,IFEval,0.809907711538717,80.9907711538717,BBH,0.654669943237205,50.1851331844035,MATH Level 5,0.253021148036254,25.3021148036254,GPQA,0.286912751677852,4.92170022371365,MUSR,0.415364583333333,10.9205729166667,MMLU-PRO,0.520694813829787,46.7438682033097,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,1,meta-llama/Meta-Llama-3-70B,llama3,1452,70.554,18.2391501177391 -meta-llama/Meta-Llama-3-8B_bfloat16_62bd457b6fe961a42a631306577e622c83876cb6_False,meta-llama/Meta-Llama-3-8B,62bd457b6fe961a42a631306577e622c83876cb6,bfloat16,pretrained,Original,LlamaForCausalLM,13.4632115530557,FALSE,IFEval,0.145506145915061,14.5506145915061,BBH,0.459790519524026,24.500763796768,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.305369127516779,7.38255033557047,MUSR,0.36140625,6.24244791666667,MMLU-PRO,0.320977393617021,24.5530437352246,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B,llama3,5958,8.03,0.87256849761081 -meta-llama/Meta-Llama-3-8B-Instruct_bfloat16_e1945c40cd546c78e41f1151f4db032b271faeaa_True,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,bfloat16,chatmodels,Original,LlamaForCausalLM,23.9087356939368,TRUE,IFEval,0.740839860459137,74.0839860459137,BBH,0.498871111361695,28.2449495763436,MATH Level 5,0.0868580060422961,8.68580060422961,GPQA,0.259228187919463,1.23042505592841,MUSR,0.356822916666667,1.60286458333334,MMLU-PRO,0.366439494680851,29.6043882978723,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3752,8.03,0.797499677890947 -meta-llama/Meta-Llama-3-8B-Instruct_float16_e1945c40cd546c78e41f1151f4db032b271faeaa_False,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,float16,chatmodels,Original,LlamaForCausalLM,20.5965713292081,FALSE,IFEval,0.478232201669349,47.8232201669349,BBH,0.491026417512868,26.7952835025737,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.292785234899329,5.70469798657718,MUSR,0.380541666666667,5.40104166666667,MMLU-PRO,0.359125664893617,28.7917405437352,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-07-08,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3752,8.03,0.949473257188463 +meta-llama/Meta-Llama-3-8B_bfloat16_62bd457b6fe961a42a631306577e622c83876cb6_False,meta-llama/Meta-Llama-3-8B,62bd457b6fe961a42a631306577e622c83876cb6,bfloat16,pretrained,Original,LlamaForCausalLM,13.4632115530557,FALSE,IFEval,0.145506145915061,14.5506145915061,BBH,0.459790519524026,24.500763796768,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.305369127516779,7.38255033557047,MUSR,0.36140625,6.24244791666667,MMLU-PRO,0.320977393617021,24.5530437352246,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B,llama3,5960,8.03,0.87256849761081 +meta-llama/Meta-Llama-3-8B-Instruct_bfloat16_e1945c40cd546c78e41f1151f4db032b271faeaa_True,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,bfloat16,chatmodels,Original,LlamaForCausalLM,23.9087356939368,TRUE,IFEval,0.740839860459137,74.0839860459137,BBH,0.498871111361695,28.2449495763436,MATH Level 5,0.0868580060422961,8.68580060422961,GPQA,0.259228187919463,1.23042505592841,MUSR,0.356822916666667,1.60286458333334,MMLU-PRO,0.366439494680851,29.6043882978723,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3754,8.03,0.797499677890947 +meta-llama/Meta-Llama-3-8B-Instruct_float16_e1945c40cd546c78e41f1151f4db032b271faeaa_False,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,float16,chatmodels,Original,LlamaForCausalLM,20.5965713292081,FALSE,IFEval,0.478232201669349,47.8232201669349,BBH,0.491026417512868,26.7952835025737,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.292785234899329,5.70469798657718,MUSR,0.380541666666667,5.40104166666667,MMLU-PRO,0.359125664893617,28.7917405437352,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-07-08,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3754,8.03,0.949473257188463 meta-llama/Meta-Llama-3.1-70B_bfloat16_f7d3cc45ed4ff669a354baf2e0f05e65799a0bee_True,meta-llama/Meta-Llama-3.1-70B,f7d3cc45ed4ff669a354baf2e0f05e65799a0bee,bfloat16,pretrained,Original,LlamaForCausalLM,26.2002158433759,TRUE,IFEval,0.168437523548629,16.8437523548629,BBH,0.626006918317161,46.3994129558189,MATH Level 5,0.18429003021148,18.429003021148,GPQA,0.38758389261745,18.34451901566,MUSR,0.4571875,16.5817708333333,MMLU-PRO,0.465425531914894,40.6028368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-70B,llama3.1,334,70.554,13.6018520327186 -meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,768,70.554,26.8020157168701 -meta-llama/Meta-Llama-3.1-8B_bfloat16_e5c39e551424c763dbc3e58e32ef2999d33a6d8d_True,meta-llama/Meta-Llama-3.1-8B,e5c39e551424c763dbc3e58e32ef2999d33a6d8d,bfloat16,pretrained,Original,LlamaForCausalLM,13.8690662612791,TRUE,IFEval,0.126996369632575,12.6996369632575,BBH,0.4666136555004,25.2947798510872,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.296140939597315,6.15212527964205,MUSR,0.382520833333333,8.98177083333333,MMLU-PRO,0.324551196808511,24.9501329787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-8B,llama3.1,1263,8.03,3.5985230038683 -meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3418,8.03,2.48701186834409 +meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,769,70.554,26.8020157168701 +meta-llama/Meta-Llama-3.1-8B_bfloat16_e5c39e551424c763dbc3e58e32ef2999d33a6d8d_True,meta-llama/Meta-Llama-3.1-8B,e5c39e551424c763dbc3e58e32ef2999d33a6d8d,bfloat16,pretrained,Original,LlamaForCausalLM,13.8690662612791,TRUE,IFEval,0.126996369632575,12.6996369632575,BBH,0.4666136555004,25.2947798510872,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.296140939597315,6.15212527964205,MUSR,0.382520833333333,8.98177083333333,MMLU-PRO,0.324551196808511,24.9501329787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-8B,llama3.1,1265,8.03,3.5985230038683 +meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3423,8.03,2.48701186834409 mhl1/Qwen2.5-0.5B-cinstruct-stage1_bfloat16_19d55d8d5bf1e7d98a865121862f3781a27b1b2e_True,mhl1/Qwen2.5-0.5B-cinstruct-stage1,19d55d8d5bf1e7d98a865121862f3781a27b1b2e,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,4.36284288680766,TRUE,IFEval,0.148179053799474,14.8179053799474,BBH,0.325578324782835,5.72452729062484,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.26510067114094,2.01342281879195,MUSR,0.35003125,1.92057291666667,MMLU-PRO,0.113946143617021,1.54957151300236,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,mhl1/Qwen2.5-0.5B-cinstruct-stage1 (Merge),apache-2.0,0,0.63,0.882400730496291 microsoft/DialoGPT-medium_bfloat16_7b40bb0f92c45fefa957d088000d8648e5c7fa33_True,microsoft/DialoGPT-medium,7b40bb0f92c45fefa957d088000d8648e5c7fa33,bfloat16,chatmodels,Original,GPT2LMHeadModel,5.25143360679031,TRUE,IFEval,0.147904227449833,14.7904227449833,BBH,0.301415638014199,2.55685577233522,MATH Level 5,0,0,GPQA,0.254194630872483,0.559284116331097,MUSR,0.428666666666667,12.2833333333333,MMLU-PRO,0.11186835106383,1.31870567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-13,0,microsoft/DialoGPT-medium,mit,343,0.345,0.129464485100266 microsoft/Orca-2-13b_bfloat16_2539ff53e6baa4cc603774ad5a2d646f4041ea4e_False,microsoft/Orca-2-13b,2539ff53e6baa4cc603774ad5a2d646f4041ea4e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.1494038209109,FALSE,IFEval,0.31279338820995,31.279338820995,BBH,0.488448972883961,27.3080194999426,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.280201342281879,4.0268456375839,MUSR,0.51296875,25.7877604166667,MMLU-PRO,0.274933510638298,19.4370567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-14,2024-06-12,0,microsoft/Orca-2-13b,other,666,13,1.00858169959549 @@ -2193,17 +2196,17 @@ microsoft/Orca-2-7b_bfloat16_60e31e6bdcf582ad103b807cb74b73ee1d2c4b17_False,micr microsoft/Phi-3-medium-128k-instruct_bfloat16_fa7d2aa4f5ea69b2e36b20d050cdae79c9bfbb3f_True,microsoft/Phi-3-medium-128k-instruct,fa7d2aa4f5ea69b2e36b20d050cdae79c9bfbb3f,bfloat16,chatmodels,Original,Phi3ForCausalLM,31.7116532556656,TRUE,IFEval,0.604002934436185,60.4002934436185,BBH,0.638232253087055,48.4604512739902,MATH Level 5,0.172960725075529,17.2960725075529,GPQA,0.336409395973154,11.5212527964206,MUSR,0.412947916666667,11.3518229166667,MMLU-PRO,0.471160239361702,41.2400265957447,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-08-21,0,microsoft/Phi-3-medium-128k-instruct,mit,376,13.96,1.94755874452617 microsoft/Phi-3-medium-4k-instruct_bfloat16_d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc_True,microsoft/Phi-3-medium-4k-instruct,d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc,bfloat16,chatmodels,Original,Phi3ForCausalLM,32.8962495702928,TRUE,IFEval,0.642271395452954,64.2271395452954,BBH,0.641246489055555,49.3806100742202,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.336409395973154,11.5212527964206,MUSR,0.42575,13.0520833333333,MMLU-PRO,0.467586436170213,40.8429373522459,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-12,0,microsoft/Phi-3-medium-4k-instruct,mit,215,13.96,1.45526252332937 microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1626,3.821,24.2222515926888 -microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1110,3.821,0.804074829912372 -microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1110,3.821,0.786699265454341 +microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1112,3.821,0.804074829912372 +microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1112,3.821,0.786699265454341 microsoft/Phi-3-small-128k-instruct_bfloat16_f80aaa30bfc64c2b8ab214b541d9050e97163bc4_True,microsoft/Phi-3-small-128k-instruct,f80aaa30bfc64c2b8ab214b541d9050e97163bc4,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,28.5909915695228,TRUE,IFEval,0.636825844315306,63.6825844315306,BBH,0.620217677869698,45.6340696414479,MATH Level 5,0,0,GPQA,0.317114093959732,8.94854586129754,MUSR,0.43784375,14.4971354166667,MMLU-PRO,0.449052526595745,38.7836140661939,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-128k-instruct,mit,173,7.392,2.50846790619425 microsoft/Phi-3-small-8k-instruct_bfloat16_1535ae26fb4faada95c6950e8bc6e867cdad6b00_True,microsoft/Phi-3-small-8k-instruct,1535ae26fb4faada95c6950e8bc6e867cdad6b00,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,29.6709218521057,TRUE,IFEval,0.649665110794913,64.9665110794913,BBH,0.620836488087056,46.2055703663891,MATH Level 5,0.0284301430770108,2.84301430770108,GPQA,0.312080536912752,8.27740492170022,MUSR,0.455791666666667,16.7739583333333,MMLU-PRO,0.45063164893617,38.9590721040189,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-8k-instruct,mit,159,7.392,1.0254536035218 -microsoft/Phi-3.5-MoE-instruct_bfloat16_482a9ba0eb0e1fa1671e3560e009d7cec2e5147c_True,microsoft/Phi-3.5-MoE-instruct,482a9ba0eb0e1fa1671e3560e009d7cec2e5147c,bfloat16,chatmodels,Original,Phi3ForCausalLM,35.4565075216065,TRUE,IFEval,0.692454908531585,69.2454908531585,BBH,0.640762564622586,48.7746463593219,MATH Level 5,0.226586102719033,22.6586102719033,GPQA,0.355704697986577,14.0939597315436,MUSR,0.456479166666667,17.3265625,MMLU-PRO,0.465757978723404,40.6397754137116,TRUE,FALSE,TRUE,FALSE,TRUE,2024-08-17,2024-08-21,0,microsoft/Phi-3.5-MoE-instruct,mit,547,42,4.63227861394431 +microsoft/Phi-3.5-MoE-instruct_bfloat16_482a9ba0eb0e1fa1671e3560e009d7cec2e5147c_True,microsoft/Phi-3.5-MoE-instruct,482a9ba0eb0e1fa1671e3560e009d7cec2e5147c,bfloat16,chatmodels,Original,Phi3ForCausalLM,35.4565075216065,TRUE,IFEval,0.692454908531585,69.2454908531585,BBH,0.640762564622586,48.7746463593219,MATH Level 5,0.226586102719033,22.6586102719033,GPQA,0.355704697986577,14.0939597315436,MUSR,0.456479166666667,17.3265625,MMLU-PRO,0.465757978723404,40.6397754137116,TRUE,FALSE,TRUE,FALSE,TRUE,2024-08-17,2024-08-21,0,microsoft/Phi-3.5-MoE-instruct,mit,548,42,4.63227861394431 microsoft/Phi-3.5-mini-instruct_bfloat16_64963004ad95869fa73a30279371c8778509ac84_True,microsoft/Phi-3.5-mini-instruct,64963004ad95869fa73a30279371c8778509ac84,bfloat16,chatmodels,Original,Phi3ForCausalLM,27.5675734687961,TRUE,IFEval,0.577450054743636,57.7450054743636,BBH,0.551778512611196,36.7458539085166,MATH Level 5,0.159365558912387,15.9365558912387,GPQA,0.339765100671141,11.9686800894855,MUSR,0.402125,10.0989583333333,MMLU-PRO,0.396193484042553,32.9103871158392,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-16,2024-08-21,0,microsoft/Phi-3.5-mini-instruct,mit,751,3.821,3.69600430233737 microsoft/phi-1_bfloat16_b9ac0e6d78d43970ecf88e9e0154b3a7da20ed89_False,microsoft/phi-1,b9ac0e6d78d43970ecf88e9e0154b3a7da20ed89,bfloat16,pretrained,Original,PhiForCausalLM,5.52396572810627,FALSE,IFEval,0.206805719934219,20.6805719934219,BBH,0.313947558958378,4.27399921221468,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.26510067114094,2.01342281879195,MUSR,0.352510416666667,3.69713541666667,MMLU-PRO,0.116190159574468,1.79890661938534,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-10,2024-06-13,0,microsoft/phi-1,mit,207,1.418,0.28622924752808 microsoft/phi-1_5_float16_675aa382d814580b22651a30acb1a585d7c25963_False,microsoft/phi-1_5,675aa382d814580b22651a30acb1a585d7c25963,float16,pretrained,Original,PhiForCausalLM,7.05767379443971,FALSE,IFEval,0.203283953244059,20.3283953244059,BBH,0.335975832119967,7.46893877007024,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.26761744966443,2.3489932885906,MUSR,0.340416666666667,3.38541666666667,MMLU-PRO,0.169132313829787,7.68136820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-10,2024-06-09,0,microsoft/phi-1_5,mit,1321,1.418,0.340862069057633 microsoft/phi-2_float16_ef382358ec9e382308935a992d908de099b64c23_False,microsoft/phi-2,ef382358ec9e382308935a992d908de099b64c23,float16,pretrained,Original,PhiForCausalLM,15.4713509741263,FALSE,IFEval,0.273875539125077,27.3875539125077,BBH,0.48812087712497,28.0385192934393,MATH Level 5,0.0256797583081571,2.56797583081571,GPQA,0.271812080536913,2.9082774049217,MUSR,0.409895833333333,13.8369791666667,MMLU-PRO,0.26279920212766,18.0888002364066,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-13,2024-06-09,0,microsoft/phi-2,mit,3260,2.78,0.423520982590239 -microsoft/phi-4_float16_381727a5ee103da6c1b14ecd3d39cd09832cbcf8_False,microsoft/phi-4,381727a5ee103da6c1b14ecd3d39cd09832cbcf8,float16,pretrained,Original,Phi3ForCausalLM,29.4834167912232,FALSE,IFEval,0.0487850015736025,4.87850015736025,BBH,0.670346462661911,52.5756715725828,MATH Level 5,0.278700906344411,27.8700906344411,GPQA,0.401006711409396,20.1342281879195,MUSR,0.503354166666667,23.7192708333333,MMLU-PRO,0.529504654255319,47.7227393617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2025-01-08,0,microsoft/phi-4,mit,1024,14.66,0.878361822105986 -microsoft/phi-4_bfloat16_381727a5ee103da6c1b14ecd3d39cd09832cbcf8_True,microsoft/phi-4,381727a5ee103da6c1b14ecd3d39cd09832cbcf8,bfloat16,chatmodels,Original,Phi3ForCausalLM,34.2454249023323,TRUE,IFEval,0.675144173016485,67.5144173016485,BBH,0.688587440604014,55.2392561095812,MATH Level 5,0.123111782477341,12.3111782477341,GPQA,0.337248322147651,11.6331096196868,MUSR,0.411427083333333,10.1283854166667,MMLU-PRO,0.537815824468085,48.6462027186761,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2025-01-08,0,microsoft/phi-4,mit,1024,14.66,1.87735397589108 +microsoft/phi-4_float16_381727a5ee103da6c1b14ecd3d39cd09832cbcf8_False,microsoft/phi-4,381727a5ee103da6c1b14ecd3d39cd09832cbcf8,float16,pretrained,Original,Phi3ForCausalLM,29.4834167912232,FALSE,IFEval,0.0487850015736025,4.87850015736025,BBH,0.670346462661911,52.5756715725828,MATH Level 5,0.278700906344411,27.8700906344411,GPQA,0.401006711409396,20.1342281879195,MUSR,0.503354166666667,23.7192708333333,MMLU-PRO,0.529504654255319,47.7227393617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2025-01-08,0,microsoft/phi-4,mit,1097,14.66,0.878361822105986 +microsoft/phi-4_bfloat16_381727a5ee103da6c1b14ecd3d39cd09832cbcf8_True,microsoft/phi-4,381727a5ee103da6c1b14ecd3d39cd09832cbcf8,bfloat16,chatmodels,Original,Phi3ForCausalLM,34.2454249023323,TRUE,IFEval,0.675144173016485,67.5144173016485,BBH,0.688587440604014,55.2392561095812,MATH Level 5,0.123111782477341,12.3111782477341,GPQA,0.337248322147651,11.6331096196868,MUSR,0.411427083333333,10.1283854166667,MMLU-PRO,0.537815824468085,48.6462027186761,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2025-01-08,0,microsoft/phi-4,mit,1097,14.66,1.87735397589108 migtissera/Llama-3-70B-Synthia-v3.5_float16_8744db0bccfc18f1847633da9d29fc89b35b4190_True,migtissera/Llama-3-70B-Synthia-v3.5,8744db0bccfc18f1847633da9d29fc89b35b4190,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.2042985630762,TRUE,IFEval,0.607649924422754,60.7649924422754,BBH,0.648863802627128,49.1181596957482,MATH Level 5,0.189577039274924,18.9577039274924,GPQA,0.38758389261745,18.34451901566,MUSR,0.492197916666667,23.39140625,MMLU-PRO,0.465841090425532,40.6490100472813,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-26,2024-08-28,0,migtissera/Llama-3-70B-Synthia-v3.5,llama3,5,70.554,8.76969798956 migtissera/Llama-3-8B-Synthia-v3.5_float16_af4990801a24fee7acf16370cb5aa5643b5e9d6c_True,migtissera/Llama-3-8B-Synthia-v3.5,af4990801a24fee7acf16370cb5aa5643b5e9d6c,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.6966778088349,TRUE,IFEval,0.506958204231439,50.6958204231439,BBH,0.488794093366004,27.5423394300577,MATH Level 5,0.0506042296072508,5.06042296072508,GPQA,0.271812080536913,2.9082774049217,MUSR,0.404385416666667,9.41484375,MMLU-PRO,0.303025265957447,22.5583628841608,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-17,2024-08-28,0,migtissera/Llama-3-8B-Synthia-v3.5,llama3,15,8.03,0.828698366274131 migtissera/Tess-3-7B-SFT_bfloat16_404de3b56564dbd43cd64d97f8574b43189462f3_True,migtissera/Tess-3-7B-SFT,404de3b56564dbd43cd64d97f8574b43189462f3,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,17.0961631507225,TRUE,IFEval,0.394626258327903,39.4626258327903,BBH,0.460734838950762,24.123847398237,MATH Level 5,0.0332326283987915,3.32326283987915,GPQA,0.270973154362416,2.79642058165548,MUSR,0.411270833333333,10.2755208333333,MMLU-PRO,0.303357712765957,22.5953014184397,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-09,2024-07-20,1,mistralai/Mistral-7B-v0.3,apache-2.0,4,7.248,0.647169773785903 @@ -2218,20 +2221,20 @@ ministral/Ministral-3b-instruct_bfloat16_2c95908929198d6e69af8638f0dbbd9bc6b93f9 mistral-community/Mistral-7B-v0.2_bfloat16_2c3e624962b1a3f3fbf52e15969565caa7bc064a_False,mistral-community/Mistral-7B-v0.2,2c3e624962b1a3f3fbf52e15969565caa7bc064a,bfloat16,pretrained,Original,MistralForCausalLM,14.2153624426921,FALSE,IFEval,0.2266397602805,22.66397602805,BBH,0.451018796279758,23.9508653830296,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.291946308724832,5.59284116331097,MUSR,0.403177083333333,8.36380208333333,MMLU-PRO,0.295295877659575,21.6995419621749,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-23,2024-06-12,0,mistral-community/Mistral-7B-v0.2,apache-2.0,232,7.242,0.553213277920435 mistral-community/mixtral-8x22B-v0.3_bfloat16_211b177b79ab5ef245ee334d106c27623e786882_False,mistral-community/mixtral-8x22B-v0.3,211b177b79ab5ef245ee334d106c27623e786882,bfloat16,pretrained,Original,MixtralForCausalLM,25.789406608528,FALSE,IFEval,0.258263629392235,25.8263629392235,BBH,0.625000217843585,45.7310408976333,MATH Level 5,0.182779456193354,18.2779456193354,GPQA,0.37751677852349,17.0022371364653,MUSR,0.403697916666667,7.46223958333334,MMLU-PRO,0.463929521276596,40.4366134751773,TRUE,FALSE,TRUE,FALSE,TRUE,2024-05-25,2024-06-13,0,mistral-community/mixtral-8x22B-v0.3,apache-2.0,3,140.63,52.4944851685548 mistralai/Codestral-22B-v0.1_bfloat16_8f5fe23af91885222a1563283c87416745a5e212_True,mistralai/Codestral-22B-v0.1,8f5fe23af91885222a1563283c87416745a5e212,bfloat16,pretrained,Original,MistralForCausalLM,23.2799174068646,TRUE,IFEval,0.577175228393995,57.7175228393995,BBH,0.513913692100317,30.7376344119456,MATH Level 5,0.100453172205438,10.0453172205438,GPQA,0.298657718120805,6.48769574944072,MUSR,0.418708333333333,10.7385416666667,MMLU-PRO,0.315575132978723,23.9527925531915,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-29,2024-09-28,0,mistralai/Codestral-22B-v0.1,other,1175,22.247,1.3066695609381 -mistralai/Ministral-8B-Instruct-2410_bfloat16_199e57c1d66379760f6413f79d27008d1d1dbd6e_True,mistralai/Ministral-8B-Instruct-2410,199e57c1d66379760f6413f79d27008d1d1dbd6e,bfloat16,chatmodels,Original,MistralForCausalLM,22.0078589303086,TRUE,IFEval,0.589639933155139,58.963993315514,BBH,0.476164020168914,25.8247744094178,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.284395973154362,4.58612975391499,MUSR,0.41375,10.71875,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-15,2024-12-01,0,mistralai/Ministral-8B-Instruct-2410,other,385,8.02,0.797086392156932 +mistralai/Ministral-8B-Instruct-2410_bfloat16_199e57c1d66379760f6413f79d27008d1d1dbd6e_True,mistralai/Ministral-8B-Instruct-2410,199e57c1d66379760f6413f79d27008d1d1dbd6e,bfloat16,chatmodels,Original,MistralForCausalLM,22.0078589303086,TRUE,IFEval,0.589639933155139,58.963993315514,BBH,0.476164020168914,25.8247744094178,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.284395973154362,4.58612975391499,MUSR,0.41375,10.71875,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-15,2024-12-01,0,mistralai/Ministral-8B-Instruct-2410,other,386,8.02,0.797086392156932 mistralai/Mistral-7B-Instruct-v0.1_bfloat16_73068f3702d050a2fd5aa2ca1e612e5036429398_True,mistralai/Mistral-7B-Instruct-v0.1,73068f3702d050a2fd5aa2ca1e612e5036429398,bfloat16,chatmodels,Original,MistralForCausalLM,12.6957006941243,TRUE,IFEval,0.448706099815157,44.8706099815157,BBH,0.33548084759811,7.64702053582754,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.25,0,MUSR,0.384760416666667,6.12838541666667,MMLU-PRO,0.241439494680851,15.7154994089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-27,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,1544,7.242,1.21604471748007 mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2610,7.242,0.534406629050985 -mistralai/Mistral-7B-Instruct-v0.3_bfloat16_83e9aa141f2e28c82232fea5325f54edf17c43de_True,mistralai/Mistral-7B-Instruct-v0.3,83e9aa141f2e28c82232fea5325f54edf17c43de,bfloat16,chatmodels,Original,MistralForCausalLM,19.174746309635,TRUE,IFEval,0.546525441384416,54.6525441384416,BBH,0.472196317126484,25.569114948859,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.279362416107383,3.91498881431767,MUSR,0.37390625,4.30494791666667,MMLU-PRO,0.30751329787234,23.0570330969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,1,mistralai/Mistral-7B-v0.3,apache-2.0,1237,7.248,0.5377834643891 -mistralai/Mistral-7B-v0.1_bfloat16_26bca36bde8333b5d7f72e9ed20ccda6a618af24_False,mistralai/Mistral-7B-v0.1,26bca36bde8333b5d7f72e9ed20ccda6a618af24,bfloat16,pretrained,Original,MistralForCausalLM,14.5626190834339,FALSE,IFEval,0.238554812342363,23.8554812342363,BBH,0.443106781218371,22.1684024578981,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.291946308724832,5.59284116331097,MUSR,0.4139375,10.6755208333333,MMLU-PRO,0.301279920212766,22.3644355791962,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-20,2024-06-12,0,mistralai/Mistral-7B-v0.1,apache-2.0,3520,7.242,0.675534465568117 +mistralai/Mistral-7B-Instruct-v0.3_bfloat16_83e9aa141f2e28c82232fea5325f54edf17c43de_True,mistralai/Mistral-7B-Instruct-v0.3,83e9aa141f2e28c82232fea5325f54edf17c43de,bfloat16,chatmodels,Original,MistralForCausalLM,19.174746309635,TRUE,IFEval,0.546525441384416,54.6525441384416,BBH,0.472196317126484,25.569114948859,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.279362416107383,3.91498881431767,MUSR,0.37390625,4.30494791666667,MMLU-PRO,0.30751329787234,23.0570330969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,1,mistralai/Mistral-7B-v0.3,apache-2.0,1239,7.248,0.5377834643891 +mistralai/Mistral-7B-v0.1_bfloat16_26bca36bde8333b5d7f72e9ed20ccda6a618af24_False,mistralai/Mistral-7B-v0.1,26bca36bde8333b5d7f72e9ed20ccda6a618af24,bfloat16,pretrained,Original,MistralForCausalLM,14.5626190834339,FALSE,IFEval,0.238554812342363,23.8554812342363,BBH,0.443106781218371,22.1684024578981,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.291946308724832,5.59284116331097,MUSR,0.4139375,10.6755208333333,MMLU-PRO,0.301279920212766,22.3644355791962,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-20,2024-06-12,0,mistralai/Mistral-7B-v0.1,apache-2.0,3523,7.242,0.675534465568117 mistralai/Mistral-7B-v0.3_bfloat16_b67d6a03ca097c5122fa65904fce0413500bf8c8_False,mistralai/Mistral-7B-v0.3,b67d6a03ca097c5122fa65904fce0413500bf8c8,bfloat16,pretrained,Original,MistralForCausalLM,14.2153624426921,FALSE,IFEval,0.2266397602805,22.66397602805,BBH,0.451018796279758,23.9508653830296,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.291946308724832,5.59284116331097,MUSR,0.403177083333333,8.36380208333333,MMLU-PRO,0.295295877659575,21.6995419621749,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,0,mistralai/Mistral-7B-v0.3,apache-2.0,418,7.248,0.660475600081291 mistralai/Mistral-Large-Instruct-2411_float16_3a5cb136f6106edf5c1210369068eb5a4f787cab_True,mistralai/Mistral-Large-Instruct-2411,3a5cb136f6106edf5c1210369068eb5a4f787cab,float16,chatmodels,Original,MistralForCausalLM,38.4552314758039,TRUE,IFEval,0.840057713533425,84.0057713533425,BBH,0.674664773567507,52.7448919952634,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.437080536912752,24.9440715883669,MUSR,0.454,17.2166666666667,MMLU-PRO,0.556183510638298,50.6870567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-14,2024-11-19,0,mistralai/Mistral-Large-Instruct-2411,other,185,122.61,26.272305228873 mistralai/Mistral-Nemo-Base-2407_bfloat16_d2efb15544d5401f761235bef327babb850887d0_False,mistralai/Mistral-Nemo-Base-2407,d2efb15544d5401f761235bef327babb850887d0,bfloat16,pretrained,Original,MistralForCausalLM,15.1386511082141,FALSE,IFEval,0.162991972410981,16.2991972410981,BBH,0.503506200036929,29.3747364409669,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.293624161073826,5.8165548098434,MUSR,0.392135416666667,6.51692708333334,MMLU-PRO,0.347157579787234,27.4619533096927,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-07-19,0,mistralai/Mistral-Nemo-Base-2407,apache-2.0,274,11.58,1.70299545491031 -mistralai/Mistral-Nemo-Instruct-2407_bfloat16_4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5_True,mistralai/Mistral-Nemo-Instruct-2407,4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5,bfloat16,chatmodels,Original,MistralForCausalLM,23.6333743622513,TRUE,IFEval,0.638024885082692,63.8024885082692,BBH,0.503652395031081,29.6799703811528,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.290268456375839,5.36912751677852,MUSR,0.39,8.48333333333333,MMLU-PRO,0.351728723404255,27.9698581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-17,2024-08-29,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,1359,12.248,2.99760056248369 -mistralai/Mistral-Small-Instruct-2409_bfloat16_63e53df6575e7085d62113f4383835ff979b3795_True,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,bfloat16,chatmodels,Original,MistralForCausalLM,26.2627489764183,TRUE,IFEval,0.666975846310013,66.6975846310013,BBH,0.521307509814622,30.7920960925092,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.323825503355705,9.84340044742729,MUSR,0.363208333333333,3.00104166666667,MMLU-PRO,0.396027260638298,32.8919178486998,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,0,mistralai/Mistral-Small-Instruct-2409,other,367,22.05,1.37933750885174 -mistralai/Mistral-Small-Instruct-2409_float16_63e53df6575e7085d62113f4383835ff979b3795_False,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,29.8182425699334,FALSE,IFEval,0.628282955890371,62.8282955890371,BBH,0.583028384689821,40.5597130348992,MATH Level 5,0.197885196374622,19.7885196374622,GPQA,0.333053691275168,11.0738255033557,MUSR,0.406333333333333,10.225,MMLU-PRO,0.409906914893617,34.4341016548463,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-25,0,mistralai/Mistral-Small-Instruct-2409,other,367,22.247,1.61000748804136 +mistralai/Mistral-Nemo-Instruct-2407_bfloat16_4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5_True,mistralai/Mistral-Nemo-Instruct-2407,4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5,bfloat16,chatmodels,Original,MistralForCausalLM,23.6333743622513,TRUE,IFEval,0.638024885082692,63.8024885082692,BBH,0.503652395031081,29.6799703811528,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.290268456375839,5.36912751677852,MUSR,0.39,8.48333333333333,MMLU-PRO,0.351728723404255,27.9698581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-17,2024-08-29,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,1362,12.248,2.99760056248369 +mistralai/Mistral-Small-Instruct-2409_bfloat16_63e53df6575e7085d62113f4383835ff979b3795_True,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,bfloat16,chatmodels,Original,MistralForCausalLM,26.2627489764183,TRUE,IFEval,0.666975846310013,66.6975846310013,BBH,0.521307509814622,30.7920960925092,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.323825503355705,9.84340044742729,MUSR,0.363208333333333,3.00104166666667,MMLU-PRO,0.396027260638298,32.8919178486998,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,0,mistralai/Mistral-Small-Instruct-2409,other,368,22.05,1.37933750885174 +mistralai/Mistral-Small-Instruct-2409_float16_63e53df6575e7085d62113f4383835ff979b3795_False,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,29.8182425699334,FALSE,IFEval,0.628282955890371,62.8282955890371,BBH,0.583028384689821,40.5597130348992,MATH Level 5,0.197885196374622,19.7885196374622,GPQA,0.333053691275168,11.0738255033557,MUSR,0.406333333333333,10.225,MMLU-PRO,0.409906914893617,34.4341016548463,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-25,0,mistralai/Mistral-Small-Instruct-2409,other,368,22.247,1.61000748804136 mistralai/Mixtral-8x22B-Instruct-v0.1_bfloat16_b0c3516041d014f640267b14feb4e9a84c8e8c71_True,mistralai/Mixtral-8x22B-Instruct-v0.1,b0c3516041d014f640267b14feb4e9a84c8e8c71,bfloat16,chatmodels,Original,MixtralForCausalLM,33.885680288082,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.612492492627202,44.1143455872484,MATH Level 5,0.187311178247734,18.7311178247734,GPQA,0.373322147651007,16.4429530201342,MUSR,0.431114583333333,13.4893229166667,MMLU-PRO,0.448304521276596,38.7005023640662,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,1,mistralai/Mixtral-8x22B-v0.1,apache-2.0,699,140.621,47.147578592378 mistralai/Mixtral-8x22B-v0.1_bfloat16_b03e260818710044a2f088d88fab12bb220884fb_False,mistralai/Mixtral-8x22B-v0.1,b03e260818710044a2f088d88fab12bb220884fb,bfloat16,pretrained,Original,MixtralForCausalLM,25.7283481584049,FALSE,IFEval,0.258263629392235,25.8263629392235,BBH,0.623980747318727,45.5884038434272,MATH Level 5,0.182779456193354,18.2779456193354,GPQA,0.375838926174497,16.7785234899329,MUSR,0.403697916666667,7.46223958333334,MMLU-PRO,0.463929521276596,40.4366134751773,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,0,mistralai/Mixtral-8x22B-v0.1,apache-2.0,208,140.621,104.697316275112 -mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4260,46.703,13.7649393661468 +mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4264,46.703,13.7649393661468 mistralai/Mixtral-8x7B-v0.1_bfloat16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,bfloat16,pretrained,Original,MixtralForCausalLM,19.4519879614403,FALSE,IFEval,0.24152692633324,24.152692633324,BBH,0.508666743762444,30.2941949189615,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.313758389261745,8.50111856823266,MUSR,0.432135416666667,12.58359375,MMLU-PRO,0.384973404255319,31.6637115839244,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-08-20,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1659,46.703,18.3878645797549 mistralai/Mixtral-8x7B-v0.1_float16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,float16,fine-tunedondomain-specificdatasets,Original,MixtralForCausalLM,19.6651089183161,FALSE,IFEval,0.232609476189843,23.2609476189843,BBH,0.509771137755339,30.4002992674255,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.320469798657718,9.39597315436242,MUSR,0.4413125,13.6640625,MMLU-PRO,0.387134308510638,31.9038120567376,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-06-27,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1659,46.703,5.13509985481396 mixtao/MixTAO-7Bx2-MoE-v8.1_bfloat16_339130b87b6ef2484fea9fbfacba8a714ac03347_False,mixtao/MixTAO-7Bx2-MoE-v8.1,339130b87b6ef2484fea9fbfacba8a714ac03347,bfloat16,fine-tunedondomain-specificdatasets,Original,MixtralForCausalLM,21.0779269837969,FALSE,IFEval,0.416233371897676,41.6233371897676,BBH,0.518905939173352,32.3103423396992,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.284395973154362,4.58612975391499,MUSR,0.446333333333333,15.2916666666667,MMLU-PRO,0.312333776595745,23.5926418439716,TRUE,FALSE,TRUE,FALSE,FALSE,2024-02-26,2024-10-04,0,mixtao/MixTAO-7Bx2-MoE-v8.1,apache-2.0,55,12.879,0.924035071773507 @@ -2308,6 +2311,7 @@ neopolita/jessi-v0.1-bf16-falcon3-7b-instruct_bfloat16_da9877089d4975e84e10cbb02 neopolita/jessi-v0.1-qwen2.5-7b-instruct_bfloat16_e73d1545a57a4c8e20df50d6641b08015fb039a3_True,neopolita/jessi-v0.1-qwen2.5-7b-instruct,e73d1545a57a4c8e20df50d6641b08015fb039a3,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,26.1391000867543,TRUE,IFEval,0.727450941280248,72.7450941280248,BBH,0.538661143344097,35.0879283733587,MATH Level 5,0,0,GPQA,0.290268456375839,5.36912751677852,MUSR,0.3939375,7.3421875,MMLU-PRO,0.426612367021277,36.2902630023641,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,neopolita/jessi-v0.1-qwen2.5-7b-instruct (Merge),apache-2.0,0,7.616,1.33604458794411 neopolita/jessi-v0.2-falcon3-7b-instruct_bfloat16_efd74223ccaf140aab43df0c9a271007e826124b_True,neopolita/jessi-v0.2-falcon3-7b-instruct,efd74223ccaf140aab43df0c9a271007e826124b,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,33.8586463293059,TRUE,IFEval,0.724353603992961,72.4353603992961,BBH,0.537214521881345,34.6212934442251,MATH Level 5,0.347432024169184,34.7432024169184,GPQA,0.313758389261745,8.50111856823266,MUSR,0.482427083333333,20.6700520833333,MMLU-PRO,0.389627659574468,32.1808510638298,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,neopolita/jessi-v0.2-falcon3-7b-instruct (Merge),other,0,7.456,1.1611336152358 neopolita/jessi-v0.3-falcon3-7b-instruct_bfloat16_6f95f4e365f8f087f6d037e72493ecff68d9298f_True,neopolita/jessi-v0.3-falcon3-7b-instruct,6f95f4e365f8f087f6d037e72493ecff68d9298f,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,34.0036734905278,TRUE,IFEval,0.75090648368551,75.090648368551,BBH,0.538793502664194,34.5652683395658,MATH Level 5,0.335347432024169,33.5347432024169,GPQA,0.319630872483222,9.2841163310962,MUSR,0.46915625,18.54453125,MMLU-PRO,0.39702460106383,33.0027334515366,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-08,1,neopolita/jessi-v0.3-falcon3-7b-instruct (Merge),other,0,7.456,1.22328260636943 +neopolita/jessi-v0.5-falcon3-7b-instruct_bfloat16_1b70a742251a75c8a5fd047f0c9cdd5bffc27a43_True,neopolita/jessi-v0.5-falcon3-7b-instruct,1b70a742251a75c8a5fd047f0c9cdd5bffc27a43,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,33.9777585104975,TRUE,IFEval,0.741164554493189,74.1164554493189,BBH,0.558962730227608,37.1680693690063,MATH Level 5,0.302114803625378,30.2114803625378,GPQA,0.311241610738255,8.165548098434,MUSR,0.486520833333333,21.2484375,MMLU-PRO,0.396609042553192,32.956560283688,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-09,2025-01-09,1,neopolita/jessi-v0.5-falcon3-7b-instruct (Merge),other,0,7.456,0.633127656642667 netcat420/Llama3.1-MFANN-8b_float16_6714fe00996d2679e9325b503ab991f4ecc0273d_False,netcat420/Llama3.1-MFANN-8b,6714fe00996d2679e9325b503ab991f4ecc0273d,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.0667107112471,FALSE,IFEval,0.296956519811877,29.6956519811877,BBH,0.428115468074255,19.2866837601937,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.287751677852349,5.03355704697987,MUSR,0.33790625,2.57161458333333,MMLU-PRO,0.272523271276596,19.1692523640662,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,netcat420/Llama3.1-MFANN-8b (Merge),llama3.1,0,8.03,0.700506207811858 netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V2_float16_0e649dd355ad7d562f9346c96642c24eff35338e_False,netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V2,0e649dd355ad7d562f9346c96642c24eff35338e,float16,basemergesandmoerges,Original,LlamaForCausalLM,19.2137281822613,FALSE,IFEval,0.42097966728281,42.097966728281,BBH,0.492376062364722,26.9383700967246,MATH Level 5,0.0762839879154079,7.62839879154079,GPQA,0.296979865771812,6.26398210290828,MUSR,0.372760416666667,4.32838541666667,MMLU-PRO,0.352227393617021,28.0252659574468,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-08,2024-11-09,0,netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V2,apache-2.0,0,8.03,0.704112935134176 netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V3_float16_381cf003a5e28d2b273226364b568cc60b857b5b_False,netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V3,381cf003a5e28d2b273226364b568cc60b857b5b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.2220303405577,FALSE,IFEval,0.423802178220455,42.3802178220455,BBH,0.491402159422544,26.9788509461975,MATH Level 5,0.0755287009063444,7.55287009063444,GPQA,0.296979865771812,6.26398210290828,MUSR,0.3740625,4.49114583333333,MMLU-PRO,0.348986037234043,27.665115248227,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-25,2024-11-26,1,netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V3 (Merge),"",2,8.03,0.720910445854624 @@ -2349,7 +2353,7 @@ newsbang/Homer-v1.0-Qwen2.5-72B_bfloat16_c7f3c5c131c046626f8d33eb615c1a0aba19998 newsbang/Homer-v1.0-Qwen2.5-7B_bfloat16_4795825dff1b68dd2cc02b3bd39598a161c09c66_False,newsbang/Homer-v1.0-Qwen2.5-7B,4795825dff1b68dd2cc02b3bd39598a161c09c66,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,32.1452276066116,FALSE,IFEval,0.639273793534489,63.9273793534489,BBH,0.565525417737022,37.8108474922518,MATH Level 5,0.303625377643505,30.3625377643505,GPQA,0.322147651006711,9.61968680089485,MUSR,0.427822916666667,11.8778645833333,MMLU-PRO,0.453457446808511,39.2730496453901,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-04,2024-12-04,0,newsbang/Homer-v1.0-Qwen2.5-7B,apache-2.0,2,7.616,0.639252118205651 nguyentd/FinancialAdvice-Qwen2.5-7B_bfloat16_5c3421d5a980d0b2365b0d704ead30c9e534a019_False,nguyentd/FinancialAdvice-Qwen2.5-7B,5c3421d5a980d0b2365b0d704ead30c9e534a019,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,20.9354650535882,FALSE,IFEval,0.449605934476079,44.9605934476079,BBH,0.473093415389579,25.6304356221603,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.294463087248322,5.92841163310962,MUSR,0.402489583333333,9.14453125,MMLU-PRO,0.375249335106383,30.5832594562648,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-21,2024-11-18,1,nguyentd/FinancialAdvice-Qwen2.5-7B (Merge),apache-2.0,1,7.616,0.654445044832706 ngxson/MiniThinky-1B-Llama-3.2_float16_a5e5adf4f7e63f7127a72def90ba3a627bae36bf_True,ngxson/MiniThinky-1B-Llama-3.2,a5e5adf4f7e63f7127a72def90ba3a627bae36bf,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,6.4210032438225,TRUE,IFEval,0.277147967393183,27.7147967393183,BBH,0.314226503827215,4.34779539343128,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.239093959731544,0,MUSR,0.343364583333333,2.18723958333333,MMLU-PRO,0.11469414893617,1.63268321513002,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-06,2025-01-07,1,ngxson/MiniThinky-1B-Llama-3.2 (Merge),"",3,1.236,0.747680911048283 -ngxson/MiniThinky-v2-1B-Llama-3.2_float16_0eb811aca13439292d4151456577a527a2982c46_True,ngxson/MiniThinky-v2-1B-Llama-3.2,0eb811aca13439292d4151456577a527a2982c46,float16,chatmodels,Original,LlamaForCausalLM,6.37444380612719,TRUE,IFEval,0.296307131743773,29.6307131743773,BBH,0.320511113589516,4.89376948425059,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.23993288590604,0,MUSR,0.335614583333333,0.618489583333333,MMLU-PRO,0.111619015957447,1.29100177304964,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,ngxson/MiniThinky-v2-1B-Llama-3.2 (Merge),"",22,1.236,0.731149067797528 +ngxson/MiniThinky-v2-1B-Llama-3.2_float16_0eb811aca13439292d4151456577a527a2982c46_True,ngxson/MiniThinky-v2-1B-Llama-3.2,0eb811aca13439292d4151456577a527a2982c46,float16,chatmodels,Original,LlamaForCausalLM,6.37444380612719,TRUE,IFEval,0.296307131743773,29.6307131743773,BBH,0.320511113589516,4.89376948425059,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.23993288590604,0,MUSR,0.335614583333333,0.618489583333333,MMLU-PRO,0.111619015957447,1.29100177304964,FALSE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,ngxson/MiniThinky-v2-1B-Llama-3.2 (Merge),"",24,1.236,0.731149067797528 nhyha/N3N_Delirium-v1_1030_0227_bfloat16_41eabc719bd611e2bd0094b0842df84916a57a46_True,nhyha/N3N_Delirium-v1_1030_0227,41eabc719bd611e2bd0094b0842df84916a57a46,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,31.143320415941,TRUE,IFEval,0.802289037531527,80.2289037531527,BBH,0.589068667782223,40.7750400744857,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.337248322147651,11.6331096196868,MUSR,0.4098125,9.85989583333333,MMLU-PRO,0.414976728723404,34.9974143026005,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-30,2024-11-04,2,unsloth/gemma-2-9b-it,apache-2.0,0,10.159,2.13185600002894 nhyha/N3N_Llama-3.1-8B-Instruct_1028_0216_bfloat16_d0715a631898112c9c3b729d0334588a2ff636d8_False,nhyha/N3N_Llama-3.1-8B-Instruct_1028_0216,d0715a631898112c9c3b729d0334588a2ff636d8,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.4036037255736,FALSE,IFEval,0.478082598616116,47.8082598616116,BBH,0.505374130992036,28.9804641248107,MATH Level 5,0.167673716012085,16.7673716012085,GPQA,0.306208053691275,7.49440715883669,MUSR,0.40503125,10.0622395833333,MMLU-PRO,0.363779920212766,29.3088800236407,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-28,2024-11-04,2,meta-llama/Meta-Llama-3.1-8B,apache-2.0,0,8.03,0.749506263677984 nhyha/N3N_gemma-2-9b-it_20241029_1532_bfloat16_6cfc55a717961ef206978b577bd74df97efe1455_False,nhyha/N3N_gemma-2-9b-it_20241029_1532,6cfc55a717961ef206978b577bd74df97efe1455,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,32.0222492594182,FALSE,IFEval,0.675194040700896,67.5194040700896,BBH,0.586312438182767,40.9866677332497,MATH Level 5,0.204682779456193,20.4682779456193,GPQA,0.340604026845638,12.0805369127517,MUSR,0.459354166666667,16.3859375,MMLU-PRO,0.412234042553192,34.6926713947991,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-29,2024-11-04,1,unsloth/gemma-2-9b-it,apache-2.0,2,10.159,2.39404419850728 @@ -2372,7 +2376,7 @@ nothingiisreal/MN-12B-Starcannon-v3_bfloat16_169480b62121c4f070e93a05158545c6797 nvidia/Hymba-1.5B-Base_bfloat16_85e5b833d75f26170c7684ba83140f1bf9fedf37_False,nvidia/Hymba-1.5B-Base,85e5b833d75f26170c7684ba83140f1bf9fedf37,bfloat16,pretrained,Original,HymbaForCausalLM,7.92198908307419,FALSE,IFEval,0.229512138902556,22.9512138902556,BBH,0.325647852141822,7.68994111813814,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.255872483221477,0.782997762863532,MUSR,0.356635416666667,5.17942708333334,MMLU-PRO,0.192237367021277,10.2485963356974,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-09,2024-12-06,0,nvidia/Hymba-1.5B-Base,other,135,1.523,9.10791437880169 nvidia/Hymba-1.5B-Instruct_bfloat16_ffc758eefef247c0ee4d7ce41636562759027ce6_True,nvidia/Hymba-1.5B-Instruct,ffc758eefef247c0ee4d7ce41636562759027ce6,bfloat16,chatmodels,Original,HymbaForCausalLM,13.7392113616459,TRUE,IFEval,0.600905597148898,60.0905597148898,BBH,0.306713390823188,4.59146361547248,MATH Level 5,0,0,GPQA,0.288590604026846,5.14541387024609,MUSR,0.331583333333333,1.04791666666667,MMLU-PRO,0.204039228723404,11.5599143026005,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-12-06,1,nvidia/Hymba-1.5B-Instruct (Merge),other,219,1.523,6.71266576424283 nvidia/Llama-3.1-Minitron-4B-Depth-Base_bfloat16_40d82bc951b4f39e9c9e11176334250c30975098_False,nvidia/Llama-3.1-Minitron-4B-Depth-Base,40d82bc951b4f39e9c9e11176334250c30975098,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.5321699752737,FALSE,IFEval,0.16069362624503,16.069362624503,BBH,0.417070419310489,19.4441095555079,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.263422818791946,1.78970917225951,MUSR,0.4010625,10.6994791666667,MMLU-PRO,0.27983710106383,19.9819001182033,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-13,2024-09-25,0,nvidia/Llama-3.1-Minitron-4B-Depth-Base,other,20,4.02,0.467690635805229 -nvidia/Llama-3.1-Nemotron-70B-Instruct-HF_bfloat16_250db5cf2323e04a6d2025a2ca2b94a95c439e88_True,nvidia/Llama-3.1-Nemotron-70B-Instruct-HF,250db5cf2323e04a6d2025a2ca2b94a95c439e88,bfloat16,chatmodels,Original,LlamaForCausalLM,34.5783715382223,TRUE,IFEval,0.738067217205903,73.8067217205903,BBH,0.631600066889504,47.1095304937273,MATH Level 5,0.287009063444109,28.7009063444109,GPQA,0.258389261744966,1.11856823266219,MUSR,0.432760416666667,13.1950520833333,MMLU-PRO,0.491855053191489,43.5394503546099,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-12,2024-10-16,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1978,70.554,13.6287476336013 +nvidia/Llama-3.1-Nemotron-70B-Instruct-HF_bfloat16_250db5cf2323e04a6d2025a2ca2b94a95c439e88_True,nvidia/Llama-3.1-Nemotron-70B-Instruct-HF,250db5cf2323e04a6d2025a2ca2b94a95c439e88,bfloat16,chatmodels,Original,LlamaForCausalLM,34.5783715382223,TRUE,IFEval,0.738067217205903,73.8067217205903,BBH,0.631600066889504,47.1095304937273,MATH Level 5,0.287009063444109,28.7009063444109,GPQA,0.258389261744966,1.11856823266219,MUSR,0.432760416666667,13.1950520833333,MMLU-PRO,0.491855053191489,43.5394503546099,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-12,2024-10-16,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1981,70.554,13.6287476336013 nvidia/Minitron-4B-Base_bfloat16_d6321f64412982046a32d761701167e752fedc02_False,nvidia/Minitron-4B-Base,d6321f64412982046a32d761701167e752fedc02,bfloat16,pretrained,Original,NemotronForCausalLM,11.9399727051767,FALSE,IFEval,0.221793729526545,22.1793729526545,BBH,0.40838762439925,17.2156006550611,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.269295302013423,2.57270693512304,MUSR,0.413375,9.93854166666667,MMLU-PRO,0.261968085106383,17.9964539007092,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-19,2024-09-25,0,nvidia/Minitron-4B-Base,other,128,4,1.18926681315643 nvidia/Minitron-8B-Base_bfloat16_70fa5997afc42807f41eebd5d481f040556fdf97_False,nvidia/Minitron-8B-Base,70fa5997afc42807f41eebd5d481f040556fdf97,bfloat16,pretrained,Original,NemotronForCausalLM,14.1787264154315,FALSE,IFEval,0.242426760994162,24.2426760994162,BBH,0.43950631883576,22.0407929700052,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.273489932885906,3.13199105145414,MUSR,0.402552083333333,9.08567708333334,MMLU-PRO,0.318068484042553,24.2298315602837,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-19,2024-09-25,0,nvidia/Minitron-8B-Base,other,63,7.22,1.41252072016633 nvidia/Mistral-NeMo-Minitron-8B-Base_bfloat16_cc94637b669b62c4829b1e0c3b9074fecd883b74_False,nvidia/Mistral-NeMo-Minitron-8B-Base,cc94637b669b62c4829b1e0c3b9074fecd883b74,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,17.6601615070764,FALSE,IFEval,0.194565973838305,19.4565973838305,BBH,0.521909809052142,31.8220151574902,MATH Level 5,0.0460725075528701,4.60725075528701,GPQA,0.325503355704698,10.0671140939597,MUSR,0.40915625,8.94453125,MMLU-PRO,0.379571143617021,31.0634604018913,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-19,2024-08-22,0,nvidia/Mistral-NeMo-Minitron-8B-Base,other,166,7.88,3.40402832024504 @@ -2390,11 +2394,11 @@ oopere/pruned40-llama-1b_float16_3de470d9c61cb57cea821e93b43fb250aa14b975_False, oopere/pruned40-llama-3.2-3b_float16_ceb2073cda2f21afa10efcbae74583fc9b319d54_False,oopere/pruned40-llama-3.2-3b,ceb2073cda2f21afa10efcbae74583fc9b319d54,float16,pretrained,Original,LlamaForCausalLM,5.18246289956441,FALSE,IFEval,0.218296342593208,21.8296342593208,BBH,0.316711702809771,4.74010154594563,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.229865771812081,0,MUSR,0.3539375,2.40885416666667,MMLU-PRO,0.117686170212766,1.96513002364066,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2024-12-12,1,oopere/pruned40-llama-3.2-3b (Merge),llama3.2,0,2.367,0.597667318719724 oopere/pruned60-llama-1b_float16_86b157256928b50ee07cc3cf5b3884b70062f2fe_False,oopere/pruned60-llama-1b,86b157256928b50ee07cc3cf5b3884b70062f2fe,float16,pretrained,Original,LlamaForCausalLM,5.42980237577008,FALSE,IFEval,0.182850392514085,18.2850392514085,BBH,0.30161934741854,2.94252648075335,MATH Level 5,0,0,GPQA,0.249161073825503,0,MUSR,0.408791666666667,9.43229166666667,MMLU-PRO,0.117270611702128,1.91895685579196,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-16,2024-11-25,1,oopere/pruned60-llama-1b (Merge),llama3.2,0,0.753,0.382487881515074 oopere/pruned60-llama-3.2-3b_float16_c8c061d55288274a59205fa740b51a951ca93335_False,oopere/pruned60-llama-3.2-3b,c8c061d55288274a59205fa740b51a951ca93335,float16,pretrained,Original,LlamaForCausalLM,5.065740099545,FALSE,IFEval,0.182475830795622,18.2475830795622,BBH,0.31662597093352,3.98840191534689,MATH Level 5,0,0,GPQA,0.27013422818792,2.68456375838927,MUSR,0.363333333333333,4.01666666666667,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2024-12-13,1,oopere/pruned60-llama-3.2-3b (Merge),llama3.2,0,1.944,0.620884220907376 -openai-community/gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.51080708776172,FALSE,IFEval,0.179253270211927,17.9253270211927,BBH,0.303571124421336,2.67498136798699,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.258389261744966,1.11856823266219,MUSR,0.447052083333333,15.3481770833333,MMLU-PRO,0.115940824468085,1.77120271867612,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2,mit,2495,0.137,0.0859412568146148 -openai-community/gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,6.29647106783872,FALSE,IFEval,0.177954494075719,17.7954494075719,BBH,0.301658010676531,2.81591130950851,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.439020833333333,13.9109375,MMLU-PRO,0.116522606382979,1.8358451536643,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-12,0,openai-community/gpt2,mit,2495,0.137,0.117386895248811 -openai-community/gpt2-large_bfloat16_32b71b12589c2f8d625668d2335a01cac3249519_False,openai-community/gpt2-large,32b71b12589c2f8d625668d2335a01cac3249519,bfloat16,pretrained,Original,GPT2LMHeadModel,5.47959037520557,FALSE,IFEval,0.204782200117909,20.4782200117909,BBH,0.306884187601188,3.25379054497874,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.259228187919463,1.23042505592841,MUSR,0.378864583333333,5.65807291666667,MMLU-PRO,0.114195478723404,1.57727541371158,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-large,mit,279,0.812,0.180462238431619 -openai-community/gpt2-medium_bfloat16_6dcaa7a952f72f9298047fd5137cd6e4f05f41da_False,openai-community/gpt2-medium,6dcaa7a952f72f9298047fd5137cd6e4f05f41da,bfloat16,pretrained,Original,GPT2LMHeadModel,5.8268115862481,FALSE,IFEval,0.220844027181213,22.0844027181213,BBH,0.305028023217627,2.71997223835624,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26258389261745,1.67785234899329,MUSR,0.388447916666667,6.15598958333333,MMLU-PRO,0.118184840425532,2.0205378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-medium,mit,162,0.38,0.121061915000596 -openai-community/gpt2-xl_bfloat16_15ea56dee5df4983c59b2538573817e1667135e2_False,openai-community/gpt2-xl,15ea56dee5df4983c59b2538573817e1667135e2,bfloat16,pretrained,Original,GPT2LMHeadModel,4.98018762739917,FALSE,IFEval,0.203857985700164,20.3857985700164,BBH,0.300857611232608,2.58096064745272,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.370958333333333,4.03645833333333,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-xl,mit,320,1.608,0.215313699838485 +openai-community/gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.51080708776172,FALSE,IFEval,0.179253270211927,17.9253270211927,BBH,0.303571124421336,2.67498136798699,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.258389261744966,1.11856823266219,MUSR,0.447052083333333,15.3481770833333,MMLU-PRO,0.115940824468085,1.77120271867612,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2,mit,2497,0.137,0.0859412568146148 +openai-community/gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,6.29647106783872,FALSE,IFEval,0.177954494075719,17.7954494075719,BBH,0.301658010676531,2.81591130950851,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.439020833333333,13.9109375,MMLU-PRO,0.116522606382979,1.8358451536643,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-12,0,openai-community/gpt2,mit,2497,0.137,0.117386895248811 +openai-community/gpt2-large_bfloat16_32b71b12589c2f8d625668d2335a01cac3249519_False,openai-community/gpt2-large,32b71b12589c2f8d625668d2335a01cac3249519,bfloat16,pretrained,Original,GPT2LMHeadModel,5.47959037520557,FALSE,IFEval,0.204782200117909,20.4782200117909,BBH,0.306884187601188,3.25379054497874,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.259228187919463,1.23042505592841,MUSR,0.378864583333333,5.65807291666667,MMLU-PRO,0.114195478723404,1.57727541371158,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-large,mit,280,0.812,0.180462238431619 +openai-community/gpt2-medium_bfloat16_6dcaa7a952f72f9298047fd5137cd6e4f05f41da_False,openai-community/gpt2-medium,6dcaa7a952f72f9298047fd5137cd6e4f05f41da,bfloat16,pretrained,Original,GPT2LMHeadModel,5.8268115862481,FALSE,IFEval,0.220844027181213,22.0844027181213,BBH,0.305028023217627,2.71997223835624,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26258389261745,1.67785234899329,MUSR,0.388447916666667,6.15598958333333,MMLU-PRO,0.118184840425532,2.0205378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-medium,mit,163,0.38,0.121061915000596 +openai-community/gpt2-xl_bfloat16_15ea56dee5df4983c59b2538573817e1667135e2_False,openai-community/gpt2-xl,15ea56dee5df4983c59b2538573817e1667135e2,bfloat16,pretrained,Original,GPT2LMHeadModel,4.98018762739917,FALSE,IFEval,0.203857985700164,20.3857985700164,BBH,0.300857611232608,2.58096064745272,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.370958333333333,4.03645833333333,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-xl,mit,321,1.608,0.215313699838485 openbmb/MiniCPM-S-1B-sft-llama-format_bfloat16_7de07f8895c168a7ee01f624f50c44f6966c9735_True,openbmb/MiniCPM-S-1B-sft-llama-format,7de07f8895c168a7ee01f624f50c44f6966c9735,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.87018453155293,TRUE,IFEval,0.332876766978284,33.2876766978284,BBH,0.304931363220705,3.89845521424289,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.270973154362416,2.79642058165548,MUSR,0.331677083333333,1.35963541666667,MMLU-PRO,0.185837765957447,9.53752955082742,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-14,2024-11-19,0,openbmb/MiniCPM-S-1B-sft-llama-format,apache-2.0,4,1,0.540036847471136 openchat/openchat-3.5-0106_bfloat16_ff058fda49726ecf4ea53dc1635f917cdb8ba36b_True,openchat/openchat-3.5-0106,ff058fda49726ecf4ea53dc1635f917cdb8ba36b,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,22.6586834330757,TRUE,IFEval,0.595135351977198,59.5135351977198,BBH,0.461697870839606,24.0387112139116,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.307885906040268,7.71812080536913,MUSR,0.4254375,11.7463541666667,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-07,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,348,7.242,2.35495886433684 openchat/openchat-3.5-1210_bfloat16_801f5459b7577241500785f11c2b026912badd6e_True,openchat/openchat-3.5-1210,801f5459b7577241500785f11c2b026912badd6e,bfloat16,chatmodels,Original,MistralForCausalLM,22.6900852582059,TRUE,IFEval,0.603678240402133,60.3678240402133,BBH,0.453535684644798,23.2362965821665,MATH Level 5,0.0762839879154079,7.62839879154079,GPQA,0.301174496644295,6.82326621923937,MUSR,0.4414375,14.2796875,MMLU-PRO,0.314245345744681,23.8050384160756,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,276,7.242,0.516451060379658 @@ -2491,7 +2495,7 @@ princeton-nlp/Sheared-LLaMA-1.3B_bfloat16_a4b76938edbf571ea7d7d9904861cbdca08809 princeton-nlp/Sheared-LLaMA-2.7B_bfloat16_2f157a0306b75d37694ae05f6a4067220254d540_False,princeton-nlp/Sheared-LLaMA-2.7B,2f157a0306b75d37694ae05f6a4067220254d540,bfloat16,pretrained,Original,LlamaForCausalLM,6.3246270096586,FALSE,IFEval,0.241652149629649,24.1652149629649,BBH,0.32586855691246,5.65552132993844,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.275167785234899,3.35570469798658,MUSR,0.356729166666667,2.09114583333333,MMLU-PRO,0.118683510638298,2.07594562647754,TRUE,FALSE,FALSE,FALSE,FALSE,2023-10-10,2024-07-29,0,princeton-nlp/Sheared-LLaMA-2.7B,apache-2.0,60,2.7,0.470049763910811 princeton-nlp/gemma-2-9b-it-DPO_bfloat16_f646c99fc3aa7afc7b22c3c7115fd03a40fc1d22_True,princeton-nlp/gemma-2-9b-it-DPO,f646c99fc3aa7afc7b22c3c7115fd03a40fc1d22,bfloat16,chatmodels,Original,Gemma2ForCausalLM,19.4340345411901,TRUE,IFEval,0.276872032872778,27.6872032872778,BBH,0.594144468295665,41.5936544553845,MATH Level 5,0,0,GPQA,0.335570469798658,11.4093959731544,MUSR,0.38203125,5.65390625,MMLU-PRO,0.372340425531915,30.2600472813239,FALSE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-09-19,2,google/gemma-2-9b,"",6,9.242,2.89062697102829 princeton-nlp/gemma-2-9b-it-SimPO_bfloat16_8c87091f412e3aa6f74f66bd86c57fb81cbc3fde_True,princeton-nlp/gemma-2-9b-it-SimPO,8c87091f412e3aa6f74f66bd86c57fb81cbc3fde,bfloat16,chatmodels,Original,Gemma2ForCausalLM,21.1616516275693,TRUE,IFEval,0.320685780396016,32.0685780396016,BBH,0.583917992316212,40.0934299163717,MATH Level 5,0,0,GPQA,0.335570469798658,11.4093959731544,MUSR,0.412322916666667,10.3403645833333,MMLU-PRO,0.397523271276596,33.0581412529551,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-08-10,2,google/gemma-2-9b,mit,140,9.242,2.76900372425403 -prithivMLmods/Deepthink-Reasoning-7B_float16_0ccaa3825ded55cf8cfa18f7db53d91848e3733b_False,prithivMLmods/Deepthink-Reasoning-7B,0ccaa3825ded55cf8cfa18f7db53d91848e3733b,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,26.8941447787475,FALSE,IFEval,0.484002446841048,48.4002446841049,BBH,0.550507021614528,35.6237314485809,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.299496644295302,6.59955257270694,MUSR,0.443229166666667,13.4369791666667,MMLU-PRO,0.434923537234043,37.2137263593381,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-28,2025-01-09,1,prithivMLmods/Deepthink-Reasoning-7B (Merge),creativeml-openrail-m,11,7.616,0.626997508275094 +prithivMLmods/Deepthink-Reasoning-7B_float16_0ccaa3825ded55cf8cfa18f7db53d91848e3733b_False,prithivMLmods/Deepthink-Reasoning-7B,0ccaa3825ded55cf8cfa18f7db53d91848e3733b,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,26.8941447787475,FALSE,IFEval,0.484002446841048,48.4002446841049,BBH,0.550507021614528,35.6237314485809,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.299496644295302,6.59955257270694,MUSR,0.443229166666667,13.4369791666667,MMLU-PRO,0.434923537234043,37.2137263593381,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-28,2025-01-09,1,prithivMLmods/Deepthink-Reasoning-7B (Merge),creativeml-openrail-m,12,7.616,0.626997508275094 prithivMLmods/GWQ-9B-Preview_float16_5a0e00ac0ff885f54ef32e607508895bae864006_False,prithivMLmods/GWQ-9B-Preview,5a0e00ac0ff885f54ef32e607508895bae864006,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,29.9153622656812,FALSE,IFEval,0.506583642512977,50.6583642512977,BBH,0.580574580424751,40.6697225433022,MATH Level 5,0.212235649546828,21.2235649546828,GPQA,0.339765100671141,11.9686800894855,MUSR,0.495104166666667,21.8213541666667,MMLU-PRO,0.398354388297872,33.1504875886525,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-04,2025-01-08,0,prithivMLmods/GWQ-9B-Preview,gemma,9,9.242,2.46116170083518 prithivMLmods/GWQ-9B-Preview2_float16_42f5d4f7d19eb59c9408ff70cdbc30459ec1ad3d_False,prithivMLmods/GWQ-9B-Preview2,42f5d4f7d19eb59c9408ff70cdbc30459ec1ad3d,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,29.8709542737253,FALSE,IFEval,0.520896776109611,52.0896776109612,BBH,0.579721871084337,40.1848605331595,MATH Level 5,0.226586102719033,22.6586102719033,GPQA,0.326342281879195,10.1789709172259,MUSR,0.485989583333333,20.8153645833333,MMLU-PRO,0.399684175531915,33.2982417257683,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-04,2025-01-08,1,prithivMLmods/GWQ-9B-Preview2 (Merge),creativeml-openrail-m,13,9.242,2.45282385227226 prithivMLmods/QwQ-LCoT-7B-Instruct_float16_06f0076fcf5cb72222513e6c76bd33e1ebaa97b7_False,prithivMLmods/QwQ-LCoT-7B-Instruct,06f0076fcf5cb72222513e6c76bd33e1ebaa97b7,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,28.1321784254201,FALSE,IFEval,0.498690142156146,49.8690142156146,BBH,0.546646632601856,34.7809334234064,MATH Level 5,0.207703927492447,20.7703927492447,GPQA,0.302013422818792,6.93512304250559,MUSR,0.4801875,19.3901041666667,MMLU-PRO,0.433427526595745,37.0475029550828,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-14,2025-01-07,1,prithivMLmods/QwQ-LCoT-7B-Instruct (Merge),creativeml-openrail-m,22,7.616,0.650304701981961 @@ -2515,7 +2519,7 @@ qingy2024/Fusion-14B-Instruct_bfloat16_2e15219659b919e04ad5b56bef259489cc264f09_ qingy2024/Fusion2-14B-Instruct_bfloat16_df00288ce3d37ef518189c19e7973e71b47ef214_True,qingy2024/Fusion2-14B-Instruct,df00288ce3d37ef518189c19e7973e71b47ef214,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,35.1822684337256,TRUE,IFEval,0.606401015970957,60.6401015970957,BBH,0.611852372286455,44.7670438308547,MATH Level 5,0.308157099697885,30.8157099697885,GPQA,0.344798657718121,12.6398210290828,MUSR,0.463385416666667,17.2231770833333,MMLU-PRO,0.505069813829787,45.0077570921986,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-06,1,qingy2024/Fusion2-14B-Instruct (Merge),"",1,14.766,1.66866594603866 qingy2024/Fusion4-14B-Instruct_float16_3f3c7178006857d7fdf942ab7e86bd2b0d7b624d_True,qingy2024/Fusion4-14B-Instruct,3f3c7178006857d7fdf942ab7e86bd2b0d7b624d,float16,chatmodels,Original,Qwen2ForCausalLM,38.733953059072,TRUE,IFEval,0.764894923248093,76.4894923248093,BBH,0.654252046947762,50.6958556395896,MATH Level 5,0.339123867069486,33.9123867069486,GPQA,0.330536912751678,10.738255033557,MUSR,0.432572916666667,13.9716145833333,MMLU-PRO,0.519365026595745,46.5961140661939,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,1,qingy2024/Fusion4-14B-Instruct (Merge),"",0,14.77,1.82283054036158 qingy2024/OwO-14B-Instruct_bfloat16_0c64ce33086d285d9374f0fb9360d52d0eb1ff92_False,qingy2024/OwO-14B-Instruct,0c64ce33086d285d9374f0fb9360d52d0eb1ff92,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,27.4234059318296,FALSE,IFEval,0.138311901310744,13.8311901310744,BBH,0.616480717276066,44.948452301126,MATH Level 5,0.304380664652568,30.4380664652568,GPQA,0.364093959731544,15.2125279642058,MUSR,0.4406875,13.6526041666667,MMLU-PRO,0.51811835106383,46.4575945626478,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-27,2024-12-30,2,Qwen/Qwen2.5-14B,apache-2.0,0,14.77,2.81476124208054 -qingy2024/QwQ-14B-Math-v0.2_float16_308f732e0f2c1ac9e416e9c1e0523c0198ac658c_True,qingy2024/QwQ-14B-Math-v0.2,308f732e0f2c1ac9e416e9c1e0523c0198ac658c,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,24.0889902509765,TRUE,IFEval,0.339096929480445,33.9096929480445,BBH,0.573097955260854,39.0992137429518,MATH Level 5,0.190332326283988,19.0332326283988,GPQA,0.26258389261745,1.67785234899329,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.479970079787234,42.2188977541371,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-23,2,Qwen/Qwen2.5-14B,apache-2.0,16,14.77,3.41117129475758 +qingy2024/QwQ-14B-Math-v0.2_float16_308f732e0f2c1ac9e416e9c1e0523c0198ac658c_True,qingy2024/QwQ-14B-Math-v0.2,308f732e0f2c1ac9e416e9c1e0523c0198ac658c,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,24.0889902509765,TRUE,IFEval,0.339096929480445,33.9096929480445,BBH,0.573097955260854,39.0992137429518,MATH Level 5,0.190332326283988,19.0332326283988,GPQA,0.26258389261745,1.67785234899329,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.479970079787234,42.2188977541371,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-23,2,Qwen/Qwen2.5-14B,apache-2.0,17,14.77,3.41117129475758 qingy2024/Qwen2.5-Math-14B-Instruct-Alpha_float16_c82727eb404d3d55450759301b80f838e4d3e1fc_True,qingy2024/Qwen2.5-Math-14B-Instruct-Alpha,c82727eb404d3d55450759301b80f838e4d3e1fc,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,32.2153945754645,TRUE,IFEval,0.770440209754562,77.0440209754562,BBH,0.646486159387426,50.1795027462589,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.348993288590604,13.1991051454139,MUSR,0.40209375,8.72838541666667,MMLU-PRO,0.496592420212766,44.0658244680851,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-03,2024-12-10,2,Qwen/Qwen2.5-14B,apache-2.0,1,14.77,1.56934662160497 qingy2024/Qwen2.5-Math-14B-Instruct-Preview_float16_7b9e9b94d69f0de9627f728e9328fb394f7fea14_True,qingy2024/Qwen2.5-Math-14B-Instruct-Preview,7b9e9b94d69f0de9627f728e9328fb394f7fea14,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,31.987593150848,TRUE,IFEval,0.782580220481655,78.2580220481655,BBH,0.629394224593443,47.0508075682843,MATH Level 5,0,0,GPQA,0.340604026845638,12.0805369127517,MUSR,0.411458333333333,10.165625,MMLU-PRO,0.499335106382979,44.3705673758865,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-10,3,Qwen/Qwen2.5-14B,apache-2.0,1,14.77,1.61898032712152 qingy2024/Qwen2.6-14B-Instruct_bfloat16_c21acf3c074e9522c5d0559ccc4ed715c48b8eff_False,qingy2024/Qwen2.6-14B-Instruct,c21acf3c074e9522c5d0559ccc4ed715c48b8eff,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,35.6249791042928,FALSE,IFEval,0.581097044730205,58.1097044730205,BBH,0.6394142844483,48.0479479900271,MATH Level 5,0.267371601208459,26.7371601208459,GPQA,0.379194630872483,17.2259507829978,MUSR,0.4569375,16.0171875,MMLU-PRO,0.528507313829787,47.6119237588653,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-04,2024-12-04,1,qingy2024/Qwen2.6-14B-Instruct (Merge),"",1,14.766,1.78928624417309 @@ -2575,9 +2579,9 @@ sakaltcommunity/sakaltum-7b_bfloat16_692d1c3efdae68a3ace336d865daceb713b93130_Fa sakhan10/quantized_open_llama_3b_v2_float16_e8d51ad5204806edf9c2eeb8c56139a440a70265_False,sakhan10/quantized_open_llama_3b_v2,e8d51ad5204806edf9c2eeb8c56139a440a70265,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,5.1425000282941,FALSE,IFEval,0.187222126180756,18.7222126180756,BBH,0.301980078012147,2.80573327336385,MATH Level 5,0,0,GPQA,0.276845637583893,3.57941834451902,MUSR,0.368166666666667,4.6875,MMLU-PRO,0.109541223404255,1.06013593380615,FALSE,FALSE,FALSE,FALSE,FALSE,2024-08-23,2024-08-28,1,openlm-research/open_llama_3b_v2,"",0,3,0.392700373603761 saltlux/luxia-21.4b-alignment-v1.0_float16_87d5673e6d9f60462f195e9414a0bf6874c89ceb_True,saltlux/luxia-21.4b-alignment-v1.0,87d5673e6d9f60462f195e9414a0bf6874c89ceb,float16,chatmodels,Original,LlamaForCausalLM,22.9258730304383,TRUE,IFEval,0.369296799159563,36.9296799159563,BBH,0.637334260677559,48.0211129616079,MATH Level 5,0.0657099697885196,6.57099697885196,GPQA,0.301174496644295,6.82326621923937,MUSR,0.43284375,12.50546875,MMLU-PRO,0.340342420212766,26.704713356974,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-12,2024-06-29,0,saltlux/luxia-21.4b-alignment-v1.0,apache-2.0,33,21.421,1.744047460401 saltlux/luxia-21.4b-alignment-v1.2_bfloat16_eed12b5574fa49cc81e57a88aff24c08c13721c0_True,saltlux/luxia-21.4b-alignment-v1.2,eed12b5574fa49cc81e57a88aff24c08c13721c0,bfloat16,chatmodels,Original,LlamaForCausalLM,23.4351918455184,TRUE,IFEval,0.411536944196953,41.1536944196953,BBH,0.637118070811237,47.7691647188475,MATH Level 5,0.0158610271903323,1.58610271903323,GPQA,0.307885906040268,7.71812080536913,MUSR,0.445895833333333,14.9036458333333,MMLU-PRO,0.347323803191489,27.4804225768322,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-27,2024-07-30,0,saltlux/luxia-21.4b-alignment-v1.2,apache-2.0,8,21.421,2.04592577623435 -sam-paech/Darkest-muse-v1_bfloat16_55f6ba0218e9615d18a76f244a874b941f8c434f_False,sam-paech/Darkest-muse-v1,55f6ba0218e9615d18a76f244a874b941f8c434f,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.810869013554,FALSE,IFEval,0.734420227219334,73.4420227219334,BBH,0.596843953070895,42.6117312683706,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.343959731543624,12.5279642058166,MUSR,0.450208333333333,15.2760416666667,MMLU-PRO,0.418384308510638,35.3760342789598,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-22,2024-10-26,1,sam-paech/Darkest-muse-v1 (Merge),apache-2.0,35,10.159,2.20694726611163 +sam-paech/Darkest-muse-v1_bfloat16_55f6ba0218e9615d18a76f244a874b941f8c434f_False,sam-paech/Darkest-muse-v1,55f6ba0218e9615d18a76f244a874b941f8c434f,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.810869013554,FALSE,IFEval,0.734420227219334,73.4420227219334,BBH,0.596843953070895,42.6117312683706,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.343959731543624,12.5279642058166,MUSR,0.450208333333333,15.2760416666667,MMLU-PRO,0.418384308510638,35.3760342789598,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-22,2024-10-26,1,sam-paech/Darkest-muse-v1 (Merge),apache-2.0,37,10.159,2.20694726611163 sam-paech/Delirium-v1_bfloat16_98dc2dad47af405013c0584d752504ca448bd8eb_False,sam-paech/Delirium-v1,98dc2dad47af405013c0584d752504ca448bd8eb,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,31.732318132305,FALSE,IFEval,0.720756481690803,72.0756481690803,BBH,0.596211383452173,42.3150790899333,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.343120805369128,12.4161073825503,MUSR,0.451447916666667,15.2309895833333,MMLU-PRO,0.418966090425532,35.440676713948,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-17,2024-10-26,1,unsloth/gemma-2-9b-it,gemma,13,9.242,2.3955012459142 -sam-paech/Quill-v1_bfloat16_3cab1cac9d3de0d25b48ea86b4533aa220231f20_False,sam-paech/Quill-v1,3cab1cac9d3de0d25b48ea86b4533aa220231f20,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,31.5030208676919,FALSE,IFEval,0.712213593265868,71.2213593265868,BBH,0.596922634798949,42.5976691390359,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.339765100671141,11.9686800894855,MUSR,0.455479166666667,16.1348958333333,MMLU-PRO,0.417137632978723,35.2375147754137,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-26,1,sam-paech/Quill-v1 (Merge),"",9,9.242,2.31346910671926 +sam-paech/Quill-v1_bfloat16_3cab1cac9d3de0d25b48ea86b4533aa220231f20_False,sam-paech/Quill-v1,3cab1cac9d3de0d25b48ea86b4533aa220231f20,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,31.5030208676919,FALSE,IFEval,0.712213593265868,71.2213593265868,BBH,0.596922634798949,42.5976691390359,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.339765100671141,11.9686800894855,MUSR,0.455479166666667,16.1348958333333,MMLU-PRO,0.417137632978723,35.2375147754137,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-26,1,sam-paech/Quill-v1 (Merge),"",10,9.242,2.31346910671926 schnapss/testmerge-7b_bfloat16_ff84f5b87ba51db9622b1c553c076533890a8f50_False,schnapss/testmerge-7b,ff84f5b87ba51db9622b1c553c076533890a8f50,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,20.9134460848223,FALSE,IFEval,0.392228176793131,39.2228176793131,BBH,0.518747840563738,32.6381662414967,MATH Level 5,0.0687311178247734,6.87311178247734,GPQA,0.296140939597315,6.15212527964205,MUSR,0.4685625,17.7036458333333,MMLU-PRO,0.306017287234043,22.8908096926714,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-16,2024-11-16,1,schnapss/testmerge-7b (Merge),"",0,7.242,0.470154717477583 sci-m-wang/Mistral-7B-Instruct-sa-v0.1_bfloat16_2dcff66eac0c01dc50e4c41eea959968232187fe_True,sci-m-wang/Mistral-7B-Instruct-sa-v0.1,2dcff66eac0c01dc50e4c41eea959968232187fe,bfloat16,chatmodels,Adapter,?,12.2000642869982,TRUE,IFEval,0.433518619485188,43.3518619485188,BBH,0.327278215614117,5.74364607742995,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.259228187919463,1.23042505592841,MUSR,0.39,6.68333333333333,MMLU-PRO,0.236203457446809,15.1337174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-31,2024-06-27,2,mistralai/Mistral-7B-v0.1,other,0,14.483,0.765082309391731 sci-m-wang/Phi-3-mini-4k-instruct-sa-v0.1_bfloat16_5a516f86087853f9d560c95eb9209c1d4ed9ff69_True,sci-m-wang/Phi-3-mini-4k-instruct-sa-v0.1,5a516f86087853f9d560c95eb9209c1d4ed9ff69,bfloat16,chatmodels,Adapter,?,25.7737920491517,TRUE,IFEval,0.502062305793073,50.2062305793073,BBH,0.550203872238305,36.6054191487681,MATH Level 5,0.145015105740181,14.5015105740181,GPQA,0.328859060402685,10.5145413870246,MUSR,0.407302083333333,9.64609375,MMLU-PRO,0.398520611702128,33.168956855792,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-01,2024-06-27,1,microsoft/Phi-3-mini-4k-instruct,other,0,7.642,1.28050267506016 @@ -2604,7 +2608,7 @@ sometimesanotion/IF-reasoning-experiment-40_bfloat16_0064fffb67d18b0f946b6e7bf32 sometimesanotion/IF-reasoning-experiment-80_bfloat16_d1441e8bd87f11235fd4c708f6ece69a9973c343_False,sometimesanotion/IF-reasoning-experiment-80,d1441e8bd87f11235fd4c708f6ece69a9973c343,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,21.7767402543259,FALSE,IFEval,0.546276102962362,54.6276102962362,BBH,0.421038361322393,17.4823395728022,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.284395973154362,4.58612975391499,MUSR,0.502458333333333,22.9739583333333,MMLU-PRO,0.336768617021277,26.3076241134752,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-29,0,Removed,"",0,7.383,1.88698243352404 sometimesanotion/Lamarck-14B-v0.1-experimental_bfloat16_b0600e08e8c97b25d1abca543b997d9927245442_False,sometimesanotion/Lamarck-14B-v0.1-experimental,b0600e08e8c97b25d1abca543b997d9927245442,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.6709959612302,FALSE,IFEval,0.535385000687066,53.5385000687066,BBH,0.658253923996733,50.7949076691947,MATH Level 5,0.305135951661631,30.5135951661631,GPQA,0.381711409395973,17.5615212527964,MUSR,0.47284375,18.6388020833333,MMLU-PRO,0.540807845744681,48.9786495271868,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-09,0,Removed,"",0,14.766,1.8946933781146 sometimesanotion/Lamarck-14B-v0.3_bfloat16_781637d1b65766fe933ebde070632e48f91390ab_False,sometimesanotion/Lamarck-14B-v0.3,781637d1b65766fe933ebde070632e48f91390ab,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.5760956938364,FALSE,IFEval,0.503161611191638,50.3161611191638,BBH,0.661140046537316,51.2743085882105,MATH Level 5,0.324018126888218,32.4018126888218,GPQA,0.388422818791946,18.4563758389262,MUSR,0.4688125,18.0015625,MMLU-PRO,0.541057180851064,49.006353427896,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-06,2024-12-09,1,sometimesanotion/Lamarck-14B-v0.3 (Merge),apache-2.0,2,14.766,7.63918131611033 -sometimesanotion/Lamarck-14B-v0.4-Qwenvergence_bfloat16_add9a151dd5614603bebcf3d3740fa92e5d67632_False,sometimesanotion/Lamarck-14B-v0.4-Qwenvergence,add9a151dd5614603bebcf3d3740fa92e5d67632,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.5697935328493,FALSE,IFEval,0.490647038746083,49.0647038746083,BBH,0.653514219232406,50.2080449984793,MATH Level 5,0.336858006042296,33.6858006042296,GPQA,0.378355704697987,17.1140939597315,MUSR,0.4846875,20.3859375,MMLU-PRO,0.540641622340426,48.9601802600473,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-12,2024-12-12,1,sometimesanotion/Lamarck-14B-v0.4-Qwenvergence (Merge),apache-2.0,3,14.766,1.74126349788564 +sometimesanotion/Lamarck-14B-v0.4-Qwenvergence_bfloat16_add9a151dd5614603bebcf3d3740fa92e5d67632_False,sometimesanotion/Lamarck-14B-v0.4-Qwenvergence,add9a151dd5614603bebcf3d3740fa92e5d67632,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.5697935328493,FALSE,IFEval,0.490647038746083,49.0647038746083,BBH,0.653514219232406,50.2080449984793,MATH Level 5,0.336858006042296,33.6858006042296,GPQA,0.378355704697987,17.1140939597315,MUSR,0.4846875,20.3859375,MMLU-PRO,0.540641622340426,48.9601802600473,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-12,0,Removed,"",0,14.766,1.74126349788564 sometimesanotion/Lamarck-14B-v0.6_bfloat16_e9c144208c045fe6954ef3f658a3bda38dbd0d82_False,sometimesanotion/Lamarck-14B-v0.6,e9c144208c045fe6954ef3f658a3bda38dbd0d82,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,40.3743925507204,FALSE,IFEval,0.697251071601129,69.7251071601129,BBH,0.646031223378293,49.2978946293996,MATH Level 5,0.356495468277946,35.6495468277946,GPQA,0.389261744966443,18.5682326621924,MUSR,0.4846875,20.1192708333333,MMLU-PRO,0.539976728723404,48.8863031914894,TRUE,TRUE,FALSE,FALSE,FALSE,2025-01-04,2025-01-05,1,sometimesanotion/Lamarck-14B-v0.6 (Merge),apache-2.0,7,14.766,1.92238474367017 sometimesanotion/Lamarck-14B-v0.6-002-model_stock_bfloat16_c2d5adb04b1839aeeca77a3f2a5be08864116da1_False,sometimesanotion/Lamarck-14B-v0.6-002-model_stock,c2d5adb04b1839aeeca77a3f2a5be08864116da1,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.8533497474969,FALSE,IFEval,0.669224324791553,66.9224324791553,BBH,0.61433491887247,45.0065835596136,MATH Level 5,0.341389728096677,34.1389728096677,GPQA,0.374161073825503,16.5548098434004,MUSR,0.518020833333333,25.4526041666667,MMLU-PRO,0.505402260638298,45.0446956264775,FALSE,FALSE,FALSE,FALSE,FALSE,"",2025-01-01,0,Removed,"",0,7.383,1.88792566629548 sometimesanotion/Lamarck-14B-v0.6-model_stock_bfloat16_4d4227285a889ffd23618ad32ff7b08d1bcfa5ae_False,sometimesanotion/Lamarck-14B-v0.6-model_stock,4d4227285a889ffd23618ad32ff7b08d1bcfa5ae,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,39.5809157697373,FALSE,IFEval,0.678966253983874,67.8966253983874,BBH,0.626943653275322,46.4913260828855,MATH Level 5,0.358761329305136,35.8761329305136,GPQA,0.384228187919463,17.8970917225951,MUSR,0.50065625,22.68203125,MMLU-PRO,0.519780585106383,46.6422872340426,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-31,0,Removed,"",0,7.383,1.86163928950389 @@ -2630,7 +2634,7 @@ sometimesanotion/Qwenvergence-14B-qv256_bfloat16_13e8b600da0b78b23481738858b7ed2 sometimesanotion/Qwenvergence-14B-v0.6-004-model_stock_bfloat16_1fa94759545d9b591bcbbe93a2c90f2a346f9580_False,sometimesanotion/Qwenvergence-14B-v0.6-004-model_stock,1fa94759545d9b591bcbbe93a2c90f2a346f9580,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,39.0050696147173,FALSE,IFEval,0.685985407607371,68.5985407607371,BBH,0.624933870754005,46.366653802814,MATH Level 5,0.313444108761329,31.3444108761329,GPQA,0.383389261744966,17.7852348993289,MUSR,0.503322916666667,23.3486979166667,MMLU-PRO,0.519281914893617,46.5868794326241,FALSE,FALSE,FALSE,FALSE,FALSE,"",2025-01-01,0,Removed,"",0,7.383,1.9097512481641 sometimesanotion/Qwenvergence-14B-v2-Prose_bfloat16_503b367e07a8ed3ce532d03ea35d40d8f17d6e35_False,sometimesanotion/Qwenvergence-14B-v2-Prose,503b367e07a8ed3ce532d03ea35d40d8f17d6e35,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.7410656363901,FALSE,IFEval,0.47048830436575,47.048830436575,BBH,0.651883047351897,49.9334719916437,MATH Level 5,0.342900302114804,34.2900302114804,GPQA,0.393456375838926,19.1275167785235,MUSR,0.49259375,21.47421875,MMLU-PRO,0.537150930851064,48.5723256501182,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-15,0,Removed,"",0,14,1.68478875223377 sometimesanotion/Qwenvergence-14B-v3_bfloat16_40c489fd71724f2fa3f7154e4874c6d00700c6c0_False,sometimesanotion/Qwenvergence-14B-v3,40c489fd71724f2fa3f7154e4874c6d00700c6c0,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.1648327984762,FALSE,IFEval,0.504410519643435,50.4410519643435,BBH,0.654823836148701,50.3526875150537,MATH Level 5,0.348187311178248,34.8187311178248,GPQA,0.384228187919463,17.8970917225951,MUSR,0.48859375,20.7408854166667,MMLU-PRO,0.538646941489362,48.7385490543735,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,7.383,1.9028150731847 -sometimesanotion/Qwenvergence-14B-v3-Prose_bfloat16_15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b_False,sometimesanotion/Qwenvergence-14B-v3-Prose,15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.3708094176769,FALSE,IFEval,0.49177072390147,49.177072390147,BBH,0.651291317094932,49.7983666809914,MATH Level 5,0.355740181268882,35.5740181268882,GPQA,0.39513422818792,19.3512304250559,MUSR,0.493895833333333,21.7703125,MMLU-PRO,0.536984707446809,48.5538563829787,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,sometimesanotion/Qwenvergence-14B-v3-Prose (Merge),apache-2.0,2,14.766,1.71134135251856 +sometimesanotion/Qwenvergence-14B-v3-Prose_bfloat16_15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b_False,sometimesanotion/Qwenvergence-14B-v3-Prose,15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.3708094176769,FALSE,IFEval,0.49177072390147,49.177072390147,BBH,0.651291317094932,49.7983666809914,MATH Level 5,0.355740181268882,35.5740181268882,GPQA,0.39513422818792,19.3512304250559,MUSR,0.493895833333333,21.7703125,MMLU-PRO,0.536984707446809,48.5538563829787,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,14.766,1.71134135251856 sometimesanotion/Qwenvergence-14B-v3-Reason_float16_1e613b0e6bfdb08e7c21a3e6ba3b84e361cf8350_False,sometimesanotion/Qwenvergence-14B-v3-Reason,1e613b0e6bfdb08e7c21a3e6ba3b84e361cf8350,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,37.0468000181585,FALSE,IFEval,0.536683776823273,53.6683776823274,BBH,0.656128395746618,50.6944479886705,MATH Level 5,0.324018126888218,32.4018126888218,GPQA,0.386744966442953,18.2326621923937,MUSR,0.474020833333333,18.4526041666667,MMLU-PRO,0.539478058510638,48.8308953900709,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,7.383,1.89560397778342 sometimesanotion/Qwenvergence-14B-v3-Reason_bfloat16_6acf3cbc9c36b19d66ac683f073e32a9bf86d56e_False,sometimesanotion/Qwenvergence-14B-v3-Reason,6acf3cbc9c36b19d66ac683f073e32a9bf86d56e,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.7140481268604,FALSE,IFEval,0.527816194364287,52.7816194364287,BBH,0.655743756682434,50.6357761372748,MATH Level 5,0.311933534743202,31.1933534743202,GPQA,0.384228187919463,17.8970917225951,MUSR,0.475416666666667,18.9270833333333,MMLU-PRO,0.539644281914894,48.8493646572104,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,7.383,1.92617191333061 sometimesanotion/Qwenvergence-14B-v6-Prose_bfloat16_bbb6b0900b630a3120d036d3434ca0fa508ed559_False,sometimesanotion/Qwenvergence-14B-v6-Prose,bbb6b0900b630a3120d036d3434ca0fa508ed559,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.8249662267441,FALSE,IFEval,0.599007300628998,59.9007300628998,BBH,0.65437502308072,50.1199760400256,MATH Level 5,0.348942598187311,34.8942598187311,GPQA,0.388422818791946,18.4563758389262,MUSR,0.48865625,21.0153645833333,MMLU-PRO,0.537067819148936,48.5630910165485,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-26,0,Removed,"",0,7.383,1.93526414003491 @@ -2656,7 +2660,7 @@ spow12/ChatWaifu_v2.0_22B_float16_54771319920ed791ba3f0262b036f37a92b880f2_True, spow12/ChatWaifu_v2.0_22B_bfloat16_a6e7c206d9af77d3f85faf0ce4a711d62815b2ab_True,spow12/ChatWaifu_v2.0_22B,a6e7c206d9af77d3f85faf0ce4a711d62815b2ab,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,28.8686591874693,TRUE,IFEval,0.651738498295633,65.1738498295633,BBH,0.5908050619551,42.0197980925151,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.323825503355705,9.84340044742729,MUSR,0.384197916666667,5.59140625,MMLU-PRO,0.381233377659575,31.2481530732861,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-11,2024-10-14,1,spow12/ChatWaifu_v2.0_22B (Merge),cc-by-nc-4.0,8,22.247,1.39586011554328 ssmits/Qwen2.5-95B-Instruct_bfloat16_9c0e7df57a4fcf4d364efd916a0fc0abdd2d20a3_True,ssmits/Qwen2.5-95B-Instruct,9c0e7df57a4fcf4d364efd916a0fc0abdd2d20a3,bfloat16,chatmodels,Original,Qwen2ForCausalLM,37.4401249883746,TRUE,IFEval,0.843105183136301,84.3105183136301,BBH,0.703779969748824,58.5303513228511,MATH Level 5,0.061178247734139,6.1178247734139,GPQA,0.364093959731544,15.2125279642058,MUSR,0.428385416666667,13.61484375,MMLU-PRO,0.521692154255319,46.8546838061466,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-24,2024-09-26,1,ssmits/Qwen2.5-95B-Instruct (Merge),other,3,94.648,19.2334948028144 stabilityai/StableBeluga2_bfloat16_cb47d3db70ea3ddc2cabdeb358c303b328f65900_False,stabilityai/StableBeluga2,cb47d3db70ea3ddc2cabdeb358c303b328f65900,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.6828417931441,FALSE,IFEval,0.378714034317832,37.8714034317832,BBH,0.582412813455381,41.2632611272238,MATH Level 5,0.0362537764350453,3.62537764350453,GPQA,0.316275167785235,8.83668903803132,MUSR,0.47296875,18.6544270833333,MMLU-PRO,0.332613031914894,25.8458924349882,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-20,2024-06-13,0,stabilityai/StableBeluga2,"",884,68.977,6.25467365604401 -stabilityai/stablelm-2-12b_bfloat16_fead13ddbf4492970666650c3cd6f85f485411ec_False,stabilityai/stablelm-2-12b,fead13ddbf4492970666650c3cd6f85f485411ec,bfloat16,pretrained,Original,StableLmForCausalLM,13.9357224770686,FALSE,IFEval,0.156921412962052,15.6921412962052,BBH,0.450865417111477,22.685797482044,MATH Level 5,0.0392749244712991,3.92749244712991,GPQA,0.278523489932886,3.80313199105145,MUSR,0.447885416666667,14.4856770833333,MMLU-PRO,0.30718085106383,23.0200945626478,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-21,2024-06-12,0,stabilityai/stablelm-2-12b,other,117,12.143,1.47327922426156 +stabilityai/stablelm-2-12b_bfloat16_fead13ddbf4492970666650c3cd6f85f485411ec_False,stabilityai/stablelm-2-12b,fead13ddbf4492970666650c3cd6f85f485411ec,bfloat16,pretrained,Original,StableLmForCausalLM,13.9357224770686,FALSE,IFEval,0.156921412962052,15.6921412962052,BBH,0.450865417111477,22.685797482044,MATH Level 5,0.0392749244712991,3.92749244712991,GPQA,0.278523489932886,3.80313199105145,MUSR,0.447885416666667,14.4856770833333,MMLU-PRO,0.30718085106383,23.0200945626478,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-21,2024-06-12,0,stabilityai/stablelm-2-12b,other,118,12.143,1.47327922426156 stabilityai/stablelm-2-12b-chat_bfloat16_b6b62cd451b84e848514c00fafa66d9ead9297c5_True,stabilityai/stablelm-2-12b-chat,b6b62cd451b84e848514c00fafa66d9ead9297c5,bfloat16,chatmodels,Original,StableLmForCausalLM,16.2494771147373,TRUE,IFEval,0.408164780560025,40.8164780560025,BBH,0.467202473128281,25.2536970908126,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.266778523489933,2.23713646532438,MUSR,0.391427083333333,7.72838541666667,MMLU-PRO,0.2734375,19.2708333333333,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-04,2024-06-12,0,stabilityai/stablelm-2-12b-chat,other,88,12.143,1.08809668593683 stabilityai/stablelm-2-1_6b_float16_8879812cccd176fbbe9ceb747b815bcc7d6499f8_False,stabilityai/stablelm-2-1_6b,8879812cccd176fbbe9ceb747b815bcc7d6499f8,float16,pretrained,Original,StableLmForCausalLM,5.21612653885089,FALSE,IFEval,0.115705217711228,11.5705217711228,BBH,0.338457720511071,8.63269520496884,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.248322147651007,0,MUSR,0.388197916666667,5.79140625,MMLU-PRO,0.146359707446809,5.15107860520095,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-18,2024-06-12,0,stabilityai/stablelm-2-1_6b,other,187,1.645,0.549871827675722 stabilityai/stablelm-2-1_6b-chat_bfloat16_f3fe67057c2789ae1bb1fe42b038da99840d4f13_True,stabilityai/stablelm-2-1_6b-chat,f3fe67057c2789ae1bb1fe42b038da99840d4f13,bfloat16,chatmodels,Original,StableLmForCausalLM,8.64077458938206,TRUE,IFEval,0.305999193251683,30.5999193251683,BBH,0.339017239548652,7.49337829741063,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.24748322147651,0,MUSR,0.35796875,5.71276041666667,MMLU-PRO,0.162150930851064,6.90565898345154,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-08,2024-06-12,0,stabilityai/stablelm-2-1_6b-chat,other,32,1.645,0.495426508518865 @@ -2719,17 +2723,17 @@ tiiuae/Falcon3-10B-Base_bfloat16_0b20cceec08ec598ed2de7a6dfbeb208f1eae656_False, tiiuae/Falcon3-10B-Instruct_bfloat16_9be8471432d7c4f35f72505fa2ca4101f0a2ed6d_True,tiiuae/Falcon3-10B-Instruct,9be8471432d7c4f35f72505fa2ca4101f0a2ed6d,bfloat16,chatmodels,Original,LlamaForCausalLM,35.1858847768594,TRUE,IFEval,0.78165600606391,78.1656006063911,BBH,0.617046939805208,44.8215398248313,MATH Level 5,0.259063444108761,25.9063444108761,GPQA,0.328859060402685,10.5145413870246,MUSR,0.432322916666667,13.60703125,MMLU-PRO,0.442902260638298,38.1002511820331,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,1,tiiuae/Falcon3-10B-Base,other,81,10.306,0.840411143061328 tiiuae/Falcon3-1B-Base_bfloat16_cc56a5a7c3923821312ad14f52c5a7c3fa835cbc_False,tiiuae/Falcon3-1B-Base,cc56a5a7c3923821312ad14f52c5a7c3fa835cbc,bfloat16,pretrained,Original,LlamaForCausalLM,9.8377436362263,FALSE,IFEval,0.242801322712625,24.2801322712625,BBH,0.357115391801564,11.3431732658549,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.279362416107383,3.91498881431767,MUSR,0.414739583333333,9.70911458333333,MMLU-PRO,0.160821143617021,6.7579048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-16,0,tiiuae/Falcon3-1B-Base,other,13,1.669,0.401369486782322 tiiuae/Falcon3-1B-Instruct_bfloat16_27dd70ccb22fd3cc71c5adbc95eb670455afff3d_True,tiiuae/Falcon3-1B-Instruct,27dd70ccb22fd3cc71c5adbc95eb670455afff3d,bfloat16,chatmodels,Original,LlamaForCausalLM,15.3211934957275,TRUE,IFEval,0.555667850193043,55.5667850193043,BBH,0.374453569136667,12.9613740625082,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.418895833333333,10.5619791666667,MMLU-PRO,0.183843085106383,9.31589834515366,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,1,tiiuae/Falcon3-1B-Base,other,28,1.669,0.397020363950145 -tiiuae/Falcon3-3B-Base_bfloat16_3d49753006a0fa5384031a737c60fbcd0f60b7f2_False,tiiuae/Falcon3-3B-Base,3d49753006a0fa5384031a737c60fbcd0f60b7f2,bfloat16,pretrained,Original,LlamaForCausalLM,15.7513313104367,FALSE,IFEval,0.27649857932508,27.649857932508,BBH,0.442136782587439,21.5847842937733,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.296979865771812,6.26398210290828,MUSR,0.374989583333333,6.27369791666667,MMLU-PRO,0.287898936170213,20.8776595744681,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,0,tiiuae/Falcon3-3B-Base,other,14,3.228,0.481216475612645 +tiiuae/Falcon3-3B-Base_bfloat16_3d49753006a0fa5384031a737c60fbcd0f60b7f2_False,tiiuae/Falcon3-3B-Base,3d49753006a0fa5384031a737c60fbcd0f60b7f2,bfloat16,pretrained,Original,LlamaForCausalLM,15.7513313104367,FALSE,IFEval,0.27649857932508,27.649857932508,BBH,0.442136782587439,21.5847842937733,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.296979865771812,6.26398210290828,MUSR,0.374989583333333,6.27369791666667,MMLU-PRO,0.287898936170213,20.8776595744681,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,0,tiiuae/Falcon3-3B-Base,other,15,3.228,0.481216475612645 tiiuae/Falcon3-3B-Instruct_bfloat16_552213004cecf9bb6ce332f46da0d4324c8347f1_True,tiiuae/Falcon3-3B-Instruct,552213004cecf9bb6ce332f46da0d4324c8347f1,bfloat16,chatmodels,Original,LlamaForCausalLM,26.5519924326426,TRUE,IFEval,0.697675501004003,69.7675501004003,BBH,0.475443033216757,26.2872294684327,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.288590604026846,5.14541387024609,MUSR,0.41359375,11.1325520833333,MMLU-PRO,0.300531914893617,22.2813238770686,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,0,tiiuae/Falcon3-3B-Instruct,other,22,3.228,0.480463645995229 tiiuae/Falcon3-7B-Base_bfloat16_a1cf49eb7a53210fc2ee82f3876bbc7efb2244fd_False,tiiuae/Falcon3-7B-Base,a1cf49eb7a53210fc2ee82f3876bbc7efb2244fd,bfloat16,pretrained,Original,LlamaForCausalLM,24.7205491267482,FALSE,IFEval,0.341594746384039,34.1594746384039,BBH,0.509888046642671,31.5599185475034,MATH Level 5,0.192598187311178,19.2598187311178,GPQA,0.346476510067114,12.8635346756152,MUSR,0.470208333333333,18.1427083333333,MMLU-PRO,0.391040558510638,32.3378398345154,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-21,2024-12-12,0,tiiuae/Falcon3-7B-Base,other,21,7.456,0.609372047303554 tiiuae/Falcon3-7B-Instruct_bfloat16_7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06_True,tiiuae/Falcon3-7B-Instruct,7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06,bfloat16,chatmodels,Original,LlamaForCausalLM,34.9066990629732,TRUE,IFEval,0.761247933261524,76.1247933261524,BBH,0.563244278519333,37.9158124591715,MATH Level 5,0.318731117824773,31.8731117824773,GPQA,0.310402684563758,8.05369127516779,MUSR,0.482677083333333,21.16796875,MMLU-PRO,0.40874335106383,34.30481678487,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-29,2024-12-16,1,tiiuae/Falcon3-7B-Base,other,43,7.456,0.618760668612507 -tiiuae/Falcon3-Mamba-7B-Base_bfloat16_f08d14145ce86c32dd04f18bacb3f12b247042e2_False,tiiuae/Falcon3-Mamba-7B-Base,f08d14145ce86c32dd04f18bacb3f12b247042e2,bfloat16,pretrained,Original,FalconMambaForCausalLM,18.1262038589633,FALSE,IFEval,0.289112887139457,28.9112887139457,BBH,0.469928018882704,25.5340488029532,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.309563758389262,7.94183445190157,MUSR,0.343145833333333,4.39322916666667,MMLU-PRO,0.303773271276596,22.6414745862884,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-12,0,tiiuae/Falcon3-Mamba-7B-Base,other,17,7.273,0.83631814366917 +tiiuae/Falcon3-Mamba-7B-Base_bfloat16_f08d14145ce86c32dd04f18bacb3f12b247042e2_False,tiiuae/Falcon3-Mamba-7B-Base,f08d14145ce86c32dd04f18bacb3f12b247042e2,bfloat16,pretrained,Original,FalconMambaForCausalLM,18.1262038589633,FALSE,IFEval,0.289112887139457,28.9112887139457,BBH,0.469928018882704,25.5340488029532,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.309563758389262,7.94183445190157,MUSR,0.343145833333333,4.39322916666667,MMLU-PRO,0.303773271276596,22.6414745862884,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-12,0,tiiuae/Falcon3-Mamba-7B-Base,other,18,7.273,0.83631814366917 tiiuae/Falcon3-Mamba-7B-Instruct_bfloat16_382561849d1509b5f1a4d7a38bb286b3c4f46fbd_True,tiiuae/Falcon3-Mamba-7B-Instruct,382561849d1509b5f1a4d7a38bb286b3c4f46fbd,bfloat16,chatmodels,Original,FalconMambaForCausalLM,27.643894386327,TRUE,IFEval,0.716509971320541,71.6509971320541,BBH,0.467895768841069,25.2035051723981,MATH Level 5,0.272658610271903,27.2658610271903,GPQA,0.303691275167785,7.15883668903803,MUSR,0.386864583333333,8.25807291666667,MMLU-PRO,0.336934840425532,26.3260933806147,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,1,tiiuae/Falcon3-Mamba-7B-Instruct (Merge),other,19,7.273,0.828497506621677 tiiuae/falcon-11B_bfloat16_066e3bf4e2d9aaeefa129af0a6d39727d27816b3_False,tiiuae/falcon-11B,066e3bf4e2d9aaeefa129af0a6d39727d27816b3,bfloat16,pretrained,Original,FalconForCausalLM,13.814138235727,FALSE,IFEval,0.326132439704429,32.6132439704429,BBH,0.439163703554938,21.9379994628903,MATH Level 5,0.0256797583081571,2.56797583081571,GPQA,0.270973154362416,2.79642058165548,MUSR,0.398645833333333,7.53072916666667,MMLU-PRO,0.238946143617021,15.4384604018913,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-09,2024-06-09,0,tiiuae/falcon-11B,unknown,212,11.103,1.08287099141766 tiiuae/falcon-40b_bfloat16_4a70170c215b36a3cce4b4253f6d0612bb7d4146_False,tiiuae/falcon-40b,4a70170c215b36a3cce4b4253f6d0612bb7d4146,bfloat16,pretrained,Original,FalconForCausalLM,11.3635401118469,FALSE,IFEval,0.249645385355302,24.9645385355302,BBH,0.40185324955958,16.5833047303122,MATH Level 5,0.0158610271903323,1.58610271903323,GPQA,0.273489932885906,3.13199105145414,MUSR,0.363145833333333,5.19322916666667,MMLU-PRO,0.250498670212766,16.7220744680851,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-24,2024-06-09,0,tiiuae/falcon-40b,apache-2.0,2424,40,21.7935839014342 tiiuae/falcon-40b-instruct_bfloat16_ecb78d97ac356d098e79f0db222c9ce7c5d9ee5f_False,tiiuae/falcon-40b-instruct,ecb78d97ac356d098e79f0db222c9ce7c5d9ee5f,bfloat16,chatmodels,Original,FalconForCausalLM,10.4341543148279,FALSE,IFEval,0.24544874266945,24.544874266945,BBH,0.40538675151592,17.2201142032645,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.25,0,MUSR,0.376229166666667,5.16197916666667,MMLU-PRO,0.226146941489362,14.0163268321513,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-25,2024-06-09,0,tiiuae/falcon-40b-instruct,apache-2.0,1174,40,19.7332454871768 tiiuae/falcon-7b_bfloat16_898df1396f35e447d5fe44e0a3ccaaaa69f30d36_False,tiiuae/falcon-7b,898df1396f35e447d5fe44e0a3ccaaaa69f30d36,bfloat16,pretrained,Original,FalconForCausalLM,5.11050413623086,FALSE,IFEval,0.182051401392749,18.2051401392749,BBH,0.328524461173222,5.96393691187605,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.24496644295302,0,MUSR,0.37784375,4.49713541666667,MMLU-PRO,0.112533244680851,1.39258274231678,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-24,2024-06-09,0,tiiuae/falcon-7b,apache-2.0,1083,7,0.785841237420765 -tiiuae/falcon-7b-instruct_bfloat16_cf4b3c42ce2fdfe24f753f0f0d179202fea59c99_False,tiiuae/falcon-7b-instruct,cf4b3c42ce2fdfe24f753f0f0d179202fea59c99,bfloat16,chatmodels,Original,FalconForCausalLM,5.01586897414341,FALSE,IFEval,0.196888699761078,19.6888699761078,BBH,0.320342215123558,4.82317846067443,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.24748322147651,0,MUSR,0.363364583333333,3.25390625,MMLU-PRO,0.115525265957447,1.72502955082742,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-25,2024-06-09,0,tiiuae/falcon-7b-instruct,apache-2.0,935,7,0.766214525605888 +tiiuae/falcon-7b-instruct_bfloat16_cf4b3c42ce2fdfe24f753f0f0d179202fea59c99_False,tiiuae/falcon-7b-instruct,cf4b3c42ce2fdfe24f753f0f0d179202fea59c99,bfloat16,chatmodels,Original,FalconForCausalLM,5.01586897414341,FALSE,IFEval,0.196888699761078,19.6888699761078,BBH,0.320342215123558,4.82317846067443,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.24748322147651,0,MUSR,0.363364583333333,3.25390625,MMLU-PRO,0.115525265957447,1.72502955082742,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-25,2024-06-09,0,tiiuae/falcon-7b-instruct,apache-2.0,936,7,0.766214525605888 tiiuae/falcon-mamba-7b_bfloat16_5337fd73f19847e111ba2291f3f0e1617b90c37d_False,tiiuae/falcon-mamba-7b,5337fd73f19847e111ba2291f3f0e1617b90c37d,bfloat16,pretrained,Original,FalconMambaForCausalLM,15.1162974435226,FALSE,IFEval,0.333576022730799,33.3576022730799,BBH,0.428485498860437,19.8768778035434,MATH Level 5,0.040785498489426,4.0785498489426,GPQA,0.310402684563758,8.05369127516779,MUSR,0.42103125,10.8622395833333,MMLU-PRO,0.230219414893617,14.4688238770686,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-17,2024-07-23,0,tiiuae/falcon-mamba-7b,other,225,7,3.61040791749829 tklohj/WindyFloLLM_float16_21f4241ab3f091d1d309e9076a8d8e3f014908a8_False,tklohj/WindyFloLLM,21f4241ab3f091d1d309e9076a8d8e3f014908a8,float16,pretrained,Original,LlamaForCausalLM,14.2058910531351,FALSE,IFEval,0.26685638550158,26.685638550158,BBH,0.463661600705879,24.3987631978505,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.275167785234899,3.35570469798658,MUSR,0.4253125,11.8640625,MMLU-PRO,0.258144946808511,17.5716607565012,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-30,2024-07-10,1,tklohj/WindyFloLLM (Merge),"",0,13.016,1.09851209304988 togethercomputer/GPT-JT-6B-v1_float16_f34aa35f906895602c1f86f5685e598afdea8051_False,togethercomputer/GPT-JT-6B-v1,f34aa35f906895602c1f86f5685e598afdea8051,float16,fine-tunedondomain-specificdatasets,Original,GPTJForCausalLM,6.82735436046721,FALSE,IFEval,0.206106464181705,20.6106464181705,BBH,0.330266091274267,7.31852396514161,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.260906040268456,1.45413870246085,MUSR,0.37365625,3.87369791666667,MMLU-PRO,0.162566489361702,6.95183215130023,TRUE,FALSE,FALSE,FALSE,TRUE,2022-11-24,2024-06-12,0,togethercomputer/GPT-JT-6B-v1,apache-2.0,301,6,37.9588106808561 @@ -2744,9 +2748,9 @@ togethercomputer/RedPajama-INCITE-Chat-3B-v1_float16_f0e0995eba801096ed04cb87931 togethercomputer/RedPajama-INCITE-Instruct-3B-v1_float16_0c66778ee09a036886741707733620b91057909a_False,togethercomputer/RedPajama-INCITE-Instruct-3B-v1,0c66778ee09a036886741707733620b91057909a,float16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,5.67652662558519,FALSE,IFEval,0.212426362052687,21.2426362052687,BBH,0.314601775205724,4.51078636892698,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.24748322147651,0,MUSR,0.388604166666667,6.40885416666667,MMLU-PRO,0.110954122340426,1.21712470449173,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-05,2024-06-12,0,togethercomputer/RedPajama-INCITE-Instruct-3B-v1,apache-2.0,93,3,0.760671034709841 tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1_bfloat16_1fae784584dd03680b72dd4de7eefbc5b7cabcd5_True,tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1,1fae784584dd03680b72dd4de7eefbc5b7cabcd5,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.3073854674577,TRUE,IFEval,0.550771951754678,55.0771951754678,BBH,0.5009389976232,29.2679661316177,MATH Level 5,0.0725075528700906,7.25075528700906,GPQA,0.289429530201342,5.2572706935123,MUSR,0.435697916666667,13.7955729166667,MMLU-PRO,0.308759973404255,23.1955526004728,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-26,2024-09-12,0,tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1,llama3,18,8.03,0.858110170753023 unsloth/Phi-3-mini-4k-instruct_float16_636c707430a5509c80b1aa51d05c127ed339a975_True,unsloth/Phi-3-mini-4k-instruct,636c707430a5509c80b1aa51d05c127ed339a975,float16,basemergesandmoerges,Original,MistralForCausalLM,27.1783743374799,TRUE,IFEval,0.544027624480822,54.4027624480822,BBH,0.550023946744103,36.732473265614,MATH Level 5,0.154078549848943,15.4078549848943,GPQA,0.322986577181208,9.73154362416107,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.403091755319149,33.6768617021277,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-11-25,0,unsloth/Phi-3-mini-4k-instruct,mit,41,3.821,0.469533108024419 -unsloth/phi-4_bfloat16_682399cd249206f583fc19473d5a28af0a9bcea7_True,unsloth/phi-4,682399cd249206f583fc19473d5a28af0a9bcea7,bfloat16,chatmodels,Original,LlamaForCausalLM,34.4845983494698,TRUE,IFEval,0.688208398161323,68.8208398161323,BBH,0.688587440604014,55.2531449984701,MATH Level 5,0.125377643504532,12.5377643504532,GPQA,0.336409395973154,11.5212527964206,MUSR,0.411427083333333,10.1283854166667,MMLU-PRO,0.537815824468085,48.6462027186761,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,microsoft/phi-4,mit,41,14.66,0.943269263333302 +unsloth/phi-4_bfloat16_682399cd249206f583fc19473d5a28af0a9bcea7_True,unsloth/phi-4,682399cd249206f583fc19473d5a28af0a9bcea7,bfloat16,chatmodels,Original,LlamaForCausalLM,34.4845983494698,TRUE,IFEval,0.688208398161323,68.8208398161323,BBH,0.688587440604014,55.2531449984701,MATH Level 5,0.125377643504532,12.5377643504532,GPQA,0.336409395973154,11.5212527964206,MUSR,0.411427083333333,10.1283854166667,MMLU-PRO,0.537815824468085,48.6462027186761,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,microsoft/phi-4,mit,45,14.66,0.943269263333302 unsloth/phi-4-bnb-4bit_bfloat16_85ca2925f3cc4f3c42de4168e9ba0695be5d5845_True,unsloth/phi-4-bnb-4bit,85ca2925f3cc4f3c42de4168e9ba0695be5d5845,bfloat16,chatmodels,Original,LlamaForCausalLM,34.616889577097,TRUE,IFEval,0.672971050146944,67.2971050146944,BBH,0.676985424233919,53.535199121413,MATH Level 5,0.194108761329305,19.4108761329305,GPQA,0.338087248322148,11.744966442953,MUSR,0.400729166666667,8.42447916666667,MMLU-PRO,0.525598404255319,47.2887115839244,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,microsoft/phi-4,mit,9,8.058,1.52387156863529 -unsloth/phi-4-unsloth-bnb-4bit_bfloat16_227e8cbc0de0cd783703a3a2f217159a86041a5f_True,unsloth/phi-4-unsloth-bnb-4bit,227e8cbc0de0cd783703a3a2f217159a86041a5f,bfloat16,chatmodels,Original,LlamaForCausalLM,34.9490798045053,TRUE,IFEval,0.679390683386747,67.9390683386747,BBH,0.679108989696876,53.8400810593204,MATH Level 5,0.200151057401813,20.0151057401813,GPQA,0.336409395973154,11.5212527964206,MUSR,0.403395833333333,8.7578125,MMLU-PRO,0.528590425531915,47.621158392435,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,microsoft/phi-4,mit,21,8.483,1.51876798310742 +unsloth/phi-4-unsloth-bnb-4bit_bfloat16_227e8cbc0de0cd783703a3a2f217159a86041a5f_True,unsloth/phi-4-unsloth-bnb-4bit,227e8cbc0de0cd783703a3a2f217159a86041a5f,bfloat16,chatmodels,Original,LlamaForCausalLM,34.9490798045053,TRUE,IFEval,0.679390683386747,67.9390683386747,BBH,0.679108989696876,53.8400810593204,MATH Level 5,0.200151057401813,20.0151057401813,GPQA,0.336409395973154,11.5212527964206,MUSR,0.403395833333333,8.7578125,MMLU-PRO,0.528590425531915,47.621158392435,TRUE,FALSE,FALSE,FALSE,FALSE,2025-01-08,2025-01-09,1,microsoft/phi-4,mit,24,8.483,1.51876798310742 upstage/SOLAR-10.7B-Instruct-v1.0_float16_c08c25ed66414a878fe0401a3596d536c083606c_True,upstage/SOLAR-10.7B-Instruct-v1.0,c08c25ed66414a878fe0401a3596d536c083606c,float16,chatmodels,Original,LlamaForCausalLM,19.6282553318946,TRUE,IFEval,0.473660997265035,47.3660997265035,BBH,0.516249494144699,31.8724018880021,MATH Level 5,0,0,GPQA,0.308724832214765,7.82997762863535,MUSR,0.3899375,6.9421875,MMLU-PRO,0.313829787234043,23.7588652482269,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,1,upstage/SOLAR-10.7B-Instruct-v1.0 (Merge),cc-by-nc-4.0,619,10.732,0.782775785638588 upstage/SOLAR-10.7B-v1.0_float16_a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5_False,upstage/SOLAR-10.7B-v1.0,a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5,float16,pretrained,Original,LlamaForCausalLM,4.9164478862809,FALSE,IFEval,0.171584728520326,17.1584728520326,BBH,0.299835173754951,2.14716276381869,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.260906040268456,1.45413870246085,MUSR,0.368197916666667,4.52473958333333,MMLU-PRO,0.116855053191489,1.87278368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,0,upstage/SOLAR-10.7B-v1.0,apache-2.0,295,10.732,1.51919401838023 upstage/solar-pro-preview-instruct_bfloat16_b4db141b5fb08b23f8bc323bc34e2cff3e9675f8_True,upstage/solar-pro-preview-instruct,b4db141b5fb08b23f8bc323bc34e2cff3e9675f8,bfloat16,chatmodels,Original,SolarForCausalLM,39.9008905140799,TRUE,IFEval,0.841581448334863,84.1581448334863,BBH,0.681684305137953,54.8223509998353,MATH Level 5,0.218277945619335,21.8277945619335,GPQA,0.370805369127517,16.1073825503356,MUSR,0.44165625,15.00703125,MMLU-PRO,0.52734375,47.4826388888889,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-09,2024-09-11,0,upstage/solar-pro-preview-instruct,mit,439,22.14,1.7417631529201 diff --git a/csv/merged.csv b/csv/merged.csv index 9d45837..9b88679 100644 --- a/csv/merged.csv +++ b/csv/merged.csv @@ -6,10 +6,10 @@ dolly-v2-12b,databricks/dolly-v2-12b_bfloat16_19308160448536e378e3db21a73a751579 gemma-1.1-2b-it,google/gemma-1.1-2b-it_bfloat16_bf4924f313df5166dee1467161e886e55f2eb4d4_True,google/gemma-1.1-2b-it,bf4924f313df5166dee1467161e886e55f2eb4d4,bfloat16,chatmodels,Original,GemmaForCausalLM,7.77643528435205,TRUE,IFEval,0.306748316688608,30.6748316688608,BBH,0.318463497481492,5.86282672277435,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.269295302013423,2.57270693512304,MUSR,0.339395833333333,2.02447916666667,MMLU-PRO,0.148354388297872,5.3727098108747,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-2b-it,gemma,154,2.506,0.32921478142276,162,152,Gemma-1.1-2b-it,1021,+5/-5,11352,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it gemma-1.1-7b-it,google/gemma-1.1-7b-it_bfloat16_16128b0aeb50762ea96430c0c06a37941bf9f274_True,google/gemma-1.1-7b-it,16128b0aeb50762ea96430c0c06a37941bf9f274,bfloat16,chatmodels,Original,GemmaForCausalLM,17.4795862430713,TRUE,IFEval,0.503910734628563,50.3910734628563,BBH,0.393529796283325,15.9342093850132,MATH Level 5,0.0362537764350453,3.62537764350453,GPQA,0.293624161073826,5.8165548098434,MUSR,0.423020833333333,11.5109375,MMLU-PRO,0.258394281914894,17.5993646572104,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-7b-it,gemma,267,8.538,0.578299189963354,129,121,Gemma-1.1-7B-it,1084,+3/-4,25062,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it gemma-2-27b-it,google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,495,27.227,4.82621118669274,52,46,Gemma-2-27B-it,1220,+3/-3,70811,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-27b-it -gemma-2-2b-it,google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,860,2.614,1.23474327420585,97,113,Gemma-2-2b-it,1142,+3/-3,40232,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it -gemma-2-9b-it,google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,616,9,5.01449702077493,73,69,Gemma-2-9B-it,1191,+4/-3,48642,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it +gemma-2-2b-it,google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,862,2.614,1.23474327420585,97,113,Gemma-2-2b-it,1142,+3/-3,40232,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it +gemma-2-9b-it,google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,617,9,5.01449702077493,73,69,Gemma-2-9B-it,1191,+4/-3,48642,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it gemma-2-9b-it-simpo,princeton-nlp/gemma-2-9b-it-SimPO_bfloat16_8c87091f412e3aa6f74f66bd86c57fb81cbc3fde_True,princeton-nlp/gemma-2-9b-it-SimPO,8c87091f412e3aa6f74f66bd86c57fb81cbc3fde,bfloat16,chatmodels,Original,Gemma2ForCausalLM,21.1616516275693,TRUE,IFEval,0.320685780396016,32.0685780396016,BBH,0.583917992316212,40.0934299163717,MATH Level 5,0,0,GPQA,0.335570469798658,11.4093959731544,MUSR,0.412322916666667,10.3403645833333,MMLU-PRO,0.397523271276596,33.0581412529551,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-08-10,2,google/gemma-2-9b,mit,140,9.242,2.76900372425403,53,46,Gemma-2-9B-it-SimPO,1216,+5/-6,10555,Princeton,MIT,2024/7,https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO -gemma-2b-it,google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,692,2.506,0.352950331047759,170,168,Gemma-2B-it,989,+7/-10,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +gemma-2b-it,google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,693,2.506,0.352950331047759,170,168,Gemma-2B-it,989,+7/-10,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it gemma-7b-it,google/gemma-7b-it_bfloat16_18329f019fb74ca4b24f97371785268543d687d2_True,google/gemma-7b-it,18329f019fb74ca4b24f97371785268543d687d2,bfloat16,chatmodels,Original,GemmaForCausalLM,12.8681419014102,TRUE,IFEval,0.386832493339894,38.6832493339894,BBH,0.364558292227017,11.8800913445494,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.284395973154362,4.58612975391499,MUSR,0.427427083333333,12.5283854166667,MMLU-PRO,0.169464760638298,7.71830673758865,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-13,2024-06-12,1,google/gemma-7b,gemma,1148,8.538,1.0999544452693,151,147,Gemma-7B-it,1037,+7/-6,9177,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it granite-3.0-2b-instruct,ibm-granite/granite-3.0-2b-instruct_bfloat16_342f92f4a0b4d6d83c0b61dc6c122e253a4efebd_True,ibm-granite/granite-3.0-2b-instruct,342f92f4a0b4d6d83c0b61dc6c122e253a4efebd,bfloat16,chatmodels,Original,GraniteForCausalLM,18.3205664133779,TRUE,IFEval,0.513977357854936,51.3977357854936,BBH,0.441197720626303,21.7378914109024,MATH Level 5,0.0876132930513595,8.76132930513595,GPQA,0.299496644295302,6.59955257270694,MUSR,0.351489583333333,1.26953125,MMLU-PRO,0.281416223404255,20.1573581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,"",1,ibm-granite/granite-3.0-2b-instruct (Merge),apache-2.0,47,2.634,1.01894808156813,132,127,Granite-3.0-2B-Instruct,1074,+8/-7,7195,IBM,Apache 2.0,Unknown,https://huggingface.co/ibm-granite/granite-3.0-2b-instruct granite-3.0-8b-instruct,ibm-granite/granite-3.0-8b-instruct_bfloat16_e0a466fb25b9e07e9c2dc93380a360189700d1f8_True,ibm-granite/granite-3.0-8b-instruct,e0a466fb25b9e07e9c2dc93380a360189700d1f8,bfloat16,chatmodels,Original,GraniteForCausalLM,23.8640332348529,TRUE,IFEval,0.530963399335984,53.0963399335984,BBH,0.519187463184023,31.5881590647151,MATH Level 5,0.132175226586103,13.2175226586103,GPQA,0.332214765100671,10.9619686800895,MUSR,0.3900625,7.02447916666667,MMLU-PRO,0.345661569148936,27.2957299054374,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,2024-10-20,1,ibm-granite/granite-3.0-8b-instruct (Merge),apache-2.0,198,8.171,1.7129925870079,120,113,Granite-3.0-8B-Instruct,1093,+7/-5,7003,IBM,Apache 2.0,Unknown,https://huggingface.co/ibm-granite/granite-3.0-8b-instruct @@ -19,20 +19,20 @@ llama-3.1-tulu-3-70b,allenai/Llama-3.1-Tulu-3-70B_bfloat16_c4280450c0cd91a2fb6f4 llama-3.1-tulu-3-70b,allenai/Llama-3.1-Tulu-3-70B_float16_c4280450c0cd91a2fb6f41a25c6a1662c6966b01_True,allenai/Llama-3.1-Tulu-3-70B,c4280450c0cd91a2fb6f41a25c6a1662c6966b01,float16,chatmodels,Original,LlamaForCausalLM,41.4545274065984,TRUE,IFEval,0.837934458348294,83.7934458348294,BBH,0.615684716955611,45.259480995205,MATH Level 5,0.382930513595166,38.2930513595166,GPQA,0.373322147651007,16.4429530201342,MUSR,0.498802083333333,24.3169270833333,MMLU-PRO,0.465591755319149,40.6213061465721,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B (Merge),llama3.1,44,70.554,38.022026223354,34,40,Llama-3.1-Tulu-3-70B,1245,+11/-12,2054,Ai2,Llama 3.1,Unknown,https://huggingface.co/allenai/Llama-3.1-Tulu-3-70B llama-3.1-tulu-3-8b,allenai/Llama-3.1-Tulu-3-8B_bfloat16_63b75e0dd6eac3725319f869716b9b70c16a6a65_True,allenai/Llama-3.1-Tulu-3-8B,63b75e0dd6eac3725319f869716b9b70c16a6a65,bfloat16,chatmodels,Original,LlamaForCausalLM,26.0349980816721,TRUE,IFEval,0.826668794354535,82.6668794354535,BBH,0.404983310273191,16.671812993248,MATH Level 5,0.196374622356495,19.6374622356495,GPQA,0.298657718120805,6.48769574944072,MUSR,0.41746875,10.4502604166667,MMLU-PRO,0.28266289893617,20.2958776595745,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-21,1,allenai/Llama-3.1-Tulu-3-8B (Merge),llama3.1,115,8.03,0.703774148994329,71,82,Llama-3.1-Tulu-3-8B,1188,+10/-13,2040,Ai2,Llama 3.1,Unknown,https://huggingface.co/allenai/Llama-3.1-Tulu-3-8B llama-3.1-tulu-3-8b,allenai/Llama-3.1-Tulu-3-8B_float16_50fef8756a9a4ca2010587d128aebb3a18ec897d_True,allenai/Llama-3.1-Tulu-3-8B,50fef8756a9a4ca2010587d128aebb3a18ec897d,float16,chatmodels,Original,LlamaForCausalLM,25.8832245109219,TRUE,IFEval,0.825469753587149,82.5469753587149,BBH,0.40608256120952,16.8580520694028,MATH Level 5,0.188821752265861,18.8821752265861,GPQA,0.296979865771812,6.26398210290828,MUSR,0.41746875,10.5169270833333,MMLU-PRO,0.282081117021277,20.2312352245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-28,1,allenai/Llama-3.1-Tulu-3-8B (Merge),llama3.1,115,8.03,0.701232116583257,71,82,Llama-3.1-Tulu-3-8B,1188,+10/-13,2040,Ai2,Llama 3.1,Unknown,https://huggingface.co/allenai/Llama-3.1-Tulu-3-8B -llama-3.3-70b-instruct,meta-llama/Llama-3.3-70B-Instruct_bfloat16__True,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,chatmodels,Original,LlamaForCausalLM,36.8288410384085,TRUE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-03,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1579,70.554,38.2795370537265,31,23,Llama-3.3-70B-Instruct,1256,+5/-6,12451,Meta,Llama-3.3,Unknown,https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct -meta-llama-3.1-70b-instruct,meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,768,70.554,26.8020157168701,37,43,Meta-Llama-3.1-70B-Instruct,1248,+3/-3,58806,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -meta-llama-3.1-8b-instruct,meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3418,8.03,2.48701186834409,78,103,Meta-Llama-3.1-8B-Instruct,1176,+3/-3,52649,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +llama-3.3-70b-instruct,meta-llama/Llama-3.3-70B-Instruct_bfloat16__True,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,chatmodels,Original,LlamaForCausalLM,36.8288410384085,TRUE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-03,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1592,70.554,38.2795370537265,31,23,Llama-3.3-70B-Instruct,1256,+5/-6,12451,Meta,Llama-3.3,Unknown,https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct +meta-llama-3.1-70b-instruct,meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,769,70.554,26.8020157168701,37,43,Meta-Llama-3.1-70B-Instruct,1248,+3/-3,58806,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +meta-llama-3.1-8b-instruct,meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3423,8.03,2.48701186834409,78,103,Meta-Llama-3.1-8B-Instruct,1176,+3/-3,52649,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ mistral-7b-instruct-v0.1,mistralai/Mistral-7B-Instruct-v0.1_bfloat16_73068f3702d050a2fd5aa2ca1e612e5036429398_True,mistralai/Mistral-7B-Instruct-v0.1,73068f3702d050a2fd5aa2ca1e612e5036429398,bfloat16,chatmodels,Original,MistralForCausalLM,12.6957006941243,TRUE,IFEval,0.448706099815157,44.8706099815157,BBH,0.33548084759811,7.64702053582754,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.25,0,MUSR,0.384760416666667,6.12838541666667,MMLU-PRO,0.241439494680851,15.7154994089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-27,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,1544,7.242,1.21604471748007,165,163,Mistral-7B-Instruct-v0.1,1008,+5/-6,9145,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 mistral-7b-instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2610,7.242,0.534406629050985,134,138,Mistral-7B-Instruct-v0.2,1072,+4/-4,20054,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 mixtral-8x22b-instruct-v0.1,mistralai/Mixtral-8x22B-Instruct-v0.1_bfloat16_b0c3516041d014f640267b14feb4e9a84c8e8c71_True,mistralai/Mixtral-8x22B-Instruct-v0.1,b0c3516041d014f640267b14feb4e9a84c8e8c71,bfloat16,chatmodels,Original,MixtralForCausalLM,33.885680288082,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.612492492627202,44.1143455872484,MATH Level 5,0.187311178247734,18.7311178247734,GPQA,0.373322147651007,16.4429530201342,MUSR,0.431114583333333,13.4893229166667,MMLU-PRO,0.448304521276596,38.7005023640662,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,1,mistralai/Mixtral-8x22B-v0.1,apache-2.0,699,140.621,47.147578592378,95,89,Mixtral-8x22b-Instruct-v0.1,1148,+3/-3,53792,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -mixtral-8x7b-instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4260,46.703,13.7649393661468,112,113,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76131,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mixtral-8x7b-instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4264,46.703,13.7649393661468,112,113,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76131,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ nous-hermes-2-mixtral-8x7b-dpo,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO_bfloat16_286ae6737d048ad1d965c2e830864df02db50f2f_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,286ae6737d048ad1d965c2e830864df02db50f2f,bfloat16,chatmodels,Original,MixtralForCausalLM,27.290249854483,TRUE,IFEval,0.58968980083955,58.968980083955,BBH,0.553885138403382,37.1077837913399,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.321308724832215,9.50782997762864,MUSR,0.459541666666667,16.6760416666667,MMLU-PRO,0.366605718085106,29.6228575650118,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-11,2024-07-27,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,420,46.703,12.8651437241499,125,133,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+9/-7,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO openchat-3.5-0106,openchat/openchat-3.5-0106_bfloat16_ff058fda49726ecf4ea53dc1635f917cdb8ba36b_True,openchat/openchat-3.5-0106,ff058fda49726ecf4ea53dc1635f917cdb8ba36b,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,22.6586834330757,TRUE,IFEval,0.595135351977198,59.5135351977198,BBH,0.461697870839606,24.0387112139116,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.307885906040268,7.71812080536913,MUSR,0.4254375,11.7463541666667,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-07,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,348,7.242,2.35495886433684,122,118,OpenChat-3.5-0106,1092,+6/-5,12984,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 openhermes-2.5-mistral-7b,teknium/OpenHermes-2.5-Mistral-7B_bfloat16_24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33_True,teknium/OpenHermes-2.5-Mistral-7B,24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33,bfloat16,chatmodels,Original,MistralForCausalLM,21.2668365601522,TRUE,IFEval,0.557141717310071,55.7141717310071,BBH,0.487001325992498,27.7700263678076,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.283557046979866,4.47427293064877,MUSR,0.424197916666667,12.0580729166667,MMLU-PRO,0.305435505319149,22.8261672576832,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-29,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,821,7.242,0.472783300310566,131,122,OpenHermes-2.5-Mistral-7B,1074,+9/-8,5087,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B phi-3-medium-4k-instruct,microsoft/Phi-3-medium-4k-instruct_bfloat16_d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc_True,microsoft/Phi-3-medium-4k-instruct,d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc,bfloat16,chatmodels,Original,Phi3ForCausalLM,32.8962495702928,TRUE,IFEval,0.642271395452954,64.2271395452954,BBH,0.641246489055555,49.3806100742202,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.336409395973154,11.5212527964206,MUSR,0.42575,13.0520833333333,MMLU-PRO,0.467586436170213,40.8429373522459,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-12,0,microsoft/Phi-3-medium-4k-instruct,mit,215,13.96,1.45526252332937,106,112,Phi-3-Medium-4k-Instruct,1123,+4/-4,26106,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct phi-3-mini-128k-instruct,microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1626,3.821,24.2222515926888,151,148,Phi-3-Mini-128k-Instruct,1037,+5/-3,21620,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1110,3.821,0.804074829912372,137,144,Phi-3-Mini-4k-Instruct,1066,+4/-5,21090,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1110,3.821,0.786699265454341,137,144,Phi-3-Mini-4k-Instruct,1066,+4/-5,21090,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1112,3.821,0.804074829912372,137,144,Phi-3-Mini-4k-Instruct,1066,+4/-5,21090,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1112,3.821,0.786699265454341,137,144,Phi-3-Mini-4k-Instruct,1066,+4/-5,21090,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct phi-3-mini-4k-instruct,unsloth/Phi-3-mini-4k-instruct_float16_636c707430a5509c80b1aa51d05c127ed339a975_True,unsloth/Phi-3-mini-4k-instruct,636c707430a5509c80b1aa51d05c127ed339a975,float16,basemergesandmoerges,Original,MistralForCausalLM,27.1783743374799,TRUE,IFEval,0.544027624480822,54.4027624480822,BBH,0.550023946744103,36.732473265614,MATH Level 5,0.154078549848943,15.4078549848943,GPQA,0.322986577181208,9.73154362416107,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.403091755319149,33.6768617021277,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-11-25,0,unsloth/Phi-3-mini-4k-instruct,mit,41,3.821,0.469533108024419,137,144,Phi-3-Mini-4k-Instruct,1066,+4/-5,21090,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct phi-3-small-8k-instruct,microsoft/Phi-3-small-8k-instruct_bfloat16_1535ae26fb4faada95c6950e8bc6e867cdad6b00_True,microsoft/Phi-3-small-8k-instruct,1535ae26fb4faada95c6950e8bc6e867cdad6b00,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,29.6709218521057,TRUE,IFEval,0.649665110794913,64.9665110794913,BBH,0.620836488087056,46.2055703663891,MATH Level 5,0.0284301430770108,2.84301430770108,GPQA,0.312080536912752,8.27740492170022,MUSR,0.455791666666667,16.7739583333333,MMLU-PRO,0.45063164893617,38.9590721040189,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-8k-instruct,mit,159,7.392,1.0254536035218,116,121,Phi-3-Small-8k-Instruct,1102,+4/-5,18479,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct qwen1.5-110b-chat,Qwen/Qwen1.5-110B-Chat_bfloat16_85f86cec25901f2dbd870a86e06756903c9a876a_True,Qwen/Qwen1.5-110B-Chat,85f86cec25901f2dbd870a86e06756903c9a876a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,29.2248366843256,TRUE,IFEval,0.593886443525402,59.3886443525402,BBH,0.618380038558863,44.9845452561663,MATH Level 5,0,0,GPQA,0.341442953020134,12.1923937360179,MUSR,0.452166666666667,16.2875,MMLU-PRO,0.482463430851064,42.4959367612293,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-25,2024-06-12,0,Qwen/Qwen1.5-110B-Chat,other,123,111.21,72.5652930561157,89,82,Qwen1.5-110B-Chat,1162,+3/-4,27470,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ @@ -41,9 +41,9 @@ qwen1.5-32b-chat,Qwen/Qwen1.5-32B-Chat_bfloat16_0997b012af6ddd5465d40465a8415535 qwen1.5-4b-chat,Qwen/Qwen1.5-4B-Chat_bfloat16_a7a4d4945d28bac955554c9abd2f74a71ebbf22f_True,Qwen/Qwen1.5-4B-Chat,a7a4d4945d28bac955554c9abd2f74a71ebbf22f,bfloat16,chatmodels,Original,Qwen2ForCausalLM,12.3377534239841,TRUE,IFEval,0.315665766832006,31.5665766832006,BBH,0.400554856114861,16.2970785289083,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.266778523489933,2.23713646532438,MUSR,0.39778125,7.35598958333333,MMLU-PRO,0.239611037234043,15.5123374704492,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-4B-Chat,other,38,3.95,0.866150647838799,170,166,Qwen1.5-4B-Chat,988,+7/-6,7811,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ qwen1.5-7b-chat,Qwen/Qwen1.5-7B-Chat_bfloat16_5f4f5e69ac7f1d508f8369e977de208b4803444b_True,Qwen/Qwen1.5-7B-Chat,5f4f5e69ac7f1d508f8369e977de208b4803444b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,16.5761729315825,TRUE,IFEval,0.437115741787347,43.7115741787347,BBH,0.451005311652135,22.3791295999528,MATH Level 5,0,0,GPQA,0.302852348993289,7.04697986577182,MUSR,0.37790625,4.63828125,MMLU-PRO,0.295129654255319,21.6810726950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-7B-Chat,other,164,7.721,1.07882659669136,132,138,Qwen1.5-7B-Chat,1070,+10/-9,4869,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ qwen2-72b-instruct,Qwen/Qwen2-72B-Instruct_bfloat16_1af63c698f59c4235668ec9c1395468cb7cd7e79_False,Qwen/Qwen2-72B-Instruct,1af63c698f59c4235668ec9c1395468cb7cd7e79,bfloat16,chatmodels,Original,Qwen2ForCausalLM,42.9143041555209,FALSE,IFEval,0.7989168738946,79.89168738946,BBH,0.697730968386067,57.483009118763,MATH Level 5,0.376888217522659,37.6888217522659,GPQA,0.37248322147651,16.331096196868,MUSR,0.456010416666667,17.16796875,MMLU-PRO,0.540309175531915,48.9232417257683,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-28,2024-06-26,1,Qwen/Qwen2-72B,other,694,72.706,37.5539744227,74,66,Qwen2-72B-Instruct,1187,+3/-3,38884,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ -qwen2.5-72b-instruct,Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,667,72.706,33.0067683243991,31,38,Qwen2.5-72B-Instruct,1258,+4/-3,38466,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ -qwen2.5-coder-32b-instruct,Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1442,32.764,4.69438966297979,52,56,Qwen2.5-Coder-32B-Instruct,1217,+7/-6,5725,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct -qwq-32b-preview,Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1528,32.764,10.2103897762396,90,123,QwQ-32B-Preview,1154,+7/-10,3420,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/QwQ-32B-Preview +qwen2.5-72b-instruct,Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,668,72.706,33.0067683243991,31,38,Qwen2.5-72B-Instruct,1258,+4/-3,38466,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ +qwen2.5-coder-32b-instruct,Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1451,32.764,4.69438966297979,52,56,Qwen2.5-Coder-32B-Instruct,1217,+7/-6,5725,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct +qwq-32b-preview,Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1535,32.764,10.2103897762396,90,123,QwQ-32B-Preview,1154,+7/-10,3420,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/QwQ-32B-Preview smollm2-1.7b-instruct,HuggingFaceTB/SmolLM2-1.7B-Instruct_bfloat16_d1bb90bcfbe0f211109880f4da18da66f229c4f6_True,HuggingFaceTB/SmolLM2-1.7B-Instruct,d1bb90bcfbe0f211109880f4da18da66f229c4f6,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7453390971056,TRUE,IFEval,0.536783512192095,53.6783512192095,BBH,0.359861753141516,10.9179892262081,MATH Level 5,0.0415407854984894,4.15407854984894,GPQA,0.279362416107383,3.91498881431767,MUSR,0.342125,4.09895833333334,MMLU-PRO,0.205369015957447,11.7076684397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-1.7B-Instruct (Merge),apache-2.0,465,1.711,0.63234061656892,143,143,SmolLM2-1.7B-Instruct,1047,+14/-11,2379,HuggingFace,Apache 2.0,Unknown,https://huggingface.co/HuggingFaceTB/SmolLM2-1.7B-Instruct solar-10.7b-instruct-v1.0,upstage/SOLAR-10.7B-Instruct-v1.0_float16_c08c25ed66414a878fe0401a3596d536c083606c_True,upstage/SOLAR-10.7B-Instruct-v1.0,c08c25ed66414a878fe0401a3596d536c083606c,float16,chatmodels,Original,LlamaForCausalLM,19.6282553318946,TRUE,IFEval,0.473660997265035,47.3660997265035,BBH,0.516249494144699,31.8724018880021,MATH Level 5,0,0,GPQA,0.308724832214765,7.82997762863535,MUSR,0.3899375,6.9421875,MMLU-PRO,0.313829787234043,23.7588652482269,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,1,upstage/SOLAR-10.7B-Instruct-v1.0 (Merge),cc-by-nc-4.0,619,10.732,0.782775785638588,136,138,SOLAR-10.7B-Instruct-v1.0,1062,+8/-8,4288,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 starling-lm-7b-alpha,berkeley-nest/Starling-LM-7B-alpha_bfloat16_1dddf3b95bc1391f6307299eb1c162c194bde9bd_True,berkeley-nest/Starling-LM-7B-alpha,1dddf3b95bc1391f6307299eb1c162c194bde9bd,bfloat16,chatmodels,Original,MistralForCausalLM,20.8267729304501,TRUE,IFEval,0.548049176185854,54.8049176185854,BBH,0.4440065261164,21.9540280871593,MATH Level 5,0.0830815709969789,8.30815709969789,GPQA,0.296979865771812,6.26398210290828,MUSR,0.412010416666667,9.50130208333333,MMLU-PRO,0.317154255319149,24.1282505910166,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-25,2024-06-12,0,berkeley-nest/Starling-LM-7B-alpha,apache-2.0,558,7.242,0.551628886692049,125,130,Starling-LM-7B-alpha,1088,+6/-6,10416,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha