diff --git a/csv/huggingface_v2.csv b/csv/huggingface_v2.csv index 0cf551d..d609e42 100644 --- a/csv/huggingface_v2.csv +++ b/csv/huggingface_v2.csv @@ -44,7 +44,7 @@ Aashraf995/Gemma-Evo-10B_float16_5ec9c5763ca6662dd897cd292e08014ec10b0d74_False, Aashraf995/Qwen-Evo-7B_bfloat16_641aac3f105805414efe0a55b18736dce73da0a0_False,Aashraf995/Qwen-Evo-7B,641aac3f105805414efe0a55b18736dce73da0a0,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,30.0358843631694,FALSE,IFEval,0.475734384765755,47.5734384765755,BBH,0.570936153859028,38.5853269905061,MATH Level 5,0.299848942598187,29.9848942598187,GPQA,0.325503355704698,10.0671140939597,MUSR,0.454145833333333,15.5348958333333,MMLU-PRO,0.446226728723404,38.4696365248227,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-13,2024-12-13,1,Aashraf995/Qwen-Evo-7B (Merge),apache-2.0,1,7,0.634007609969498 Aashraf995/QwenStock-14B_float16_b91871dcd31fe2e445c233a449d021b47ebfe1fb_False,Aashraf995/QwenStock-14B,b91871dcd31fe2e445c233a449d021b47ebfe1fb,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.7397897181765,FALSE,IFEval,0.500863265025687,50.0863265025688,BBH,0.655013034810801,50.4338987071688,MATH Level 5,0.333836858006042,33.3836858006042,GPQA,0.389261744966443,18.5682326621924,MUSR,0.479260416666667,19.27421875,MMLU-PRO,0.538231382978723,48.6923758865248,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-13,2024-12-13,1,Aashraf995/QwenStock-14B (Merge),apache-2.0,1,14,1.87494565293633 AbacusResearch/Jallabi-34B_float16_f65696da4ed82c9a20e94b200d9dccffa07af682_False,AbacusResearch/Jallabi-34B,f65696da4ed82c9a20e94b200d9dccffa07af682,float16,basemergesandmoerges,Original,LlamaForCausalLM,25.9720839348152,FALSE,IFEval,0.352860410377798,35.2860410377798,BBH,0.602338060319627,43.6157649871951,MATH Level 5,0.0392749244712991,3.92749244712991,GPQA,0.338926174496644,11.8568232662192,MUSR,0.482177083333333,20.2388020833333,MMLU-PRO,0.468168218085106,40.907579787234,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-01,2024-06-27,0,AbacusResearch/Jallabi-34B,apache-2.0,2,34.389,3.28649233978473 -Alibaba-NLP/gte-Qwen2-7B-instruct_bfloat16_e26182b2122f4435e8b3ebecbf363990f409b45b_True,Alibaba-NLP/gte-Qwen2-7B-instruct,e26182b2122f4435e8b3ebecbf363990f409b45b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,13.4061800867193,TRUE,IFEval,0.225540454881936,22.5540454881936,BBH,0.449514499081847,21.9254824856624,MATH Level 5,0.0385196374622357,3.85196374622357,GPQA,0.24496644295302,0,MUSR,0.355854166666667,6.31510416666667,MMLU-PRO,0.332114361702128,25.7904846335697,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-15,2024-08-05,0,Alibaba-NLP/gte-Qwen2-7B-instruct,apache-2.0,237,7.613,2.17211334857993 +Alibaba-NLP/gte-Qwen2-7B-instruct_bfloat16_e26182b2122f4435e8b3ebecbf363990f409b45b_True,Alibaba-NLP/gte-Qwen2-7B-instruct,e26182b2122f4435e8b3ebecbf363990f409b45b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,13.4061800867193,TRUE,IFEval,0.225540454881936,22.5540454881936,BBH,0.449514499081847,21.9254824856624,MATH Level 5,0.0385196374622357,3.85196374622357,GPQA,0.24496644295302,0,MUSR,0.355854166666667,6.31510416666667,MMLU-PRO,0.332114361702128,25.7904846335697,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-15,2024-08-05,0,Alibaba-NLP/gte-Qwen2-7B-instruct,apache-2.0,238,7.613,2.17211334857993 Alsebay/Qwen2.5-7B-test-novelist_float16_89f34e5e67378dc38ce0da19d347ea26c23fbca5_False,Alsebay/Qwen2.5-7B-test-novelist,89f34e5e67378dc38ce0da19d347ea26c23fbca5,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,25.9392136516748,FALSE,IFEval,0.535160042021835,53.5160042021835,BBH,0.515121518446605,30.417500036353,MATH Level 5,0.160876132930514,16.0876132930514,GPQA,0.291107382550336,5.48098434004475,MUSR,0.474885416666667,18.2940104166667,MMLU-PRO,0.386552526595745,31.8391696217494,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2024-12-12,3,Qwen/Qwen2.5-7B,apache-2.0,1,7,0.667192826185036 ArliAI/ArliAI-RPMax-12B-v1.1_bfloat16_645db1cf8ad952eb57854a133e8e15303b898b04_True,ArliAI/ArliAI-RPMax-12B-v1.1,645db1cf8ad952eb57854a133e8e15303b898b04,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,20.8126943934558,TRUE,IFEval,0.534885215672194,53.4885215672194,BBH,0.475181760840119,24.8090633179328,MATH Level 5,0.102719033232628,10.2719033232628,GPQA,0.281879194630873,4.25055928411633,MUSR,0.36184375,5.56380208333334,MMLU-PRO,0.33843085106383,26.49231678487,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-31,2024-09-05,0,ArliAI/ArliAI-RPMax-12B-v1.1,apache-2.0,41,12.248,1.83340230532795 ArliAI/Llama-3.1-8B-ArliAI-RPMax-v1.1_bfloat16_540bd352e59c63900af91b95a932b33aaee70c76_True,ArliAI/Llama-3.1-8B-ArliAI-RPMax-v1.1,540bd352e59c63900af91b95a932b33aaee70c76,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.9169670346878,TRUE,IFEval,0.635901629897561,63.5901629897561,BBH,0.501561345603908,28.7870140994428,MATH Level 5,0.129909365558912,12.9909365558912,GPQA,0.283557046979866,4.47427293064877,MUSR,0.3576875,5.3109375,MMLU-PRO,0.355136303191489,28.3484781323877,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-23,2024-09-19,0,ArliAI/Llama-3.1-8B-ArliAI-RPMax-v1.1,llama3,28,8.03,0.892744758538456 @@ -62,7 +62,7 @@ Azure99/blossom-v5-32b_bfloat16_ccd4d86e3de01187043683dea1e28df904f7408e_True,Az Azure99/blossom-v5-llama3-8b_bfloat16_91ea35e2e65516988021e4bb3b908e3e497e05c2_True,Azure99/blossom-v5-llama3-8b,91ea35e2e65516988021e4bb3b908e3e497e05c2,bfloat16,chatmodels,Original,LlamaForCausalLM,14.4730816408212,TRUE,IFEval,0.434293230849701,43.4293230849701,BBH,0.418490919708726,18.3065354056184,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.26510067114094,2.01342281879195,MUSR,0.367020833333333,5.3109375,MMLU-PRO,0.220578457446809,13.3976063829787,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-20,2024-09-21,0,Azure99/blossom-v5-llama3-8b,apache-2.0,4,8.03,0.872152892744747 Azure99/blossom-v5.1-34b_bfloat16_2c803204f5dbf4ce37e2df98eb0205cdc53de10d_True,Azure99/blossom-v5.1-34b,2c803204f5dbf4ce37e2df98eb0205cdc53de10d,bfloat16,chatmodels,Original,LlamaForCausalLM,28.5992859205074,TRUE,IFEval,0.569656289755626,56.9656289755626,BBH,0.610911009661116,44.1477045883846,MATH Level 5,0.157099697885196,15.7099697885196,GPQA,0.309563758389262,7.94183445190157,MUSR,0.392791666666667,7.29895833333333,MMLU-PRO,0.455784574468085,39.5316193853428,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-19,2024-07-27,0,Azure99/blossom-v5.1-34b,apache-2.0,5,34.389,9.59148345680845 Azure99/blossom-v5.1-9b_bfloat16_6044a3dc1e04529fe883aa513d37f266a320d793_True,Azure99/blossom-v5.1-9b,6044a3dc1e04529fe883aa513d37f266a320d793,bfloat16,chatmodels,Original,LlamaForCausalLM,24.8715035717806,TRUE,IFEval,0.508581674401699,50.8581674401699,BBH,0.534329237791637,34.2012444903117,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.335570469798658,11.4093959731544,MUSR,0.399395833333333,8.02447916666667,MMLU-PRO,0.397938829787234,33.1043144208038,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-15,2024-07-24,0,Azure99/blossom-v5.1-9b,apache-2.0,2,8.829,2.2157204712429 -BAAI/Gemma2-9B-IT-Simpo-Infinity-Preference_bfloat16_028a91b1a4f14d365c6db08093b03348455c7bad_True,BAAI/Gemma2-9B-IT-Simpo-Infinity-Preference,028a91b1a4f14d365c6db08093b03348455c7bad,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,20.9840685500934,TRUE,IFEval,0.31763831079314,31.763831079314,BBH,0.597945966423006,42.1908440590662,MATH Level 5,0,0,GPQA,0.339765100671141,11.9686800894855,MUSR,0.396572916666667,8.10494791666667,MMLU-PRO,0.386884973404255,31.8761081560284,FALSE,FALSE,FALSE,FALSE,FALSE,2024-08-28,2024-09-05,2,google/gemma-2-9b,"",15,9.242,5.86346048215024 +BAAI/Gemma2-9B-IT-Simpo-Infinity-Preference_bfloat16_028a91b1a4f14d365c6db08093b03348455c7bad_True,BAAI/Gemma2-9B-IT-Simpo-Infinity-Preference,028a91b1a4f14d365c6db08093b03348455c7bad,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,20.9840685500934,TRUE,IFEval,0.31763831079314,31.763831079314,BBH,0.597945966423006,42.1908440590662,MATH Level 5,0,0,GPQA,0.339765100671141,11.9686800894855,MUSR,0.396572916666667,8.10494791666667,MMLU-PRO,0.386884973404255,31.8761081560284,FALSE,FALSE,FALSE,FALSE,FALSE,2024-08-28,2024-09-05,2,google/gemma-2-9b,"",16,9.242,5.86346048215024 BAAI/Infinity-Instruct-3M-0613-Llama3-70B_bfloat16_9fc53668064bdda22975ca72c5a287f8241c95b3_True,BAAI/Infinity-Instruct-3M-0613-Llama3-70B,9fc53668064bdda22975ca72c5a287f8241c95b3,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,34.697074731983,TRUE,IFEval,0.682113458955571,68.2113458955571,BBH,0.66416144843486,51.3271609825221,MATH Level 5,0.16238670694864,16.238670694864,GPQA,0.358221476510067,14.4295302013423,MUSR,0.452260416666667,16.5325520833333,MMLU-PRO,0.472988696808511,41.443188534279,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-27,2024-06-28,0,BAAI/Infinity-Instruct-3M-0613-Llama3-70B,apache-2.0,5,70.554,10.5269069674078 BAAI/Infinity-Instruct-3M-0613-Mistral-7B_bfloat16_c7a742e539ec264b9eaeefe2aed29e92e8a7ebd6_True,BAAI/Infinity-Instruct-3M-0613-Mistral-7B,c7a742e539ec264b9eaeefe2aed29e92e8a7ebd6,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,22.1802369566482,TRUE,IFEval,0.53198734912255,53.198734912255,BBH,0.495823337632589,28.9929364703206,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.296140939597315,6.15212527964205,MUSR,0.435083333333333,13.2520833333333,MMLU-PRO,0.316073803191489,24.0082003546099,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-21,2024-06-27,0,BAAI/Infinity-Instruct-3M-0613-Mistral-7B,apache-2.0,11,7.242,0.949374628745906 BAAI/Infinity-Instruct-3M-0625-Llama3-70B_float16_6d8ceada57e55cff3503191adc4d6379ff321fe2_True,BAAI/Infinity-Instruct-3M-0625-Llama3-70B,6d8ceada57e55cff3503191adc4d6379ff321fe2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,36.1422168425565,TRUE,IFEval,0.744212024096065,74.4212024096065,BBH,0.667033787293025,52.0281616428052,MATH Level 5,0.179003021148036,17.9003021148036,GPQA,0.357382550335571,14.3176733780761,MUSR,0.46165625,18.3403645833333,MMLU-PRO,0.458610372340426,39.8455969267139,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-09,2024-08-30,0,BAAI/Infinity-Instruct-3M-0625-Llama3-70B,apache-2.0,3,70.554,10.4309551406194 @@ -119,14 +119,14 @@ ClaudioItaly/Albacus_bfloat16_a53faf62d0f99b67478ed9d262872c821a3ba83c_False,Cla ClaudioItaly/Book-Gut12B_bfloat16_ae54351faca8170c93bf1de3a51bf16650f5bcf5_False,ClaudioItaly/Book-Gut12B,ae54351faca8170c93bf1de3a51bf16650f5bcf5,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,23.3437456450211,FALSE,IFEval,0.399846850800321,39.9846850800321,BBH,0.541737019444323,34.6321925897331,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.307046979865772,7.60626398210291,MUSR,0.463541666666667,18.2760416666667,MMLU-PRO,0.367021276595745,29.6690307328605,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-12,2024-09-17,1,ClaudioItaly/Book-Gut12B (Merge),mit,1,12.248,1.45224822331955 ClaudioItaly/Evolutionstory-7B-v2.2_bfloat16_9f838721d24a5195bed59a5ed8d9af536f7f2459_False,ClaudioItaly/Evolutionstory-7B-v2.2,9f838721d24a5195bed59a5ed8d9af536f7f2459,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,20.7982472157572,FALSE,IFEval,0.481379406641046,48.1379406641046,BBH,0.510804340656884,31.6238647440248,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.275167785234899,3.35570469798658,MUSR,0.41353125,10.6580729166667,MMLU-PRO,0.315907579787234,23.9897310874705,TRUE,TRUE,FALSE,FALSE,FALSE,2024-08-30,2024-09-01,1,ClaudioItaly/Evolutionstory-7B-v2.2 (Merge),mit,1,7.242,0.560231988335538 ClaudioItaly/intelligence-cod-rag-7b-v3_bfloat16_2b21473c8a086f8d0c54b82c3454bf5499cdde3a_True,ClaudioItaly/intelligence-cod-rag-7b-v3,2b21473c8a086f8d0c54b82c3454bf5499cdde3a,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,27.1290106554156,TRUE,IFEval,0.689782000647172,68.9782000647172,BBH,0.536633971883911,34.7761585394944,MATH Level 5,0.0981873111782477,9.81873111782477,GPQA,0.272651006711409,3.02013422818792,MUSR,0.415270833333333,10.6755208333333,MMLU-PRO,0.419547872340426,35.5053191489362,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-29,2024-12-02,1,ClaudioItaly/intelligence-cod-rag-7b-v3 (Merge),mit,0,7.616,0.660472333052409 -CohereForAI/aya-23-35B_float16_31d6fd858f20539a55401c7ad913086f54d9ca2c_True,CohereForAI/aya-23-35B,31d6fd858f20539a55401c7ad913086f54d9ca2c,float16,chatmodels,Original,CohereForCausalLM,24.6798797460333,TRUE,IFEval,0.646193211789164,64.6193211789164,BBH,0.539955145073127,34.8583604677546,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.294463087248322,5.92841163310962,MUSR,0.430989583333333,13.4736979166667,MMLU-PRO,0.335605053191489,26.1783392434988,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-19,2024-06-12,0,CohereForAI/aya-23-35B,cc-by-nc-4.0,267,34.981,16.9853170194836 +CohereForAI/aya-23-35B_float16_31d6fd858f20539a55401c7ad913086f54d9ca2c_True,CohereForAI/aya-23-35B,31d6fd858f20539a55401c7ad913086f54d9ca2c,float16,chatmodels,Original,CohereForCausalLM,24.6798797460333,TRUE,IFEval,0.646193211789164,64.6193211789164,BBH,0.539955145073127,34.8583604677546,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.294463087248322,5.92841163310962,MUSR,0.430989583333333,13.4736979166667,MMLU-PRO,0.335605053191489,26.1783392434988,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-19,2024-06-12,0,CohereForAI/aya-23-35B,cc-by-nc-4.0,268,34.981,16.9853170194836 CohereForAI/aya-23-8B_float16_ec151d218a24031eb039d92fb83d10445427efc9_True,CohereForAI/aya-23-8B,ec151d218a24031eb039d92fb83d10445427efc9,float16,chatmodels,Original,CohereForCausalLM,15.998395031351,TRUE,IFEval,0.469888783982057,46.9888783982057,BBH,0.429616151922031,20.2037606467394,MATH Level 5,0.0158610271903323,1.58610271903323,GPQA,0.284395973154362,4.58612975391499,MUSR,0.3940625,8.42447916666666,MMLU-PRO,0.227809175531915,14.2010195035461,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-19,2024-06-12,0,CohereForAI/aya-23-8B,cc-by-nc-4.0,396,8.028,1.19517208132096 -CohereForAI/aya-expanse-32b_float16_08b69cfa4240e2009c80ad304f000b491d1b8c38_True,CohereForAI/aya-expanse-32b,08b69cfa4240e2009c80ad304f000b491d1b8c38,float16,chatmodels,Original,CohereForCausalLM,29.3912190893162,TRUE,IFEval,0.730173716849072,73.0173716849072,BBH,0.564867009921211,38.7096114330142,MATH Level 5,0.13368580060423,13.368580060423,GPQA,0.325503355704698,10.0671140939597,MUSR,0.387270833333333,6.40885416666667,MMLU-PRO,0.41298204787234,34.7757830969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-32b,cc-by-nc-4.0,192,32.296,5.5177350999101 -CohereForAI/aya-expanse-8b_float16_b9848575c8731981dfcf2e1f3bfbcb917a2e585d_True,CohereForAI/aya-expanse-8b,b9848575c8731981dfcf2e1f3bfbcb917a2e585d,float16,chatmodels,Original,CohereForCausalLM,22.1422232448213,TRUE,IFEval,0.63585176221315,63.585176221315,BBH,0.497720305573641,28.5234825042885,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.302852348993289,7.04697986577182,MUSR,0.372885416666667,4.41067708333333,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-8b,cc-by-nc-4.0,307,8.028,1.1696890688757 +CohereForAI/aya-expanse-32b_float16_08b69cfa4240e2009c80ad304f000b491d1b8c38_True,CohereForAI/aya-expanse-32b,08b69cfa4240e2009c80ad304f000b491d1b8c38,float16,chatmodels,Original,CohereForCausalLM,29.3912190893162,TRUE,IFEval,0.730173716849072,73.0173716849072,BBH,0.564867009921211,38.7096114330142,MATH Level 5,0.13368580060423,13.368580060423,GPQA,0.325503355704698,10.0671140939597,MUSR,0.387270833333333,6.40885416666667,MMLU-PRO,0.41298204787234,34.7757830969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-32b,cc-by-nc-4.0,195,32.296,5.5177350999101 +CohereForAI/aya-expanse-8b_float16_b9848575c8731981dfcf2e1f3bfbcb917a2e585d_True,CohereForAI/aya-expanse-8b,b9848575c8731981dfcf2e1f3bfbcb917a2e585d,float16,chatmodels,Original,CohereForCausalLM,22.1422232448213,TRUE,IFEval,0.63585176221315,63.585176221315,BBH,0.497720305573641,28.5234825042885,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.302852348993289,7.04697986577182,MUSR,0.372885416666667,4.41067708333333,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-8b,cc-by-nc-4.0,309,8.028,1.1696890688757 CohereForAI/c4ai-command-r-plus_float16_fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca_True,CohereForAI/c4ai-command-r-plus,fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca,float16,chatmodels,Original,CohereForCausalLM,30.961246846254,TRUE,IFEval,0.766418658049531,76.6418658049531,BBH,0.581542357407793,39.9199542314318,MATH Level 5,0.081570996978852,8.1570996978852,GPQA,0.305369127516779,7.38255033557047,MUSR,0.48071875,20.4231770833333,MMLU-PRO,0.399185505319149,33.2428339243499,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-03,2024-06-13,0,CohereForAI/c4ai-command-r-plus,cc-by-nc-4.0,1700,103.811,28.6315317116708 -CohereForAI/c4ai-command-r-plus-08-2024_float16_2d8cf3ab0af78b9e43546486b096f86adf3ba4d0_True,CohereForAI/c4ai-command-r-plus-08-2024,2d8cf3ab0af78b9e43546486b096f86adf3ba4d0,float16,chatmodels,Original,CohereForCausalLM,33.5845340114894,TRUE,IFEval,0.753953953288386,75.3953953288386,BBH,0.599599991302719,42.836865407707,MATH Level 5,0.120090634441088,12.0090634441088,GPQA,0.350671140939597,13.4228187919463,MUSR,0.482947916666667,19.83515625,MMLU-PRO,0.442071143617021,38.0079048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-21,2024-09-19,0,CohereForAI/c4ai-command-r-plus-08-2024,cc-by-nc-4.0,206,103.811,22.3188766676731 +CohereForAI/c4ai-command-r-plus-08-2024_float16_2d8cf3ab0af78b9e43546486b096f86adf3ba4d0_True,CohereForAI/c4ai-command-r-plus-08-2024,2d8cf3ab0af78b9e43546486b096f86adf3ba4d0,float16,chatmodels,Original,CohereForCausalLM,33.5845340114894,TRUE,IFEval,0.753953953288386,75.3953953288386,BBH,0.599599991302719,42.836865407707,MATH Level 5,0.120090634441088,12.0090634441088,GPQA,0.350671140939597,13.4228187919463,MUSR,0.482947916666667,19.83515625,MMLU-PRO,0.442071143617021,38.0079048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-21,2024-09-19,0,CohereForAI/c4ai-command-r-plus-08-2024,cc-by-nc-4.0,207,103.811,22.3188766676731 CohereForAI/c4ai-command-r-v01_float16_16881ccde1c68bbc7041280e6a66637bc46bfe88_True,CohereForAI/c4ai-command-r-v01,16881ccde1c68bbc7041280e6a66637bc46bfe88,float16,chatmodels,Original,CohereForCausalLM,25.3499784613365,TRUE,IFEval,0.674819478982433,67.4819478982433,BBH,0.540641551276786,34.5566592570583,MATH Level 5,0,0,GPQA,0.307046979865772,7.60626398210291,MUSR,0.451697916666667,16.12890625,MMLU-PRO,0.336934840425532,26.3260933806147,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-11,2024-06-13,0,CohereForAI/c4ai-command-r-v01,cc-by-nc-4.0,1070,34.981,13.3954372669898 -CohereForAI/c4ai-command-r7b-12-2024_bfloat16_a9650f3bda8b0e00825ee36592e086b4ee621102_True,CohereForAI/c4ai-command-r7b-12-2024,a9650f3bda8b0e00825ee36592e086b4ee621102,bfloat16,chatmodels,Original,Cohere2ForCausalLM,31.0762402648343,TRUE,IFEval,0.771314556487897,77.1314556487897,BBH,0.550264215185564,36.0245641700103,MATH Level 5,0.266616314199396,26.6616314199396,GPQA,0.308724832214765,7.82997762863535,MUSR,0.412510416666667,10.23046875,MMLU-PRO,0.357214095744681,28.5793439716312,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-20,0,CohereForAI/c4ai-command-r7b-12-2024,cc-by-nc-4.0,306,8.028,2.45480693599537 +CohereForAI/c4ai-command-r7b-12-2024_bfloat16_a9650f3bda8b0e00825ee36592e086b4ee621102_True,CohereForAI/c4ai-command-r7b-12-2024,a9650f3bda8b0e00825ee36592e086b4ee621102,bfloat16,chatmodels,Original,Cohere2ForCausalLM,31.0762402648343,TRUE,IFEval,0.771314556487897,77.1314556487897,BBH,0.550264215185564,36.0245641700103,MATH Level 5,0.266616314199396,26.6616314199396,GPQA,0.308724832214765,7.82997762863535,MUSR,0.412510416666667,10.23046875,MMLU-PRO,0.357214095744681,28.5793439716312,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-20,0,CohereForAI/c4ai-command-r7b-12-2024,cc-by-nc-4.0,311,8.028,2.45480693599537 Columbia-NLP/LION-Gemma-2b-dpo-v1.0_float16_a5f780075831374f8850324448acf94976dea504_True,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,a5f780075831374f8850324448acf94976dea504,float16,chatmodels,Original,GemmaForCausalLM,11.4839947622434,TRUE,IFEval,0.327831265486686,32.7831265486686,BBH,0.391995636132075,14.5859760938158,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.249161073825503,0,MUSR,0.412010416666667,9.83463541666667,MMLU-PRO,0.16655585106383,7.39509456264775,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-04,0,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,"",0,2.506,0.97964847425047 Columbia-NLP/LION-Gemma-2b-dpo-v1.0_bfloat16_a5f780075831374f8850324448acf94976dea504_True,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,a5f780075831374f8850324448acf94976dea504,bfloat16,chatmodels,Original,GemmaForCausalLM,11.1487995452652,TRUE,IFEval,0.310245703621945,31.0245703621945,BBH,0.388103091595545,14.2430456477269,MATH Level 5,0.0468277945619336,4.68277945619336,GPQA,0.253355704697987,0.447427293064876,MUSR,0.408072916666667,9.10911458333334,MMLU-PRO,0.166472739361702,7.38585992907801,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-04,0,Columbia-NLP/LION-Gemma-2b-dpo-v1.0,"",0,2.506,0.99456912017475 Columbia-NLP/LION-Gemma-2b-odpo-v1.0_bfloat16_090d9f59c3b47ab8dd099ddd278c058aa6d2d529_True,Columbia-NLP/LION-Gemma-2b-odpo-v1.0,090d9f59c3b47ab8dd099ddd278c058aa6d2d529,bfloat16,chatmodels,Original,GemmaForCausalLM,11.4567947643227,TRUE,IFEval,0.306648581319787,30.6648581319787,BBH,0.389583621070688,14.0239216654163,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.24244966442953,0,MUSR,0.427916666666667,12.05625,MMLU-PRO,0.169215425531915,7.69060283687943,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-28,2024-07-13,0,Columbia-NLP/LION-Gemma-2b-odpo-v1.0,"",4,2.506,0.962068098338517 @@ -151,7 +151,7 @@ CortexLM/btlm-7b-base-v0.2_bfloat16_eda8b4298365a26c8981316e09427c237b11217f_Fal Cran-May/T.E-8.1_bfloat16_5f84709710dcce7cc05fa12473e8bb207fe25849_True,Cran-May/T.E-8.1,5f84709710dcce7cc05fa12473e8bb207fe25849,bfloat16,chatmodels,Original,Qwen2ForCausalLM,29.4054568316594,TRUE,IFEval,0.707692256545965,70.7692256545965,BBH,0.558175470812389,37.0243766258437,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.312919463087248,8.38926174496644,MUSR,0.450520833333333,15.3151041666667,MMLU-PRO,0.443234707446809,38.1371897163121,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-27,2024-09-29,1,Cran-May/T.E-8.1 (Merge),cc-by-nc-sa-4.0,3,7.616,1.09063280035837 CultriX/Qwen2.5-14B-Broca_bfloat16_51204ee25a629abfd6d5e77a850b5e7a36c78462_False,CultriX/Qwen2.5-14B-Broca,51204ee25a629abfd6d5e77a850b5e7a36c78462,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.7230909019459,FALSE,IFEval,0.560414145578177,56.0414145578177,BBH,0.652714598154036,50.0344117817011,MATH Level 5,0.345921450151057,34.5921450151057,GPQA,0.386744966442953,18.2326621923937,MUSR,0.47665625,18.9486979166667,MMLU-PRO,0.536402925531915,48.4892139479906,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Broca (Merge),"",1,7.383,2.07700146650508 CultriX/Qwen2.5-14B-Brocav3_bfloat16_6f3fe686a79dcbcd5835ca100e194c49f493167b_False,CultriX/Qwen2.5-14B-Brocav3,6f3fe686a79dcbcd5835ca100e194c49f493167b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.7642540094264,FALSE,IFEval,0.695177684100409,69.5177684100409,BBH,0.645235347618276,49.0491117834814,MATH Level 5,0.322507552870091,32.2507552870091,GPQA,0.359060402684564,14.5413870246085,MUSR,0.475635416666667,19.2544270833333,MMLU-PRO,0.531748670212766,47.9720744680851,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav3 (Merge),"",1,7.383,1.8167389899472 -CultriX/Qwen2.5-14B-Brocav6_bfloat16_bd981505b6950df69216b260c3c0d86124fded7b_False,CultriX/Qwen2.5-14B-Brocav6,bd981505b6950df69216b260c3c0d86124fded7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.3175682007454,FALSE,IFEval,0.699523929839493,69.9523929839493,BBH,0.638883526662656,47.819224806074,MATH Level 5,0.29607250755287,29.607250755287,GPQA,0.36744966442953,15.6599552572707,MUSR,0.474208333333333,18.8760416666667,MMLU-PRO,0.531914893617021,47.9905437352246,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav6 (Merge),"",0,7.383,1.7914011355599 +CultriX/Qwen2.5-14B-Brocav6_bfloat16_bd981505b6950df69216b260c3c0d86124fded7b_False,CultriX/Qwen2.5-14B-Brocav6,bd981505b6950df69216b260c3c0d86124fded7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.3175682007454,FALSE,IFEval,0.699523929839493,69.9523929839493,BBH,0.638883526662656,47.819224806074,MATH Level 5,0.29607250755287,29.607250755287,GPQA,0.36744966442953,15.6599552572707,MUSR,0.474208333333333,18.8760416666667,MMLU-PRO,0.531914893617021,47.9905437352246,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav6 (Merge),"",1,7.383,1.7914011355599 CultriX/Qwen2.5-14B-Brocav7_float16_06acee7f6e9796081ced6201001784907c77f96f_False,CultriX/Qwen2.5-14B-Brocav7,06acee7f6e9796081ced6201001784907c77f96f,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,38.5222137472979,FALSE,IFEval,0.67237152976325,67.237152976325,BBH,0.644402698132718,48.9053607833169,MATH Level 5,0.318731117824773,31.8731117824773,GPQA,0.36744966442953,15.6599552572707,MUSR,0.479604166666667,20.1505208333333,MMLU-PRO,0.525764627659575,47.3071808510638,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,CultriX/Qwen2.5-14B-Brocav7 (Merge),"",0,7.383,1.70134942259186 CultriX/Qwen2.5-14B-Emerged_bfloat16_8bf0e31b23ee22858bbde2cee44dde88963f5084_False,CultriX/Qwen2.5-14B-Emerged,8bf0e31b23ee22858bbde2cee44dde88963f5084,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.6626166580798,FALSE,IFEval,0.700023714854364,70.0023714854364,BBH,0.626003368070331,45.9324193686847,MATH Level 5,0.307401812688822,30.7401812688822,GPQA,0.357382550335571,14.3176733780761,MUSR,0.46909375,18.4700520833333,MMLU-PRO,0.518617021276596,46.5130023640662,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,CultriX/Qwen2.5-14B-Emerged (Merge),"",0,7.383,1.80736016762088 CultriX/Qwen2.5-14B-Emergedv3_bfloat16_f4df1b9c2bf37bbfd6b2e8f2ff244c6029a5d546_False,CultriX/Qwen2.5-14B-Emergedv3,f4df1b9c2bf37bbfd6b2e8f2ff244c6029a5d546,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,34.8420924559616,FALSE,IFEval,0.638849364131615,63.8849364131615,BBH,0.619072841105603,44.7316082426086,MATH Level 5,0.206948640483384,20.6948640483384,GPQA,0.360738255033557,14.7651006711409,MUSR,0.4728125,18.6015625,MMLU-PRO,0.517370345744681,46.3744828605201,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,CultriX/Qwen2.5-14B-Emergedv3 (Merge),"",1,7.383,1.91892827649725 @@ -176,6 +176,9 @@ DRXD1000/Atlas-7B_bfloat16_967ee983e2a0b163c12da69f1f81aaf8ffb2a456_True,DRXD100 DRXD1000/Phoenix-7B_bfloat16_a5caa8036d8b7819eb723debe3f037471b5c4882_True,DRXD1000/Phoenix-7B,a5caa8036d8b7819eb723debe3f037471b5c4882,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,12.1432156087241,TRUE,IFEval,0.320961714916422,32.0961714916422,BBH,0.393156603472822,15.6201796643319,MATH Level 5,0,0,GPQA,0.278523489932886,3.80313199105145,MUSR,0.384947916666667,6.41848958333333,MMLU-PRO,0.234291888297872,14.9213209219858,TRUE,FALSE,FALSE,FALSE,FALSE,2024-01-10,2024-12-11,0,DRXD1000/Phoenix-7B,apache-2.0,17,7,0.470872419197835 DUAL-GPO/zephyr-7b-ipo-0k-15k-i1_bfloat16_564d269c67dfcc5c07a4fbc270a6a48da1929d30_False,DUAL-GPO/zephyr-7b-ipo-0k-15k-i1,564d269c67dfcc5c07a4fbc270a6a48da1929d30,bfloat16,chatmodels,Adapter,?,15.4929476596832,FALSE,IFEval,0.275624232591745,27.5624232591746,BBH,0.447271244756595,22.6586426600964,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.291107382550336,5.48098434004475,MUSR,0.41734375,10.56796875,MMLU-PRO,0.312998670212766,23.6665189125296,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-22,1,DUAL-GPO/zephyr-7b-ipo-qlora-v0-merged,"",0,14.483,0.971423382137328 DZgas/GIGABATEMAN-7B_float16_edf2840350e7fd55895d9df560b489ac10ecb95e_False,DZgas/GIGABATEMAN-7B,edf2840350e7fd55895d9df560b489ac10ecb95e,float16,basemergesandmoerges,Original,MistralForCausalLM,20.4462927397202,FALSE,IFEval,0.460746375173429,46.0746375173429,BBH,0.503218434286276,29.827516654014,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.289429530201342,5.2572706935123,MUSR,0.43284375,11.9721354166667,MMLU-PRO,0.317652925531915,24.183658392435,FALSE,FALSE,FALSE,FALSE,FALSE,2024-04-17,2024-09-15,1,DZgas/GIGABATEMAN-7B (Merge),"",5,7.242,0.630337327119902 +Daemontatox/AetherDrake-SFT_float16_17a0f90f0c06f2adc885faccd0a6172a7b996126_False,Daemontatox/AetherDrake-SFT,17a0f90f0c06f2adc885faccd0a6172a7b996126,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.8270284619053,FALSE,IFEval,0.480355456854479,48.0355456854479,BBH,0.487200755072202,27.1392523216301,MATH Level 5,0.146525679758308,14.6525679758308,GPQA,0.320469798657718,9.39597315436242,MUSR,0.40884375,9.97213541666667,MMLU-PRO,0.349900265957447,27.7666962174941,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-24,2024-12-25,1,Daemontatox/AetherDrake-SFT (Merge),apache-2.0,1,4.015,1.44931329121135 +Daemontatox/PathfinderAI_float16_14c6a91351006b7be0aff85292733470ff1b546d_False,Daemontatox/PathfinderAI,14c6a91351006b7be0aff85292733470ff1b546d,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,38.1313135250406,FALSE,IFEval,0.374517391631981,37.4517391631981,BBH,0.666785433123254,52.6465473343533,MATH Level 5,0.47583081570997,47.583081570997,GPQA,0.394295302013423,19.2393736017897,MUSR,0.485833333333333,20.8291666666667,MMLU-PRO,0.559341755319149,51.0379728132388,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-24,2024-12-25,1,Daemontatox/PathfinderAI (Merge),apache-2.0,0,16.382,4.54091822797527 +Daemontatox/RA_Reasoner_float16_e799c6877cb70b6e78c1e337eaa58383040c8fa9_False,Daemontatox/RA_Reasoner,e799c6877cb70b6e78c1e337eaa58383040c8fa9,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,29.0191808385312,FALSE,IFEval,0.559215104810791,55.9215104810791,BBH,0.605369241720503,43.0730077734737,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.331375838926175,10.8501118568233,MUSR,0.396354166666667,7.5109375,MMLU-PRO,0.430019946808511,36.6688829787234,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-25,2,tiiuae/Falcon3-10B-Base,apache-2.0,1,5.153,0.779073366733575 Dampfinchen/Llama-3.1-8B-Ultra-Instruct_bfloat16_46662d14130cfd34f7d90816540794f24a301f86_True,Dampfinchen/Llama-3.1-8B-Ultra-Instruct,46662d14130cfd34f7d90816540794f24a301f86,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,29.1270514428358,TRUE,IFEval,0.808109150387638,80.8109150387638,BBH,0.525753245224657,32.4945868042057,MATH Level 5,0.158610271903323,15.8610271903323,GPQA,0.291946308724832,5.59284116331097,MUSR,0.400322916666667,8.60703125,MMLU-PRO,0.382563164893617,31.3959072104019,TRUE,TRUE,FALSE,FALSE,FALSE,2024-08-26,2024-08-26,1,Dampfinchen/Llama-3.1-8B-Ultra-Instruct (Merge),llama3,7,8.03,0.836478665207706 Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO_float16_b749dbcb19901b8fd0e9f38c923a24533569f895_True,Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO,b749dbcb19901b8fd0e9f38c923a24533569f895,float16,chatmodels,Original,MistralForCausalLM,31.7384475839978,TRUE,IFEval,0.479905539524019,47.9905539524019,BBH,0.653618488664863,51.0294184032803,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.326342281879195,10.1789709172259,MUSR,0.48075,20.5270833333333,MMLU-PRO,0.472323803191489,41.369311465721,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-15,2024-08-13,0,Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO,mit,5,13.96,1.57231518388353 Danielbrdz/Barcenas-Llama3-8b-ORPO_float16_66c848c4526d3db1ec41468c0f73ac4448c6abe9_True,Danielbrdz/Barcenas-Llama3-8b-ORPO,66c848c4526d3db1ec41468c0f73ac4448c6abe9,float16,chatmodels,Original,LlamaForCausalLM,26.519005053592,TRUE,IFEval,0.737242738156979,73.7242738156979,BBH,0.498655785599113,28.6006234999819,MATH Level 5,0.0657099697885197,6.57099697885197,GPQA,0.307046979865772,7.60626398210291,MUSR,0.418958333333333,11.1697916666667,MMLU-PRO,0.382978723404255,31.4420803782506,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-06-29,0,Danielbrdz/Barcenas-Llama3-8b-ORPO,other,7,8.03,0.774159185697872 @@ -255,9 +258,9 @@ DreadPoor/WIP_Damascus-8B-TIES_bfloat16_c7720a0b0a8d24e62bf71b0e955b1aca8e62f1cb DreadPoor/felix_dies-mistral-7B-model_stock_bfloat16_bb317aa7565625327e18c5158aebd4710aa1d925_False,DreadPoor/felix_dies-mistral-7B-model_stock,bb317aa7565625327e18c5158aebd4710aa1d925,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,18.1018281017421,FALSE,IFEval,0.300778600779266,30.0778600779266,BBH,0.490091807352742,28.8907980509645,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.291946308724832,5.59284116331097,MUSR,0.451822916666667,15.4778645833333,MMLU-PRO,0.310920877659575,23.4356530732861,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-30,0,Removed,"",0,7.242,0.661571667363575 DreadPoor/remember_to_breathe-8b-Model-Stock_bfloat16_fa88f1b06cf9ca7bd0d859c6a4b2240485363ae0_True,DreadPoor/remember_to_breathe-8b-Model-Stock,fa88f1b06cf9ca7bd0d859c6a4b2240485363ae0,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,28.1684073595337,TRUE,IFEval,0.710415032114789,71.0415032114789,BBH,0.541165443559992,34.6789907623163,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.301174496644295,6.82326621923937,MUSR,0.414458333333333,11.440625,MMLU-PRO,0.37608045212766,30.6756057919622,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-06,0,Removed,"",0,8.03,0.663540162076869 EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2_bfloat16_2590214b30391392b9a84e7cbe40fff3a92c6814_True,EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2,2590214b30391392b9a84e7cbe40fff3a92c6814,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,43.5418377172999,TRUE,IFEval,0.687883704127271,68.7883704127271,BBH,0.708801222804876,59.0667326828602,MATH Level 5,0.390483383685801,39.0483383685801,GPQA,0.408557046979866,21.1409395973154,MUSR,0.471979166666667,19.7307291666667,MMLU-PRO,0.581283244680851,53.4759160756501,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-27,1,Qwen/Qwen2.5-72B,other,10,72.706,22.95509846631 -EleutherAI/gpt-j-6b_bfloat16_47e169305d2e8376be1d31e765533382721b2cc1_False,EleutherAI/gpt-j-6b,47e169305d2e8376be1d31e765533382721b2cc1,bfloat16,pretrained,Original,GPTJForCausalLM,6.55782365211081,FALSE,IFEval,0.252218557870894,25.2218557870894,BBH,0.319104443103728,4.91281806832369,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.245805369127517,0,MUSR,0.36575,5.25208333333333,MMLU-PRO,0.124085771276596,2.67619680851064,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-19,0,EleutherAI/gpt-j-6b,apache-2.0,1456,6,0.767432156385538 +EleutherAI/gpt-j-6b_bfloat16_47e169305d2e8376be1d31e765533382721b2cc1_False,EleutherAI/gpt-j-6b,47e169305d2e8376be1d31e765533382721b2cc1,bfloat16,pretrained,Original,GPTJForCausalLM,6.55782365211081,FALSE,IFEval,0.252218557870894,25.2218557870894,BBH,0.319104443103728,4.91281806832369,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.245805369127517,0,MUSR,0.36575,5.25208333333333,MMLU-PRO,0.124085771276596,2.67619680851064,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-19,0,EleutherAI/gpt-j-6b,apache-2.0,1457,6,0.767432156385538 EleutherAI/gpt-neo-1.3B_bfloat16_dbe59a7f4a88d01d1ba9798d78dbe3fe038792c8_False,EleutherAI/gpt-neo-1.3B,dbe59a7f4a88d01d1ba9798d78dbe3fe038792c8,bfloat16,pretrained,Original,GPTNeoForCausalLM,5.34073838155464,FALSE,IFEval,0.207905025332784,20.7905025332784,BBH,0.303923158693564,3.02456918093099,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.255872483221477,0.782997762863532,MUSR,0.38165625,4.87369791666667,MMLU-PRO,0.116356382978723,1.81737588652482,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,EleutherAI/gpt-neo-1.3B,mit,270,1.366,0.359424061519048 -EleutherAI/gpt-neo-125m_bfloat16_21def0189f5705e2521767faed922f1f15e7d7db_False,EleutherAI/gpt-neo-125m,21def0189f5705e2521767faed922f1f15e7d7db,bfloat16,pretrained,Original,GPTNeoForCausalLM,4.3821456739786,FALSE,IFEval,0.190544422133273,19.0544422133273,BBH,0.311515688579152,3.4367389514267,MATH Level 5,0.00453172205438066,0.453172205438066,GPQA,0.253355704697987,0.447427293064876,MUSR,0.359333333333333,2.61666666666667,MMLU-PRO,0.102559840425532,0.28442671394799,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-10,0,EleutherAI/gpt-neo-125m,mit,186,0.15,0.202902486593259 +EleutherAI/gpt-neo-125m_bfloat16_21def0189f5705e2521767faed922f1f15e7d7db_False,EleutherAI/gpt-neo-125m,21def0189f5705e2521767faed922f1f15e7d7db,bfloat16,pretrained,Original,GPTNeoForCausalLM,4.3821456739786,FALSE,IFEval,0.190544422133273,19.0544422133273,BBH,0.311515688579152,3.4367389514267,MATH Level 5,0.00453172205438066,0.453172205438066,GPQA,0.253355704697987,0.447427293064876,MUSR,0.359333333333333,2.61666666666667,MMLU-PRO,0.102559840425532,0.28442671394799,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-10,0,EleutherAI/gpt-neo-125m,mit,187,0.15,0.202902486593259 EleutherAI/gpt-neo-2.7B_bfloat16_e24fa291132763e59f4a5422741b424fb5d59056_False,EleutherAI/gpt-neo-2.7B,e24fa291132763e59f4a5422741b424fb5d59056,bfloat16,pretrained,Original,GPTNeoForCausalLM,6.3555191000811,FALSE,IFEval,0.258962885144749,25.8962885144749,BBH,0.313951603331525,4.17860266708101,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.265939597315436,2.12527964205817,MUSR,0.355364583333333,3.52057291666667,MMLU-PRO,0.116273271276596,1.80814125295508,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,EleutherAI/gpt-neo-2.7B,mit,447,2.718,0.508381401623291 EleutherAI/gpt-neox-20b_float16_c292233c833e336628618a88a648727eb3dff0a7_False,EleutherAI/gpt-neox-20b,c292233c833e336628618a88a648727eb3dff0a7,float16,pretrained,Original,GPTNeoXForCausalLM,6.00322910111482,FALSE,IFEval,0.258688058795108,25.8688058795108,BBH,0.316503803208776,4.9291142015269,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.243288590604027,0,MUSR,0.364666666666667,2.81666666666667,MMLU-PRO,0.115525265957447,1.72502955082742,TRUE,FALSE,FALSE,FALSE,TRUE,2022-04-07,2024-06-09,0,EleutherAI/gpt-neox-20b,apache-2.0,544,20.739,3.14673637361504 EleutherAI/pythia-12b_float16_35c9d7f32fbb108fb8b5bdd574eb03369d1eed49_False,EleutherAI/pythia-12b,35c9d7f32fbb108fb8b5bdd574eb03369d1eed49,float16,pretrained,Original,GPTNeoXForCausalLM,5.93396032476546,FALSE,IFEval,0.247147568451708,24.7147568451708,BBH,0.317965395793534,4.98753103829051,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.246644295302013,0,MUSR,0.364697916666667,3.78723958333333,MMLU-PRO,0.110871010638298,1.20789007092199,TRUE,FALSE,FALSE,FALSE,TRUE,2023-02-28,2024-06-12,0,EleutherAI/pythia-12b,apache-2.0,131,12,1.11800715316637 @@ -377,7 +380,7 @@ HelpingAI/Priya-10B_float16_82f217b1c0b50c3941a6d3f0cff94812aa10c0b9_True,Helpin HelpingAI/Priya-3B_bfloat16_43681968e92d52df5b171aff6aa59baf4f3cdeba_True,HelpingAI/Priya-3B,43681968e92d52df5b171aff6aa59baf4f3cdeba,bfloat16,continuouslypretrained,Original,LlamaForCausalLM,13.2785347643778,TRUE,IFEval,0.452578048466957,45.2578048466957,BBH,0.396118486332784,14.3352734096268,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.256711409395973,0.894854586129753,MUSR,0.371302083333333,3.77942708333333,MMLU-PRO,0.233876329787234,14.8751477541371,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-14,0,HelpingAI/Priya-3B,other,1,3,0.641329872110001 HiroseKoichi/Llama-Salad-4x8B-V3_bfloat16_a343915429779efbd1478f01ba1f7fd9d8d226c0_True,HiroseKoichi/Llama-Salad-4x8B-V3,a343915429779efbd1478f01ba1f7fd9d8d226c0,bfloat16,basemergesandmoerges,Original,MixtralForCausalLM,24.9352898410171,TRUE,IFEval,0.665352376139754,66.5352376139754,BBH,0.524464978900175,31.9288488107451,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.302852348993289,7.04697986577182,MUSR,0.37403125,6.45390625,MMLU-PRO,0.351811835106383,27.9790927895981,TRUE,TRUE,TRUE,FALSE,FALSE,2024-06-17,2024-06-26,0,HiroseKoichi/Llama-Salad-4x8B-V3,llama3,5,24.942,2.13769520215148 HuggingFaceH4/zephyr-7b-alpha_bfloat16_2ce2d025864af849b3e5029e2ec9d568eeda892d_True,HuggingFaceH4/zephyr-7b-alpha,2ce2d025864af849b3e5029e2ec9d568eeda892d,bfloat16,chatmodels,Original,MistralForCausalLM,18.5718642203846,TRUE,IFEval,0.519148082642943,51.9148082642943,BBH,0.458786350590441,23.9552914270685,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.297818791946309,6.3758389261745,MUSR,0.394958333333333,7.503125,MMLU-PRO,0.279504654255319,19.9449615839244,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-09,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1103,7.242,0.79567519919312 -HuggingFaceH4/zephyr-7b-beta_bfloat16_b70e0c9a2d9e14bd1e812d3c398e5f313e93b473_True,HuggingFaceH4/zephyr-7b-beta,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,bfloat16,chatmodels,Original,MistralForCausalLM,17.767060993735,TRUE,IFEval,0.495043152169577,49.5043152169577,BBH,0.431582191918003,21.4875421828067,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.290268456375839,5.36912751677852,MUSR,0.392541666666667,7.734375,MMLU-PRO,0.278091755319149,19.7879728132388,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-26,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1621,7.242,0.555023090869454 +HuggingFaceH4/zephyr-7b-beta_bfloat16_b70e0c9a2d9e14bd1e812d3c398e5f313e93b473_True,HuggingFaceH4/zephyr-7b-beta,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,bfloat16,chatmodels,Original,MistralForCausalLM,17.767060993735,TRUE,IFEval,0.495043152169577,49.5043152169577,BBH,0.431582191918003,21.4875421828067,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.290268456375839,5.36912751677852,MUSR,0.392541666666667,7.734375,MMLU-PRO,0.278091755319149,19.7879728132388,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-26,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1627,7.242,0.555023090869454 HuggingFaceH4/zephyr-7b-gemma-v0.1_bfloat16_03b3427d0ed07d2e0f86c0a7e53d82d4beef9540_True,HuggingFaceH4/zephyr-7b-gemma-v0.1,03b3427d0ed07d2e0f86c0a7e53d82d4beef9540,bfloat16,chatmodels,Original,GemmaForCausalLM,15.9293384077098,TRUE,IFEval,0.336374153911621,33.6374153911621,BBH,0.462373501467975,23.7511627492013,MATH Level 5,0.0755287009063444,7.55287009063444,GPQA,0.294463087248322,5.92841163310962,MUSR,0.37396875,4.17942708333333,MMLU-PRO,0.284740691489362,20.526743498818,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-01,2024-06-12,2,google/gemma-7b,other,121,8.538,1.48177514162897 HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1_float16_a3be084543d278e61b64cd600f28157afc79ffd3_True,HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1,a3be084543d278e61b64cd600f28157afc79ffd3,float16,chatmodels,Original,MixtralForCausalLM,34.0630228005823,TRUE,IFEval,0.65108911022753,65.108911022753,BBH,0.629043972852409,47.5037962865412,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.378355704697987,17.1140939597315,MUSR,0.446520833333333,14.7151041666667,MMLU-PRO,0.458610372340426,39.8455969267139,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-10,2024-06-12,1,mistral-community/Mixtral-8x22B-v0.1,apache-2.0,262,140.621,42.0677864230678 HuggingFaceTB/SmolLM-1.7B_bfloat16_673a07602ca1191e5bc2ddda428e2f608a0a14c0_False,HuggingFaceTB/SmolLM-1.7B,673a07602ca1191e5bc2ddda428e2f608a0a14c0,bfloat16,pretrained,Original,LlamaForCausalLM,5.42539853445636,FALSE,IFEval,0.236156730807591,23.6156730807591,BBH,0.318051653896478,4.4111278515492,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.241610738255034,0,MUSR,0.34209375,2.12838541666667,MMLU-PRO,0.114777260638298,1.64191784869976,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-18,0,HuggingFaceTB/SmolLM-1.7B,apache-2.0,164,1.71,0.324307256517662 @@ -387,7 +390,7 @@ HuggingFaceTB/SmolLM-135M-Instruct_bfloat16_8ca7af58e27777cae460ad8ca3ab9db15f5c HuggingFaceTB/SmolLM-360M_bfloat16_318cc630b73730bfd712e5873063156ffb8936b5_False,HuggingFaceTB/SmolLM-360M,318cc630b73730bfd712e5873063156ffb8936b5,bfloat16,pretrained,Original,LlamaForCausalLM,6.14759580602707,FALSE,IFEval,0.213350576470432,21.3350576470432,BBH,0.306451603331525,3.28491530324659,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.26761744966443,2.3489932885906,MUSR,0.40178125,8.08932291666667,MMLU-PRO,0.112367021276596,1.3741134751773,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-18,0,HuggingFaceTB/SmolLM-360M,apache-2.0,62,0.36,0.365259532167126 HuggingFaceTB/SmolLM-360M-Instruct_bfloat16_8e951de8c220295ea4f85d078c4e320df7137535_True,HuggingFaceTB/SmolLM-360M-Instruct,8e951de8c220295ea4f85d078c4e320df7137535,bfloat16,chatmodels,Original,LlamaForCausalLM,4.70678415207999,TRUE,IFEval,0.195165494221998,19.5165494221998,BBH,0.288511143632177,2.08037429085374,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.347177083333333,2.89713541666667,MMLU-PRO,0.116605718085106,1.84507978723404,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-15,2024-08-20,1,HuggingFaceTB/SmolLM-360M,apache-2.0,77,0.362,0.366501024298985 HuggingFaceTB/SmolLM2-1.7B_bfloat16_4fa12cab4f5f53670b05125fb9d2873af587d231_False,HuggingFaceTB/SmolLM2-1.7B,4fa12cab4f5f53670b05125fb9d2873af587d231,bfloat16,pretrained,Original,LlamaForCausalLM,9.49550422402913,FALSE,IFEval,0.244000363480011,24.4000363480011,BBH,0.345259437716626,9.30178845955168,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.279362416107383,3.91498881431767,MUSR,0.348541666666667,4.60104166666667,MMLU-PRO,0.21376329787234,12.64036643026,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-30,2024-11-06,0,HuggingFaceTB/SmolLM2-1.7B,apache-2.0,85,1.71,0.325025991140308 -HuggingFaceTB/SmolLM2-1.7B-Instruct_bfloat16_d1bb90bcfbe0f211109880f4da18da66f229c4f6_True,HuggingFaceTB/SmolLM2-1.7B-Instruct,d1bb90bcfbe0f211109880f4da18da66f229c4f6,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7453390971056,TRUE,IFEval,0.536783512192095,53.6783512192095,BBH,0.359861753141516,10.9179892262081,MATH Level 5,0.0415407854984894,4.15407854984894,GPQA,0.279362416107383,3.91498881431767,MUSR,0.342125,4.09895833333334,MMLU-PRO,0.205369015957447,11.7076684397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-1.7B-Instruct (Merge),apache-2.0,442,1.71,0.63234061656892 +HuggingFaceTB/SmolLM2-1.7B-Instruct_bfloat16_d1bb90bcfbe0f211109880f4da18da66f229c4f6_True,HuggingFaceTB/SmolLM2-1.7B-Instruct,d1bb90bcfbe0f211109880f4da18da66f229c4f6,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7453390971056,TRUE,IFEval,0.536783512192095,53.6783512192095,BBH,0.359861753141516,10.9179892262081,MATH Level 5,0.0415407854984894,4.15407854984894,GPQA,0.279362416107383,3.91498881431767,MUSR,0.342125,4.09895833333334,MMLU-PRO,0.205369015957447,11.7076684397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-1.7B-Instruct (Merge),apache-2.0,443,1.71,0.63234061656892 HuggingFaceTB/SmolLM2-135M_bfloat16_28e66ca6931668447a3bac213f23d990ad3b0e2b_False,HuggingFaceTB/SmolLM2-135M,28e66ca6931668447a3bac213f23d990ad3b0e2b,bfloat16,pretrained,Original,LlamaForCausalLM,5.55767745404167,FALSE,IFEval,0.183300309844546,18.3300309844546,BBH,0.304423424687714,3.70807758683998,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.248322147651007,0,MUSR,0.411177083333333,10.03046875,MMLU-PRO,0.109458111702128,1.05090130023641,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,0,HuggingFaceTB/SmolLM2-135M,apache-2.0,44,0.135,0.333904566630153 HuggingFaceTB/SmolLM2-135M-Instruct_bfloat16_5a33ba103645800d7b3790c4448546c1b73efc71_True,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,bfloat16,chatmodels,Original,LlamaForCausalLM,6.46736472035882,TRUE,IFEval,0.288313896018121,28.8313896018121,BBH,0.312432132806668,4.72080766080528,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.235738255033557,0,MUSR,0.36621875,3.67734375,MMLU-PRO,0.111452792553191,1.27253250591016,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-06,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,79,0.135,0.338375628206877 HuggingFaceTB/SmolLM2-135M-Instruct_float16_5a33ba103645800d7b3790c4448546c1b73efc71_False,HuggingFaceTB/SmolLM2-135M-Instruct,5a33ba103645800d7b3790c4448546c1b73efc71,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.99259897065637,FALSE,IFEval,0.0592516744460254,5.92516744460254,BBH,0.313475029473359,4.79627574466244,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.234060402684564,0,MUSR,0.387145833333333,6.05989583333334,MMLU-PRO,0.109208776595745,1.02319739952719,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-11-14,1,HuggingFaceTB/SmolLM2-135M-Instruct (Merge),apache-2.0,79,0.135,0.348753843693507 @@ -410,7 +413,7 @@ Isaak-Carter/JOSIEv4o-8b-stage1-v4_bfloat16_a8380a7be51b547761824e524b3d95ac7320 Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated_bfloat16_879168f9ce9fac315a19dd4f4c7df5253bb660f2_True,Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated,879168f9ce9fac315a19dd4f4c7df5253bb660f2,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,26.8572954599091,TRUE,IFEval,0.73174731933492,73.174731933492,BBH,0.539637628446092,34.9043156883231,MATH Level 5,0,0,GPQA,0.302852348993289,7.04697986577182,MUSR,0.408666666666667,9.61666666666667,MMLU-PRO,0.427609707446809,36.4010786052009,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-21,0,Removed,"",0,7.616,1.07679067507346 Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated-v2_bfloat16_5d07f58562422feb9f25c9c048e40356d2cf7e4b_True,Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated-v2,5d07f58562422feb9f25c9c048e40356d2cf7e4b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,27.8179595712917,TRUE,IFEval,0.784103955283093,78.4103955283093,BBH,0.531092359918207,33.2945398202129,MATH Level 5,0,0,GPQA,0.298657718120805,6.48769574944072,MUSR,0.435395833333333,13.9578125,MMLU-PRO,0.412815824468085,34.7573138297872,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-21,1,Qwen/Qwen2.5-7B,apache-2.0,5,7.616,1.13091464679065 J-LAB/Thynk_orpo_float16_c6606d402f26d005b9f1a71a1cde9139d1cffb2a_False,J-LAB/Thynk_orpo,c6606d402f26d005b9f1a71a1cde9139d1cffb2a,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,16.9744070421119,FALSE,IFEval,0.210177883571147,21.0177883571147,BBH,0.446311387787096,22.0627839441444,MATH Level 5,0.130664652567976,13.0664652567976,GPQA,0.292785234899329,5.70469798657718,MUSR,0.451479166666667,15.2015625,MMLU-PRO,0.32313829787234,24.7931442080378,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-10-14,0,Removed,"",0,3.086,1.21476411071604 -JackFram/llama-160m_bfloat16_aca9b687d1425f863dcf5de9a4c96e3fe36266dd_False,JackFram/llama-160m,aca9b687d1425f863dcf5de9a4c96e3fe36266dd,bfloat16,pretrained,Original,LlamaForCausalLM,4.59966056180143,FALSE,IFEval,0.179103667158695,17.9103667158695,BBH,0.288802175390424,2.03360615285273,MATH Level 5,0,0,GPQA,0.261744966442953,1.56599552572707,MUSR,0.379208333333333,4.66770833333333,MMLU-PRO,0.112782579787234,1.420286643026,TRUE,FALSE,FALSE,FALSE,FALSE,2023-05-26,2024-11-30,0,JackFram/llama-160m,apache-2.0,34,0.162,0.0934743941743699 +JackFram/llama-160m_bfloat16_aca9b687d1425f863dcf5de9a4c96e3fe36266dd_False,JackFram/llama-160m,aca9b687d1425f863dcf5de9a4c96e3fe36266dd,bfloat16,pretrained,Original,LlamaForCausalLM,4.59966056180143,FALSE,IFEval,0.179103667158695,17.9103667158695,BBH,0.288802175390424,2.03360615285273,MATH Level 5,0,0,GPQA,0.261744966442953,1.56599552572707,MUSR,0.379208333333333,4.66770833333333,MMLU-PRO,0.112782579787234,1.420286643026,TRUE,FALSE,FALSE,FALSE,FALSE,2023-05-26,2024-11-30,0,JackFram/llama-160m,apache-2.0,33,0.162,0.0934743941743699 JackFram/llama-68m_bfloat16_964a5d77df908b69f8d6476fb70e940425b04cb5_False,JackFram/llama-68m,964a5d77df908b69f8d6476fb70e940425b04cb5,bfloat16,pretrained,Original,LlamaForCausalLM,4.86263476563279,FALSE,IFEval,0.17263416623448,17.263416623448,BBH,0.293629865093364,2.59104780683548,MATH Level 5,0,0,GPQA,0.258389261744966,1.11856823266219,MUSR,0.390989583333333,6.60703125,MMLU-PRO,0.11436170212766,1.59574468085106,TRUE,FALSE,FALSE,FALSE,FALSE,2023-07-19,2024-11-30,0,JackFram/llama-68m,apache-2.0,25,0.068,0.0605579039184109 Jacoby746/Casual-Magnum-34B_float16_b628c6959441db75460cfd49536322b1ea46130e_False,Jacoby746/Casual-Magnum-34B,b628c6959441db75460cfd49536322b1ea46130e,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.5713346184245,FALSE,IFEval,0.193016751109279,19.3016751109279,BBH,0.603204688054297,43.0515676284677,MATH Level 5,0.0785498489425982,7.85498489425982,GPQA,0.37248322147651,16.331096196868,MUSR,0.407760416666667,8.40338541666667,MMLU-PRO,0.518367686170213,46.485298463357,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-01,2024-10-23,1,Jacoby746/Casual-Magnum-34B (Merge),apache-2.0,1,34.389,3.42669714201879 Jacoby746/Inf-Silent-Kunoichi-v0.1-2x7B_float16_9ab68beb6fe16cab2ab708b9af4417c89751d297_False,Jacoby746/Inf-Silent-Kunoichi-v0.1-2x7B,9ab68beb6fe16cab2ab708b9af4417c89751d297,float16,basemergesandmoerges,Original,MixtralForCausalLM,20.0099476497453,FALSE,IFEval,0.387981666422869,38.7981666422869,BBH,0.518546209727402,32.3870042041129,MATH Level 5,0.0604229607250755,6.04229607250755,GPQA,0.289429530201342,5.2572706935123,MUSR,0.428041666666667,12.3385416666667,MMLU-PRO,0.327127659574468,25.2364066193853,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-19,2024-09-20,1,Jacoby746/Inf-Silent-Kunoichi-v0.1-2x7B (Merge),apache-2.0,0,12.879,1.86005330272532 @@ -419,6 +422,12 @@ Jacoby746/Proto-Athena-4x7B_float16_450fcba7a630fb61a662f71936d37979226fced8_Fal Jacoby746/Proto-Athena-v0.2-4x7B_bfloat16_01feeded217ea83a8794e7968c8850859b5f0b14_False,Jacoby746/Proto-Athena-v0.2-4x7B,01feeded217ea83a8794e7968c8850859b5f0b14,bfloat16,basemergesandmoerges,Original,MixtralForCausalLM,19.1438976257104,FALSE,IFEval,0.375242135312083,37.5242135312083,BBH,0.506773100542496,30.3408443303037,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.298657718120805,6.48769574944072,MUSR,0.42128125,10.96015625,MMLU-PRO,0.319730718085106,24.4145242316785,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-21,2024-09-21,1,Jacoby746/Proto-Athena-v0.2-4x7B (Merge),apache-2.0,0,24.154,1.65137195219129 Jacoby746/Proto-Harpy-Blazing-Light-v0.1-2x7B_float16_bbb5d7c7a0c9e999e057ffa71eaa93d59d95b36b_False,Jacoby746/Proto-Harpy-Blazing-Light-v0.1-2x7B,bbb5d7c7a0c9e999e057ffa71eaa93d59d95b36b,float16,basemergesandmoerges,Original,MixtralForCausalLM,22.292391864754,FALSE,IFEval,0.490471947765263,49.0471947765263,BBH,0.51868490530526,32.6325299015927,MATH Level 5,0.0634441087613293,6.34441087613293,GPQA,0.295302013422819,6.04026845637584,MUSR,0.44496875,14.12109375,MMLU-PRO,0.330119680851064,25.568853427896,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-22,2024-09-30,1,Jacoby746/Proto-Harpy-Blazing-Light-v0.1-2x7B (Merge),"",0,12.879,0.881840827555971 Jacoby746/Proto-Harpy-Spark-v0.1-7B_float16_984cca02cd930b2e1b7b2a7d53471d32d9821cdd_False,Jacoby746/Proto-Harpy-Spark-v0.1-7B,984cca02cd930b2e1b7b2a7d53471d32d9821cdd,float16,basemergesandmoerges,Original,MistralForCausalLM,19.8625880175234,FALSE,IFEval,0.433269281063135,43.3269281063135,BBH,0.473577180829655,26.9131101594249,MATH Level 5,0.0626888217522659,6.26888217522659,GPQA,0.305369127516779,7.38255033557047,MUSR,0.431666666666667,12.2916666666667,MMLU-PRO,0.306931515957447,22.9923906619385,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-22,2024-09-30,1,Jacoby746/Proto-Harpy-Spark-v0.1-7B (Merge),apache-2.0,0,7.242,0.595804595864942 +JayHyeon/Qwen-0.5B-DPO-1epoch_bfloat16_f5569969d307d193798eff52c0527e23f4ac8bb9_True,JayHyeon/Qwen-0.5B-DPO-1epoch,f5569969d307d193798eff52c0527e23f4ac8bb9,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,7.1969109979814,TRUE,IFEval,0.264733130316449,26.4733130316449,BBH,0.319075024342786,5.54369475035067,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.25251677852349,0.335570469798655,MUSR,0.335177083333333,2.89713541666667,MMLU-PRO,0.155751329787234,6.19459219858156,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,0,JayHyeon/Qwen-0.5B-DPO-1epoch,mit,0,0.247,0.478256742058029 +JayHyeon/Qwen-0.5B-DPO-5epoch_bfloat16_4363737d67e793b7cfb714dda4aa27677a4db6e4_True,JayHyeon/Qwen-0.5B-DPO-5epoch,4363737d67e793b7cfb714dda4aa27677a4db6e4,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,6.89646838113632,TRUE,IFEval,0.257014720940438,25.7014720940438,BBH,0.311210954486878,5.05669225833408,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.243288590604027,0,MUSR,0.33796875,2.51276041666667,MMLU-PRO,0.153257978723404,5.91755319148936,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,0,JayHyeon/Qwen-0.5B-DPO-5epoch,mit,0,0.247,0.946676877617837 +JayHyeon/Qwen-0.5B-IRPO-1epoch_bfloat16_2dc73651ff3cbf0e4638c3bd5b1d87cfe2afc15f_True,JayHyeon/Qwen-0.5B-IRPO-1epoch,2dc73651ff3cbf0e4638c3bd5b1d87cfe2afc15f,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,6.78013020834913,TRUE,IFEval,0.258913017460339,25.8913017460339,BBH,0.31638216610052,5.32435185185185,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.246644295302013,0,MUSR,0.328635416666667,2.24609375,MMLU-PRO,0.150016622340426,5.5574024822695,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,0,JayHyeon/Qwen-0.5B-IRPO-1epoch,mit,0,0.247,0.495443558403486 +JayHyeon/Qwen-0.5B-IRPO-5epoch_bfloat16_dca128b2490982a6f2d53d017ad44c1b7829fabe_True,JayHyeon/Qwen-0.5B-IRPO-5epoch,dca128b2490982a6f2d53d017ad44c1b7829fabe,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,6.6591181877807,TRUE,IFEval,0.248671303253146,24.8671303253146,BBH,0.31891656220326,5.71133449726923,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.23993288590604,0,MUSR,0.328666666666667,2.08333333333333,MMLU-PRO,0.150681515957447,5.63127955082742,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,0,JayHyeon/Qwen-0.5B-IRPO-5epoch,mit,0,0.247,0.975681876690692 +JayHyeon/Qwen-0.5B-eDPO-1epoch_bfloat16_d24f341c6034334f397c156593ac8eece0a8a6ff_True,JayHyeon/Qwen-0.5B-eDPO-1epoch,d24f341c6034334f397c156593ac8eece0a8a6ff,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,6.99147049092451,TRUE,IFEval,0.262335048781677,26.2335048781677,BBH,0.318063758345069,5.91840063270362,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.24244966442953,0,MUSR,0.332697916666667,1.92057291666667,MMLU-PRO,0.155252659574468,6.13918439716312,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,0,JayHyeon/Qwen-0.5B-eDPO-1epoch,mit,0,0.247,0.486569104745833 +JayHyeon/Qwen-0.5B-eDPO-5epoch_bfloat16_8de61ddfbe7dc2a00228309af4851797694cd153_True,JayHyeon/Qwen-0.5B-eDPO-5epoch,8de61ddfbe7dc2a00228309af4851797694cd153,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2Model,6.51617338495319,TRUE,IFEval,0.24562383365027,24.562383365027,BBH,0.309649182386935,5.19783769063181,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.249161073825503,0,MUSR,0.332635416666667,2.24609375,MMLU-PRO,0.152260638297872,5.80673758865248,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-26,0,JayHyeon/Qwen-0.5B-eDPO-5epoch,mit,0,0.247,0.965733835352203 Jimmy19991222/Llama-3-Instruct-8B-SimPO-v0.2_float16_53a517ceaef324efc3626be44140b4f18a010591_True,Jimmy19991222/Llama-3-Instruct-8B-SimPO-v0.2,53a517ceaef324efc3626be44140b4f18a010591,float16,chatmodels,Original,LlamaForCausalLM,24.2799484428417,TRUE,IFEval,0.654036844461584,65.4036844461584,BBH,0.498371102582105,29.1238227637126,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.314597315436242,8.61297539149888,MUSR,0.40125,8.38958333333333,MMLU-PRO,0.36860039893617,29.8444887706856,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-06,0,Removed,"",0,8.03,0.513151724588246 Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert-f1-beta10-gamma0.3-lr1.0e-6-1minus-rerun_bfloat16_00c02a823b4ff1a6cfcded6085ba9630df633998_True,Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert-f1-beta10-gamma0.3-lr1.0e-6-1minus-rerun,00c02a823b4ff1a6cfcded6085ba9630df633998,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.8177042788149,TRUE,IFEval,0.671722141695147,67.1722141695147,BBH,0.487979656728994,27.7552285821971,MATH Level 5,0.040785498489426,4.0785498489426,GPQA,0.294463087248322,5.92841163310962,MUSR,0.404072916666667,8.70911458333334,MMLU-PRO,0.363364361702128,29.262706855792,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-17,2024-09-18,1,meta-llama/Meta-Llama-3-8B-Instruct,llama3,0,8.03,0.481790909131988 Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert_f1-beta10-gamma0.3-lr1.0e-6-scale-log_bfloat16_99d9e31df5b7e88b1da78b1bd335cac3215dfd6e_True,Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert_f1-beta10-gamma0.3-lr1.0e-6-scale-log,99d9e31df5b7e88b1da78b1bd335cac3215dfd6e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.756269939372,TRUE,IFEval,0.655560579263022,65.5560579263022,BBH,0.493458403672942,28.6135966775256,MATH Level 5,0.033987915407855,3.3987915407855,GPQA,0.304530201342282,7.27069351230425,MUSR,0.400010416666667,8.16796875,MMLU-PRO,0.36577460106383,29.5305112293144,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-22,2024-09-22,1,meta-llama/Meta-Llama-3-8B-Instruct,llama3,0,8.03,0.478535413820399 @@ -460,7 +469,7 @@ LEESM/llama-2-7b-hf-lora-oki10p_float16_d6e5af01616a038ac2b5cb83f458e490e1102244 LEESM/llama-3-8b-bnb-4b-kowiki231101_bfloat16_63b8f715daab6a0c7196a20855be8e85fe7ddcb4_False,LEESM/llama-3-8b-bnb-4b-kowiki231101,63b8f715daab6a0c7196a20855be8e85fe7ddcb4,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,9.27108845579953,FALSE,IFEval,0.168487391233039,16.8487391233039,BBH,0.413080565361718,16.9348681493017,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.270973154362416,2.79642058165548,MUSR,0.355145833333333,3.05989583333333,MMLU-PRO,0.242519946808511,15.8355496453901,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-08,2024-11-08,2,meta-llama/Meta-Llama-3.1-8B,apache-2.0,0,8.03,0.756887607200453 LEESM/llama-3-Korean-Bllossom-8B-trexlab-oki10p_float16_d105e0365510f9e5f8550558343083cab8523524_False,LEESM/llama-3-Korean-Bllossom-8B-trexlab-oki10p,d105e0365510f9e5f8550558343083cab8523524,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,12.9431976670495,FALSE,IFEval,0.213725138188894,21.3725138188894,BBH,0.434301211693207,19.7974357609114,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.275167785234899,3.35570469798658,MUSR,0.386927083333333,7.66588541666667,MMLU-PRO,0.317652925531915,24.183658392435,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-22,2024-11-08,0,LEESM/llama-3-Korean-Bllossom-8B-trexlab-oki10p,mit,0,8.03,0.758357790011608 LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct_bfloat16_7f15baedd46858153d817445aff032f4d6cf4939_True,LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct,7f15baedd46858153d817445aff032f4d6cf4939,bfloat16,chatmodels,Original,ExaoneForCausalLM,21.4034633257456,TRUE,IFEval,0.719282614573775,71.9282614573775,BBH,0.417443264778451,17.9773353951805,MATH Level 5,0.0445619335347432,4.45619335347432,GPQA,0.265939597315436,2.12527964205817,MUSR,0.366125,3.29895833333333,MMLU-PRO,0.357712765957447,28.6347517730497,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-31,2024-08-18,0,LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct,other,389,7.8,0.82512797747961 -LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct_float16_e949c91dec92095908d34e6b560af77dd0c993f8_True,LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct,e949c91dec92095908d34e6b560af77dd0c993f8,float16,chatmodels,Original,ExaoneForCausalLM,26.6907110058015,TRUE,IFEval,0.7950449252428,79.50449252428,BBH,0.409234711372341,15.9474371710569,MATH Level 5,0.340634441087613,34.0634441087613,GPQA,0.265939597315436,2.12527964205817,MUSR,0.366125,3.165625,MMLU-PRO,0.328041888297872,25.3379875886525,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-11,0,LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct,other,80,2.4,0.60727146029865 +LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct_float16_e949c91dec92095908d34e6b560af77dd0c993f8_True,LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct,e949c91dec92095908d34e6b560af77dd0c993f8,float16,chatmodels,Original,ExaoneForCausalLM,26.6907110058015,TRUE,IFEval,0.7950449252428,79.50449252428,BBH,0.409234711372341,15.9474371710569,MATH Level 5,0.340634441087613,34.0634441087613,GPQA,0.265939597315436,2.12527964205817,MUSR,0.366125,3.165625,MMLU-PRO,0.328041888297872,25.3379875886525,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-11,0,LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct,other,81,2.4,0.60727146029865 LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct_float16_0ff6b5ec7c13b049b253a16a889aa269e6b79a94_True,LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct,0ff6b5ec7c13b049b253a16a889aa269e6b79a94,float16,chatmodels,Original,ExaoneForCausalLM,31.4646519124242,TRUE,IFEval,0.813604569209697,81.3604569209697,BBH,0.472759230435986,25.653749420829,MATH Level 5,0.41012084592145,41.012084592145,GPQA,0.25755033557047,1.00671140939597,MUSR,0.3779375,4.9421875,MMLU-PRO,0.413314494680851,34.8127216312057,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-11,0,LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct,other,76,7.8,0.719971670493439 LLM360/K2_float16_49d159b6f2b64d562e745f0ff06e65b9a4c28ead_False,LLM360/K2,49d159b6f2b64d562e745f0ff06e65b9a4c28ead,float16,pretrained,Original,LlamaForCausalLM,14.5682245890329,FALSE,IFEval,0.225215760847884,22.5215760847884,BBH,0.497183567652368,28.2204028342011,MATH Level 5,0.0226586102719033,2.26586102719033,GPQA,0.276845637583893,3.57941834451902,MUSR,0.398,8.55,MMLU-PRO,0.300448803191489,22.2720892434988,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-26,0,LLM360/K2,apache-2.0,81,65.286,8.83820641772923 LLM360/K2-Chat_bfloat16_5454f2d28031c9127e4227c873ca2f154e02e4c7_True,LLM360/K2-Chat,5454f2d28031c9127e4227c873ca2f154e02e4c7,bfloat16,chatmodels,Original,LlamaForCausalLM,22.9395117207926,TRUE,IFEval,0.515176398622322,51.5176398622322,BBH,0.535809963024207,33.793829235993,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.306208053691275,7.49440715883669,MUSR,0.457,16.825,MMLU-PRO,0.337101063829787,26.3445626477541,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,0,LLM360/K2-Chat,apache-2.0,33,65.286,17.259828063151 @@ -536,11 +545,11 @@ Lyte/Llama-3.2-1B-Instruct-COT-RL-Expriement1-EP04_bfloat16_59d93307c6f2cb7a29c5 Lyte/Llama-3.2-3B-Overthinker_float16_0e7af37fb3381365905fc2df24811c0e6d2ba5b2_True,Lyte/Llama-3.2-3B-Overthinker,0e7af37fb3381365905fc2df24811c0e6d2ba5b2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.0778462402,TRUE,IFEval,0.640797528335926,64.0797528335926,BBH,0.432009309795252,20.0955822264572,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.259228187919463,1.23042505592841,MUSR,0.34190625,3.90494791666667,MMLU-PRO,0.298537234042553,22.0596926713948,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-17,2024-10-18,2,meta-llama/Llama-3.2-3B-Instruct,apache-2.0,19,3.213,0.733639697394509 M4-ai/TinyMistral-248M-v3_bfloat16_fa23fe617768c671f0bbbff1edf4556cfe844167_False,M4-ai/TinyMistral-248M-v3,fa23fe617768c671f0bbbff1edf4556cfe844167,bfloat16,pretrained,Original,MistralForCausalLM,4.13010760928209,FALSE,IFEval,0.163866319144315,16.3866319144315,BBH,0.288454993899557,1.77755393038632,MATH Level 5,0,0,GPQA,0.240771812080537,0,MUSR,0.379333333333333,5.15,MMLU-PRO,0.113198138297872,1.4664598108747,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-05,2024-10-18,0,M4-ai/TinyMistral-248M-v3,apache-2.0,5,0.248,0.234183611420779 MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis_float16_7a9d848188a674302d64a865786d4508be19571a_False,MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis,7a9d848188a674302d64a865786d4508be19571a,float16,fine-tunedondomain-specificdatasets,Adapter,?,3.81803368483764,FALSE,IFEval,0.0866290331874981,8.66290331874981,BBH,0.305728612437881,3.23777427104784,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.251677852348993,0.223713646532442,MUSR,0.40171875,8.61484375,MMLU-PRO,0.115442154255319,1.71579491725768,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-12,2024-11-19,0,MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis,"",0,0.63,1.05155623119269 -MLP-KTLim/llama-3-Korean-Bllossom-8B_bfloat16_8a738f9f622ffc2b0a4a6b81dabbca80406248bf_True,MLP-KTLim/llama-3-Korean-Bllossom-8B,8a738f9f622ffc2b0a4a6b81dabbca80406248bf,bfloat16,chatmodels,Original,LlamaForCausalLM,20.333975762059,TRUE,IFEval,0.5112800702137,51.12800702137,BBH,0.490045564701877,26.9275279730551,MATH Level 5,0.0981873111782478,9.81873111782478,GPQA,0.26258389261745,1.67785234899329,MUSR,0.367458333333333,3.63229166666667,MMLU-PRO,0.359375,28.8194444444444,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-25,2024-07-09,1,MLP-KTLim/llama-3-Korean-Bllossom-8B (Merge),llama3,288,8.03,0.774720564334845 +MLP-KTLim/llama-3-Korean-Bllossom-8B_bfloat16_8a738f9f622ffc2b0a4a6b81dabbca80406248bf_True,MLP-KTLim/llama-3-Korean-Bllossom-8B,8a738f9f622ffc2b0a4a6b81dabbca80406248bf,bfloat16,chatmodels,Original,LlamaForCausalLM,20.333975762059,TRUE,IFEval,0.5112800702137,51.12800702137,BBH,0.490045564701877,26.9275279730551,MATH Level 5,0.0981873111782478,9.81873111782478,GPQA,0.26258389261745,1.67785234899329,MUSR,0.367458333333333,3.63229166666667,MMLU-PRO,0.359375,28.8194444444444,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-25,2024-07-09,1,MLP-KTLim/llama-3-Korean-Bllossom-8B (Merge),llama3,289,8.03,0.774720564334845 MTSAIR/Cotype-Nano_bfloat16_91817ff717dd16d216304fa9d749e08fce2aa38d_True,MTSAIR/Cotype-Nano,91817ff717dd16d216304fa9d749e08fce2aa38d,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,13.2588792361465,TRUE,IFEval,0.374792217981622,37.4792217981622,BBH,0.386494096960149,14.4468700232412,MATH Level 5,0.0641993957703928,6.41993957703928,GPQA,0.27013422818792,2.68456375838927,MUSR,0.328916666666667,2.11458333333333,MMLU-PRO,0.247672872340426,16.4080969267139,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-22,2024-12-01,0,MTSAIR/Cotype-Nano,other,45,1.544,0.49328801555598 MTSAIR/MultiVerse_70B_bfloat16_063430cdc4d972a0884e3e3e3d45ea4afbdf71a2_False,MTSAIR/MultiVerse_70B,063430cdc4d972a0884e3e3e3d45ea4afbdf71a2,bfloat16,chatmodels,Original,LlamaForCausalLM,32.0051903084749,FALSE,IFEval,0.524918327814643,52.4918327814643,BBH,0.618313428493118,46.135898982415,MATH Level 5,0.178247734138973,17.8247734138973,GPQA,0.354026845637584,13.8702460850112,MUSR,0.473989583333333,18.8153645833333,MMLU-PRO,0.486037234042553,42.8930260047281,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-25,2024-06-29,0,MTSAIR/MultiVerse_70B,other,39,72.289,13.6018173834864 Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.1_bfloat16_1ed587f54f70334f495efb9c027acb03e96fe24f_True,Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.1,1ed587f54f70334f495efb9c027acb03e96fe24f,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,15.9289113532727,TRUE,IFEval,0.436141659685191,43.6141659685191,BBH,0.461510274452737,23.9901243984113,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.26258389261745,1.67785234899329,MUSR,0.327739583333333,0,MMLU-PRO,0.286319813829787,20.702201536643,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-06,2024-09-17,1,meta-llama/Meta-Llama-3-8B,llama3,4,8.03,0.8335691386634 -Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.3_bfloat16_d2578eb754d1c20efe604749296580f680950917_True,Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.3,d2578eb754d1c20efe604749296580f680950917,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.4902847861708,TRUE,IFEval,0.506358683847746,50.6358683847746,BBH,0.457158089967206,23.6988158923876,MATH Level 5,0.0694864048338369,6.94864048338369,GPQA,0.265939597315436,2.12527964205817,MUSR,0.342375,0.396875,MMLU-PRO,0.290226063829787,21.1362293144208,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-13,2024-08-06,1,meta-llama/Meta-Llama-3-8B,llama3,3,8.03,0.895420119077499 +Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.3_bfloat16_d2578eb754d1c20efe604749296580f680950917_True,Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.3,d2578eb754d1c20efe604749296580f680950917,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.4902847861708,TRUE,IFEval,0.506358683847746,50.6358683847746,BBH,0.457158089967206,23.6988158923876,MATH Level 5,0.0694864048338369,6.94864048338369,GPQA,0.265939597315436,2.12527964205817,MUSR,0.342375,0.396875,MMLU-PRO,0.290226063829787,21.1362293144208,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-13,2024-08-06,1,meta-llama/Meta-Llama-3-8B,llama3,4,8.03,0.895420119077499 Magpie-Align/Llama-3-8B-Magpie-Align-v0.1_bfloat16_a83ddac146fb2da1dd1bfa4069e336074d1439a8_True,Magpie-Align/Llama-3-8B-Magpie-Align-v0.1,a83ddac146fb2da1dd1bfa4069e336074d1439a8,bfloat16,chatmodels,Original,LlamaForCausalLM,16.4730942691102,TRUE,IFEval,0.411811770546594,41.1811770546594,BBH,0.481144156071485,26.6917608939245,MATH Level 5,0.033987915407855,3.3987915407855,GPQA,0.275167785234899,3.35570469798658,MUSR,0.304697916666667,1.92057291666667,MMLU-PRO,0.300615026595745,22.2905585106383,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-07-03,2,meta-llama/Meta-Llama-3-8B,llama3,10,8.03,0.906848539982643 Magpie-Align/Llama-3-8B-Magpie-Align-v0.1_float16_a83ddac146fb2da1dd1bfa4069e336074d1439a8_True,Magpie-Align/Llama-3-8B-Magpie-Align-v0.1,a83ddac146fb2da1dd1bfa4069e336074d1439a8,float16,chatmodels,Original,LlamaForCausalLM,16.3077709906493,TRUE,IFEval,0.402719229422377,40.2719229422377,BBH,0.478940810197055,26.2897120886545,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.276845637583893,3.57941834451902,MUSR,0.308697916666667,1.92057291666667,MMLU-PRO,0.300116356382979,22.2351507092199,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-07-03,2,meta-llama/Meta-Llama-3-8B,llama3,10,8.03,1.84953608154845 Magpie-Align/Llama-3-8B-Magpie-Align-v0.3_bfloat16_7e420ddd6ff48bf213dcab2a9ddb7845b80dd1aa_True,Magpie-Align/Llama-3-8B-Magpie-Align-v0.3,7e420ddd6ff48bf213dcab2a9ddb7845b80dd1aa,bfloat16,chatmodels,Original,LlamaForCausalLM,16.9115582373126,TRUE,IFEval,0.4497056698449,44.97056698449,BBH,0.456960506522001,24.311446807587,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.26510067114094,2.01342281879195,MUSR,0.340604166666667,3.7421875,MMLU-PRO,0.313414228723404,23.7126920803782,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-15,2024-08-06,2,meta-llama/Meta-Llama-3-8B,llama3,3,8.03,0.742289627896929 @@ -598,15 +607,16 @@ MaziyarPanahi/calme-2.6-qwen2-7b_bfloat16_ebfaae016a50f8922098a2a262ec3ca704504c MaziyarPanahi/calme-2.7-qwen2-7b_bfloat16_edc11a1baccedc04a5a4576ee4910fd8922ad47f_True,MaziyarPanahi/calme-2.7-qwen2-7b,edc11a1baccedc04a5a4576ee4910fd8922ad47f,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.342679034297,TRUE,IFEval,0.359230175933191,35.9230175933191,BBH,0.488317090131,28.912244614674,MATH Level 5,0.137462235649547,13.7462235649547,GPQA,0.291107382550336,5.48098434004475,MUSR,0.482427083333333,19.93671875,MMLU-PRO,0.370511968085106,30.0568853427896,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-27,2024-09-18,1,Qwen/Qwen2-7B,apache-2.0,2,7.616,1.36428028850371 MaziyarPanahi/calme-3.1-baguette-3b_bfloat16_4601b18deed3931c33907ae98060898e787c7758_True,MaziyarPanahi/calme-3.1-baguette-3b,4601b18deed3931c33907ae98060898e787c7758,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1324579033114,TRUE,IFEval,0.623436925136416,62.3436925136416,BBH,0.468333410429111,25.5076807577414,MATH Level 5,0.0490936555891239,4.90936555891239,GPQA,0.286073825503356,4.80984340044743,MUSR,0.400791666666667,8.565625,MMLU-PRO,0.339926861702128,26.6585401891253,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,1,3.085,0.731589720630309 MaziyarPanahi/calme-3.1-instruct-3b_bfloat16_3bbd7f1f7949dd7c3679a29a781a95bd1085dc19_True,MaziyarPanahi/calme-3.1-instruct-3b,3bbd7f1f7949dd7c3679a29a781a95bd1085dc19,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,20.2860433047707,TRUE,IFEval,0.433593975097187,43.3593975097187,BBH,0.48127301480431,27.3098959593399,MATH Level 5,0.104229607250755,10.4229607250755,GPQA,0.286073825503356,4.80984340044743,MUSR,0.395208333333333,7.40104166666667,MMLU-PRO,0.355718085106383,28.4131205673759,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,2,3.085,1.39366216973401 -MaziyarPanahi/calme-3.1-instruct-78b_bfloat16_7ccd7f1a55ae79af7969f721bb7055511cc6b986_True,MaziyarPanahi/calme-3.1-instruct-78b,7ccd7f1a55ae79af7969f721bb7055511cc6b986,bfloat16,chatmodels,Original,Qwen2ForCausalLM,51.1993731559107,TRUE,IFEval,0.813554701525286,81.3554701525286,BBH,0.730515449884041,62.4096827037011,MATH Level 5,0.387462235649547,38.7462235649547,GPQA,0.395973154362416,19.4630872483221,MUSR,0.5890625,36.4994791666667,MMLU-PRO,0.718500664893617,68.7222960992908,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-27,1,Removed,other,2,77.965,32.2189446468948 +MaziyarPanahi/calme-3.1-instruct-78b_bfloat16_7ccd7f1a55ae79af7969f721bb7055511cc6b986_True,MaziyarPanahi/calme-3.1-instruct-78b,7ccd7f1a55ae79af7969f721bb7055511cc6b986,bfloat16,chatmodels,Original,Qwen2ForCausalLM,51.1993731559107,TRUE,IFEval,0.813554701525286,81.3554701525286,BBH,0.730515449884041,62.4096827037011,MATH Level 5,0.387462235649547,38.7462235649547,GPQA,0.395973154362416,19.4630872483221,MUSR,0.5890625,36.4994791666667,MMLU-PRO,0.718500664893617,68.7222960992908,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-27,1,Removed,other,3,77.965,32.2189446468948 MaziyarPanahi/calme-3.1-llamaloi-3b_bfloat16_62547548c06bb22f0b82c2bda7ac466507314a4b_True,MaziyarPanahi/calme-3.1-llamaloi-3b,62547548c06bb22f0b82c2bda7ac466507314a4b,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.0052338092847,TRUE,IFEval,0.73751756450662,73.751756450662,BBH,0.458734000499888,23.7691655758483,MATH Level 5,0.167673716012085,16.7673716012085,GPQA,0.281040268456376,4.13870246085012,MUSR,0.351520833333333,1.10677083333333,MMLU-PRO,0.320478723404255,24.4976359338062,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,meta-llama/Llama-3.2-3B,llama3.2,1,3.213,1.19291766447292 MaziyarPanahi/calme-3.2-baguette-3b_bfloat16_bba8e602432bd467b64cabf9cb62326893060e60_True,MaziyarPanahi/calme-3.2-baguette-3b,bba8e602432bd467b64cabf9cb62326893060e60,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1406481081638,TRUE,IFEval,0.633828242396841,63.3828242396841,BBH,0.470862269902714,25.8657466507311,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.294463087248322,5.92841163310962,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.333776595744681,25.9751773049645,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,1,3.085,0.776012497501503 MaziyarPanahi/calme-3.2-instruct-3b_bfloat16_12347f5991157e752de6ba9f773a1bbc22445e3a_True,MaziyarPanahi/calme-3.2-instruct-3b,12347f5991157e752de6ba9f773a1bbc22445e3a,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.6566062728784,TRUE,IFEval,0.553319636342682,55.3319636342682,BBH,0.486564111037674,27.9767982423931,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.283557046979866,4.47427293064877,MUSR,0.404697916666667,8.78723958333333,MMLU-PRO,0.365275930851064,29.475103427896,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,0,3.086,0.743433169169365 -MaziyarPanahi/calme-3.2-instruct-78b_bfloat16_731f4daf584f822f1393731ccff1d58c7f06b99e_True,MaziyarPanahi/calme-3.2-instruct-78b,731f4daf584f822f1393731ccff1d58c7f06b99e,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,52.0184433947031,TRUE,IFEval,0.806260721552148,80.6260721552148,BBH,0.731861627209267,62.6094432829016,MATH Level 5,0.399546827794562,39.9546827794562,GPQA,0.402684563758389,20.3579418344519,MUSR,0.602364583333333,38.52890625,MMLU-PRO,0.730302526595745,70.0336140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-28,1,Removed,other,35,77.965,33.0055653548694 +MaziyarPanahi/calme-3.2-instruct-78b_bfloat16_731f4daf584f822f1393731ccff1d58c7f06b99e_True,MaziyarPanahi/calme-3.2-instruct-78b,731f4daf584f822f1393731ccff1d58c7f06b99e,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,52.0184433947031,TRUE,IFEval,0.806260721552148,80.6260721552148,BBH,0.731861627209267,62.6094432829016,MATH Level 5,0.399546827794562,39.9546827794562,GPQA,0.402684563758389,20.3579418344519,MUSR,0.602364583333333,38.52890625,MMLU-PRO,0.730302526595745,70.0336140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-28,1,Removed,other,36,77.965,33.0055653548694 MaziyarPanahi/calme-3.3-baguette-3b_bfloat16_66f9438922503e5616b6b4488e96fd9342d5efb0_True,MaziyarPanahi/calme-3.3-baguette-3b,66f9438922503e5616b6b4488e96fd9342d5efb0,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,21.0626896485596,TRUE,IFEval,0.635951497581971,63.5951497581971,BBH,0.467821729595752,25.5965941060964,MATH Level 5,0,0,GPQA,0.280201342281879,4.0268456375839,MUSR,0.392822916666667,7.13619791666667,MMLU-PRO,0.334192154255319,26.0213504728132,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,1,3.086,0.746922918806257 MaziyarPanahi/calme-3.3-instruct-3b_bfloat16_ea7d7fb442c981ecd44c5a9060ac6b062927f231_True,MaziyarPanahi/calme-3.3-instruct-3b,ea7d7fb442c981ecd44c5a9060ac6b062927f231,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,21.5477931531294,TRUE,IFEval,0.642321263137364,64.2321263137364,BBH,0.469334094276887,25.6821378185791,MATH Level 5,0,0,GPQA,0.282718120805369,4.36241610738255,MUSR,0.407427083333333,9.39505208333333,MMLU-PRO,0.330535239361702,25.6150265957447,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-07,2024-11-08,1,Qwen/Qwen2.5-3B,other,2,3.086,0.752548515201209 Minami-su/test-7B-00_bfloat16_c8e5b7745c921b5020192f0b3a553c63725048f9_True,Minami-su/test-7B-00,c8e5b7745c921b5020192f0b3a553c63725048f9,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.4357285793648,TRUE,IFEval,0.669049233810733,66.9049233810733,BBH,0.446612376561018,21.4899500189813,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.302852348993289,7.04697986577182,MUSR,0.412604166666667,10.3421875,MMLU-PRO,0.358793218085106,28.7548020094563,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-24,2024-12-24,0,Minami-su/test-7B-00,apache-2.0,0,3.808,0.750604105676129 Minami-su/test-7B-01_bfloat16_9af628070dff4480252a4d4e5f07a9884e3f71d4_True,Minami-su/test-7B-01,9af628070dff4480252a4d4e5f07a9884e3f71d4,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.5034629914445,TRUE,IFEval,0.673620438215047,67.3620438215047,BBH,0.442235942023975,20.8244942662569,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.307046979865772,7.60626398210291,MUSR,0.415302083333333,10.9794270833333,MMLU-PRO,0.353557180851064,28.1730200945627,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-24,2024-12-24,0,Minami-su/test-7B-01,apache-2.0,0,3.808,0.764518630513838 +Minami-su/test-v2-7B-00_bfloat16_fcba9bb21f9cf521dcd5d41749ccce77434fe4dc_True,Minami-su/test-v2-7B-00,fcba9bb21f9cf521dcd5d41749ccce77434fe4dc,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1203017292081,TRUE,IFEval,0.674719743613612,67.4719743613612,BBH,0.441598934459535,21.1907548239809,MATH Level 5,0,0,GPQA,0.291946308724832,5.59284116331097,MUSR,0.415427083333333,10.9950520833333,MMLU-PRO,0.347240691489362,27.4711879432624,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,0,Minami-su/test-v2-7B-00,apache-2.0,0,3.808,0.766724790387991 MultivexAI/Gladiator-Mini-Exp-1211-3B_float16_9f3f58da3fb4b1825c2b97effc421e7809c95848_True,MultivexAI/Gladiator-Mini-Exp-1211-3B,9f3f58da3fb4b1825c2b97effc421e7809c95848,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.2218576631953,TRUE,IFEval,0.68760887777763,68.760887777763,BBH,0.448437526630281,22.1160624932153,MATH Level 5,0.134441087613293,13.4441087613293,GPQA,0.272651006711409,3.02013422818792,MUSR,0.326,2.08333333333333,MMLU-PRO,0.315159574468085,23.9066193853428,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-11,2024-12-11,1,MultivexAI/Gladiator-Mini-Exp-1211-3B (Merge),mit,0,3,0.595781409541183 MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct_float16_1a3f3808cd5335fb71c88d3c2b681459c2420044_True,MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct,1a3f3808cd5335fb71c88d3c2b681459c2420044,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0388235605726,TRUE,IFEval,0.607874883087984,60.7874883087984,BBH,0.43697669924169,20.3954621362182,MATH Level 5,0.130664652567976,13.0664652567976,GPQA,0.263422818791946,1.78970917225951,MUSR,0.311458333333333,1.43229166666667,MMLU-PRO,0.304853723404255,22.761524822695,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-20,1,MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct (Merge),mit,0,1.606,0.601069112756674 MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct-V2_float16_b092e130c61aa44f2556b5db224b4df545fb51aa_True,MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct-V2,b092e130c61aa44f2556b5db224b4df545fb51aa,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.3522550117212,TRUE,IFEval,0.621538628616515,62.1538628616515,BBH,0.438883390990549,20.6512481387192,MATH Level 5,0.137462235649547,13.7462235649547,GPQA,0.263422818791946,1.78970917225951,MUSR,0.300822916666667,1.26953125,MMLU-PRO,0.302526595744681,22.5029550827423,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct-V2 (Merge),mit,0,1.606,0.590788011956624 @@ -658,9 +668,9 @@ NotASI/FineTome-v1.5-Llama3.2-3B-1007_float16_6c6e71fbcff6c00d04a3fd69084af20bf2 NousResearch/Hermes-2-Pro-Llama-3-8B_float16_bc265d1781299ed2045214289c927c207439a729_True,NousResearch/Hermes-2-Pro-Llama-3-8B,bc265d1781299ed2045214289c927c207439a729,float16,chatmodels,Original,LlamaForCausalLM,21.7049203338117,TRUE,IFEval,0.536183991808402,53.6183991808402,BBH,0.507112624310082,30.667993420825,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.292785234899329,5.70469798657718,MUSR,0.426239583333333,11.2466145833333,MMLU-PRO,0.305186170212766,22.798463356974,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-30,2024-06-13,1,NousResearch/Meta-Llama-3-8B,llama3,413,8.031,0.749983206264044 NousResearch/Hermes-2-Pro-Mistral-7B_bfloat16_09317b1d8da639b5d9af77c06aa17cde0f0f91c0_True,NousResearch/Hermes-2-Pro-Mistral-7B,09317b1d8da639b5d9af77c06aa17cde0f0f91c0,bfloat16,chatmodels,Original,MistralForCausalLM,21.7021075222127,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.499543533049808,29.427578860536,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.273489932885906,3.13199105145414,MUSR,0.43759375,14.1325520833333,MMLU-PRO,0.294630984042553,21.625664893617,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-11,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,487,7.242,0.472797519360034 NousResearch/Hermes-2-Theta-Llama-3-8B_bfloat16_885173e97ab8572b444f7db1290d5d0386e26816_True,NousResearch/Hermes-2-Theta-Llama-3-8B,885173e97ab8572b444f7db1290d5d0386e26816,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.7757883439893,TRUE,IFEval,0.651788365980044,65.1788365980044,BBH,0.520667226091187,32.0460738480758,MATH Level 5,0.0959214501510574,9.59214501510574,GPQA,0.303691275167785,7.15883668903803,MUSR,0.394895833333333,8.36197916666667,MMLU-PRO,0.336851728723404,26.3168587470449,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-05,2024-07-11,2,NousResearch/Meta-Llama-3-8B,apache-2.0,196,8.03,0.743922417596867 -NousResearch/Hermes-3-Llama-3.1-70B_bfloat16_093242c69a91f8d9d5b8094c380b88772f9bd7f8_True,NousResearch/Hermes-3-Llama-3.1-70B,093242c69a91f8d9d5b8094c380b88772f9bd7f8,bfloat16,chatmodels,Original,LlamaForCausalLM,37.4825450944456,TRUE,IFEval,0.76614383169989,76.614383169989,BBH,0.675578064138748,53.7654086913006,MATH Level 5,0.148036253776435,14.8036253776435,GPQA,0.361577181208054,14.8769574944072,MUSR,0.494895833333333,23.4286458333333,MMLU-PRO,0.47265625,41.40625,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-29,2024-08-28,1,meta-llama/Meta-Llama-3.1-70B,llama3,99,70.554,11.2078909209213 -NousResearch/Hermes-3-Llama-3.1-8B_bfloat16_aabb745a717e133b74dcae23195d2635cf5f38cc_True,NousResearch/Hermes-3-Llama-3.1-8B,aabb745a717e133b74dcae23195d2635cf5f38cc,bfloat16,chatmodels,Original,LlamaForCausalLM,23.49087671148,TRUE,IFEval,0.617017291896612,61.7017291896612,BBH,0.517745254014125,30.724096614148,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.297818791946309,6.3758389261745,MUSR,0.4369375,13.6171875,MMLU-PRO,0.31391289893617,23.7680998817967,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-28,2024-08-28,1,meta-llama/Meta-Llama-3.1-8B,llama3,270,8.03,0.905807900142943 -NousResearch/Hermes-3-Llama-3.2-3B_bfloat16_f6a109fe836b13b6905f8c16a7388f2f557c3974_True,NousResearch/Hermes-3-Llama-3.2-3B,f6a109fe836b13b6905f8c16a7388f2f557c3974,bfloat16,chatmodels,Original,LlamaForCausalLM,15.116238224353,TRUE,IFEval,0.38248624760081,38.248624760081,BBH,0.435199015067149,20.1871880374546,MATH Level 5,0.0317220543806647,3.17220543806647,GPQA,0.275167785234899,3.35570469798658,MUSR,0.403020833333333,8.57760416666667,MMLU-PRO,0.254404920212766,17.1561022458629,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-20,1,Removed,llama3,107,3.213,1.10155586552599 +NousResearch/Hermes-3-Llama-3.1-70B_bfloat16_093242c69a91f8d9d5b8094c380b88772f9bd7f8_True,NousResearch/Hermes-3-Llama-3.1-70B,093242c69a91f8d9d5b8094c380b88772f9bd7f8,bfloat16,chatmodels,Original,LlamaForCausalLM,37.4825450944456,TRUE,IFEval,0.76614383169989,76.614383169989,BBH,0.675578064138748,53.7654086913006,MATH Level 5,0.148036253776435,14.8036253776435,GPQA,0.361577181208054,14.8769574944072,MUSR,0.494895833333333,23.4286458333333,MMLU-PRO,0.47265625,41.40625,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-29,2024-08-28,1,meta-llama/Meta-Llama-3.1-70B,llama3,100,70.554,11.2078909209213 +NousResearch/Hermes-3-Llama-3.1-8B_bfloat16_aabb745a717e133b74dcae23195d2635cf5f38cc_True,NousResearch/Hermes-3-Llama-3.1-8B,aabb745a717e133b74dcae23195d2635cf5f38cc,bfloat16,chatmodels,Original,LlamaForCausalLM,23.49087671148,TRUE,IFEval,0.617017291896612,61.7017291896612,BBH,0.517745254014125,30.724096614148,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.297818791946309,6.3758389261745,MUSR,0.4369375,13.6171875,MMLU-PRO,0.31391289893617,23.7680998817967,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-28,2024-08-28,1,meta-llama/Meta-Llama-3.1-8B,llama3,272,8.03,0.905807900142943 +NousResearch/Hermes-3-Llama-3.2-3B_bfloat16_f6a109fe836b13b6905f8c16a7388f2f557c3974_True,NousResearch/Hermes-3-Llama-3.2-3B,f6a109fe836b13b6905f8c16a7388f2f557c3974,bfloat16,chatmodels,Original,LlamaForCausalLM,15.116238224353,TRUE,IFEval,0.38248624760081,38.248624760081,BBH,0.435199015067149,20.1871880374546,MATH Level 5,0.0317220543806647,3.17220543806647,GPQA,0.275167785234899,3.35570469798658,MUSR,0.403020833333333,8.57760416666667,MMLU-PRO,0.254404920212766,17.1561022458629,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-20,1,Removed,llama3,109,3.213,1.10155586552599 NousResearch/Nous-Hermes-2-Mistral-7B-DPO_bfloat16_ebec0a691037d38955727d6949798429a63929dd_True,NousResearch/Nous-Hermes-2-Mistral-7B-DPO,ebec0a691037d38955727d6949798429a63929dd,bfloat16,chatmodels,Original,MistralForCausalLM,21.0376463902847,TRUE,IFEval,0.57625101397625,57.625101397625,BBH,0.485265366546524,27.7925456583661,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.292785234899329,5.70469798657718,MUSR,0.399979166666667,8.33072916666667,MMLU-PRO,0.301529255319149,22.3921394799054,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-18,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,170,7.242,0.474598918698818 NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO_bfloat16_286ae6737d048ad1d965c2e830864df02db50f2f_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,286ae6737d048ad1d965c2e830864df02db50f2f,bfloat16,chatmodels,Original,MixtralForCausalLM,27.290249854483,TRUE,IFEval,0.58968980083955,58.968980083955,BBH,0.553885138403382,37.1077837913399,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.321308724832215,9.50782997762864,MUSR,0.459541666666667,16.6760416666667,MMLU-PRO,0.366605718085106,29.6228575650118,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-11,2024-07-27,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,420,46.703,12.8651437241499 NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT_bfloat16_4c06af2684730f75a6874b95e8bf6058105d9612_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT,4c06af2684730f75a6874b95e8bf6058105d9612,bfloat16,chatmodels,Original,MixtralForCausalLM,21.8410108914617,TRUE,IFEval,0.573078321076965,57.3078321076965,BBH,0.505786845402664,30.5943127788644,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.302013422818792,6.93512304250559,MUSR,0.421375,11.1385416666667,MMLU-PRO,0.306599069148936,22.9554521276596,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-26,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,55,46.703,10.3879398461721 @@ -674,7 +684,7 @@ NousResearch/Yarn-Mistral-7b-64k_bfloat16_0273c624561fcecc8e8f4030492a9307aa60f9 NousResearch/Yarn-Solar-10b-32k_bfloat16_ec3158b5276ac6644ddbdb36ccf6f9a106c98ede_False,NousResearch/Yarn-Solar-10b-32k,ec3158b5276ac6644ddbdb36ccf6f9a106c98ede,bfloat16,continuouslypretrained,Original,LlamaForCausalLM,15.7186653122834,FALSE,IFEval,0.194815312260358,19.4815312260358,BBH,0.498685915232507,28.9948243602567,MATH Level 5,0.0294561933534743,2.94561933534743,GPQA,0.302852348993289,7.04697986577182,MUSR,0.414645833333333,10.5973958333333,MMLU-PRO,0.327210771276596,25.2456412529551,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-17,2024-06-12,0,NousResearch/Yarn-Solar-10b-32k,apache-2.0,10,10,1.3884383632907 NousResearch/Yarn-Solar-10b-64k_bfloat16_703818628a5e8ef637e48e8dbeb3662aa0497aff_False,NousResearch/Yarn-Solar-10b-64k,703818628a5e8ef637e48e8dbeb3662aa0497aff,bfloat16,continuouslypretrained,Original,LlamaForCausalLM,15.1242860962001,FALSE,IFEval,0.1988867316498,19.88867316498,BBH,0.492199079542265,28.3957141535958,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.302013422818792,6.93512304250559,MUSR,0.4014375,9.01302083333334,MMLU-PRO,0.314827127659575,23.8696808510638,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-17,2024-06-12,0,NousResearch/Yarn-Solar-10b-64k,apache-2.0,15,10,0.763752873050906 NucleusAI/nucleus-22B-token-500B_bfloat16_49bb1a47c0d32b4bfa6630a4eff04a857adcd4ca_False,NucleusAI/nucleus-22B-token-500B,49bb1a47c0d32b4bfa6630a4eff04a857adcd4ca,bfloat16,pretrained,Original,LlamaForCausalLM,1.63341634858811,FALSE,IFEval,0.0256541532023919,2.56541532023919,BBH,0.291980078012147,1.88799906857083,MATH Level 5,0,0,GPQA,0.25,0,MUSR,0.351052083333333,3.54817708333333,MMLU-PRO,0.116190159574468,1.79890661938534,TRUE,FALSE,FALSE,FALSE,FALSE,2023-10-06,2024-06-26,0,NucleusAI/nucleus-22B-token-500B,mit,25,21.828,0.59481771866259 -NyxKrage/Microsoft_Phi-4_bfloat16_d6e415636fc3435ec1cf543db77cf228b6ce6bdd_False,NyxKrage/Microsoft_Phi-4,d6e415636fc3435ec1cf543db77cf228b6ce6bdd,bfloat16,chatmodels,Original,Phi3ForCausalLM,29.8294269050018,FALSE,IFEval,0.0585269307659233,5.85269307659233,BBH,0.669056230532287,52.4278484582049,MATH Level 5,0.284743202416918,28.4743202416918,GPQA,0.406040268456376,20.8053691275168,MUSR,0.503354166666667,23.7859375,MMLU-PRO,0.528673537234043,47.6303930260047,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-13,2024-12-21,0,NyxKrage/Microsoft_Phi-4,other,40,7.33,0.894481540571054 +NyxKrage/Microsoft_Phi-4_bfloat16_d6e415636fc3435ec1cf543db77cf228b6ce6bdd_False,NyxKrage/Microsoft_Phi-4,d6e415636fc3435ec1cf543db77cf228b6ce6bdd,bfloat16,chatmodels,Original,Phi3ForCausalLM,29.8294269050018,FALSE,IFEval,0.0585269307659233,5.85269307659233,BBH,0.669056230532287,52.4278484582049,MATH Level 5,0.284743202416918,28.4743202416918,GPQA,0.406040268456376,20.8053691275168,MUSR,0.503354166666667,23.7859375,MMLU-PRO,0.528673537234043,47.6303930260047,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-13,2024-12-21,0,NyxKrage/Microsoft_Phi-4,other,42,7.33,0.894481540571054 OEvortex/HelpingAI-15B_float16_fcc5d4eeee08c07680a2560a302de3eaa5d6f550_True,OEvortex/HelpingAI-15B,fcc5d4eeee08c07680a2560a302de3eaa5d6f550,float16,pretrained,Original,LlamaForCausalLM,4.51549560366053,TRUE,IFEval,0.203009126894418,20.3009126894418,BBH,0.293600697785376,1.81538055149423,MATH Level 5,0,0,GPQA,0.25755033557047,1.00671140939597,MUSR,0.361875,2.734375,MMLU-PRO,0.111120345744681,1.23559397163121,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-11,2024-07-13,0,OEvortex/HelpingAI-15B,other,12,15.323,1.22723730885868 OEvortex/HelpingAI-3B-reloaded_float16_aaee653fea06ba322e7a9ed15530db605cc3b382_True,OEvortex/HelpingAI-3B-reloaded,aaee653fea06ba322e7a9ed15530db605cc3b382,float16,continuouslypretrained,Original,LlamaForCausalLM,14.5921868977018,TRUE,IFEval,0.464668191509639,46.4668191509639,BBH,0.412851289790406,16.9857404490785,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.263422818791946,1.78970917225951,MUSR,0.352447916666667,4.28932291666667,MMLU-PRO,0.259474734042553,17.719414893617,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-31,2024-10-31,0,OEvortex/HelpingAI-3B-reloaded,other,1,2.81,0.561626448418379 OEvortex/HelpingAI2-9B_float16_b45a18cf41d0d438d71d79687e098ec60dd0aec1_True,OEvortex/HelpingAI2-9B,b45a18cf41d0d438d71d79687e098ec60dd0aec1,float16,pretrained,Original,LlamaForCausalLM,17.4181053099944,TRUE,IFEval,0.441312384473198,44.1312384473198,BBH,0.484461764198312,27.0732416091733,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.258389261744966,1.11856823266219,MUSR,0.371083333333333,6.31875,MMLU-PRO,0.289976728723404,21.1085254137116,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-16,2024-10-11,0,OEvortex/HelpingAI2-9B,other,23,8.903,1.04065141094332 @@ -708,9 +718,9 @@ OpenBuddy/openbuddy-zero-56b-v21.2-32k_float16_c7a1a4a6e798f75d1d3219ab9ff9f2692 OpenLeecher/llama3-8b-lima_bfloat16_237a2bcb240eecd9355a091f839e42ba3d31bda5_True,OpenLeecher/llama3-8b-lima,237a2bcb240eecd9355a091f839e42ba3d31bda5,bfloat16,chatmodels,Original,LlamaForCausalLM,14.7610818338696,TRUE,IFEval,0.437065874102936,43.7065874102936,BBH,0.429582863282299,19.573064881965,MATH Level 5,0.0347432024169184,3.47432024169184,GPQA,0.238255033557047,0,MUSR,0.371270833333333,3.7421875,MMLU-PRO,0.262632978723404,18.0703309692671,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-10-01,0,Removed,"",0,8.03,0.958929366024108 OpenScholar/Llama-3.1_OpenScholar-8B_bfloat16_e26aeb22af568bd8d01ffde86ebbd13c3cf4fcc5_True,OpenScholar/Llama-3.1_OpenScholar-8B,e26aeb22af568bd8d01ffde86ebbd13c3cf4fcc5,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.5836887529002,TRUE,IFEval,0.606401015970957,60.6401015970957,BBH,0.520774083445067,32.4039212044879,MATH Level 5,0.142749244712991,14.2749244712991,GPQA,0.281879194630873,4.25055928411633,MUSR,0.427510416666667,11.8388020833333,MMLU-PRO,0.370844414893617,30.0938238770686,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-15,2024-12-03,1,OpenScholar/Llama-3.1_OpenScholar-8B (Merge),apache-2.0,52,8,0.632606719439222 Orenguteng/Llama-3.1-8B-Lexi-Uncensored_bfloat16_56ac439ab4c7826871493ffbe2d49f2100a98e97_True,Orenguteng/Llama-3.1-8B-Lexi-Uncensored,56ac439ab4c7826871493ffbe2d49f2100a98e97,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,26.8604132222972,TRUE,IFEval,0.77768432204329,77.768432204329,BBH,0.505726165264264,29.2425432417686,MATH Level 5,0.13821752265861,13.821752265861,GPQA,0.271812080536913,2.9082774049217,MUSR,0.387114583333333,6.42265625,MMLU-PRO,0.378989361702128,30.9988179669031,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-07-29,0,Orenguteng/Llama-3.1-8B-Lexi-Uncensored,llama3.1,42,8.03,0.856735067560064 -Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2_bfloat16_2340f8fbcd2452125a798686ca90b882a08fb0d9_True,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,2340f8fbcd2452125a798686ca90b882a08fb0d9,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,27.9251209060615,TRUE,IFEval,0.779158189160317,77.9158189160317,BBH,0.508400801878393,29.6870327456312,MATH Level 5,0.169184290030212,16.9184290030212,GPQA,0.282718120805369,4.36241610738255,MUSR,0.384291666666667,7.76979166666667,MMLU-PRO,0.378075132978723,30.8972369976359,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-09,2024-08-28,0,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,llama3.1,131,8.03,0.869686314484719 +Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2_bfloat16_2340f8fbcd2452125a798686ca90b882a08fb0d9_True,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,2340f8fbcd2452125a798686ca90b882a08fb0d9,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,27.9251209060615,TRUE,IFEval,0.779158189160317,77.9158189160317,BBH,0.508400801878393,29.6870327456312,MATH Level 5,0.169184290030212,16.9184290030212,GPQA,0.282718120805369,4.36241610738255,MUSR,0.384291666666667,7.76979166666667,MMLU-PRO,0.378075132978723,30.8972369976359,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-09,2024-08-28,0,Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2,llama3.1,133,8.03,0.869686314484719 Orion-zhen/Qwen2.5-7B-Instruct-Uncensored_bfloat16_33c24657b4394fc430ad90b5d413e5985ce8e292_True,Orion-zhen/Qwen2.5-7B-Instruct-Uncensored,33c24657b4394fc430ad90b5d413e5985ce8e292,bfloat16,chatmodels,Original,Qwen2ForCausalLM,27.9897115235622,TRUE,IFEval,0.720431787656751,72.0431787656751,BBH,0.54739186521573,35.8324528622882,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.302852348993289,7.04697986577182,MUSR,0.436135416666667,13.58359375,MMLU-PRO,0.442652925531915,38.0725472813239,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-26,2024-10-19,1,Orion-zhen/Qwen2.5-7B-Instruct-Uncensored (Merge),gpl-3.0,14,7.616,1.11681194245401 -Orion-zhen/phi-4-abliterated_bfloat16_90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77_False,Orion-zhen/phi-4-abliterated,90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77,bfloat16,fine-tunedondomain-specificdatasets,Original,Phi3ForCausalLM,29.7021385186012,FALSE,IFEval,0.0576027163481784,5.76027163481784,BBH,0.669823930666478,52.4571292257837,MATH Level 5,0.285498489425982,28.5498489425982,GPQA,0.404362416107383,20.5816554809843,MUSR,0.500625,23.178125,MMLU-PRO,0.529172207446809,47.6858008274232,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-17,2024-12-20,1,Orion-zhen/phi-4-abliterated (Merge),gpl-3.0,6,7.33,0.894350962480824 +Orion-zhen/phi-4-abliterated_bfloat16_90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77_False,Orion-zhen/phi-4-abliterated,90e3bfb1a9507d931c19faa5c2084d3f8d0bfb77,bfloat16,fine-tunedondomain-specificdatasets,Original,Phi3ForCausalLM,29.7021385186012,FALSE,IFEval,0.0576027163481784,5.76027163481784,BBH,0.669823930666478,52.4571292257837,MATH Level 5,0.285498489425982,28.5498489425982,GPQA,0.404362416107383,20.5816554809843,MUSR,0.500625,23.178125,MMLU-PRO,0.529172207446809,47.6858008274232,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-17,2024-12-20,1,Orion-zhen/phi-4-abliterated (Merge),gpl-3.0,7,7.33,0.894350962480824 P0x0/Astra-v1-12B_bfloat16_c706e253f8d8fa838b505cbec0e1a6aeec545abc_False,P0x0/Astra-v1-12B,c706e253f8d8fa838b505cbec0e1a6aeec545abc,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.674299882431,FALSE,IFEval,0.280594378471345,28.0594378471345,BBH,0.521450648413898,31.8099073411794,MATH Level 5,0.109516616314199,10.9516616314199,GPQA,0.313758389261745,8.50111856823266,MUSR,0.4051875,11.3817708333333,MMLU-PRO,0.346077127659575,27.3419030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-21,2024-09-23,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,2,12.248,1.60567337209763 PJMixers/LLaMa-3-CursedStock-v2.0-8B_bfloat16_d47cc29df363f71ffaf6cd21ac4bdeefa27359db_True,PJMixers/LLaMa-3-CursedStock-v2.0-8B,d47cc29df363f71ffaf6cd21ac4bdeefa27359db,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,24.2038982437966,TRUE,IFEval,0.633079118959915,63.3079118959915,BBH,0.527115950402997,32.5636117089159,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.274328859060403,3.24384787472036,MUSR,0.385625,8.03645833333334,MMLU-PRO,0.355634973404255,28.4038859338062,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-26,2024-06-27,1,PJMixers/LLaMa-3-CursedStock-v2.0-8B (Merge),llama3,11,8.03,1.40269205586454 PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B_bfloat16_c5b8d7fa43a013e434630a7f89f3bf15ac19606f_True,PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B,c5b8d7fa43a013e434630a7f89f3bf15ac19606f,bfloat16,chatmodels,Original,LlamaForCausalLM,28.7938572465617,TRUE,IFEval,0.787101557201559,78.7101557201559,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.194108761329305,19.4108761329305,GPQA,0.291946308724832,5.59284116331097,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376745345744681,30.7494828605201,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-18,2024-12-18,1,PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B (Merge),llama3.1,1,6.523,1.29636573579394 @@ -723,7 +733,7 @@ PJMixers-Dev/LLaMa-3.2-Instruct-JankMixBread-v0.1-3B_bfloat16_19faf7463cab41a249 PJMixers-Dev/Qwen2.5-RomboTiesTest-7B_bfloat16_61e798861cae00ff1108708fc89ed18bccaf1170_True,PJMixers-Dev/Qwen2.5-RomboTiesTest-7B,61e798861cae00ff1108708fc89ed18bccaf1170,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,27.0184610243921,TRUE,IFEval,0.755802382123876,75.5802382123876,BBH,0.539867346152084,34.9314565166555,MATH Level 5,0,0,GPQA,0.297818791946309,6.3758389261745,MUSR,0.403364583333333,8.72057291666667,MMLU-PRO,0.428523936170213,36.5026595744681,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,3.808,0.671382807956332 Parissa3/test-model_bfloat16_7021138dac98d930f1ce0ebe186583c0813d6f48_False,Parissa3/test-model,7021138dac98d930f1ce0ebe186583c0813d6f48,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,20.7585057280105,FALSE,IFEval,0.38825649277251,38.825649277251,BBH,0.519391676180176,32.8390324037912,MATH Level 5,0.0657099697885196,6.57099697885196,GPQA,0.294463087248322,5.92841163310962,MUSR,0.46853125,17.5330729166667,MMLU-PRO,0.305684840425532,22.8538711583924,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-16,2024-11-16,1,Parissa3/test-model (Merge),"",0,7.242,0.473352902911403 PocketDoc/Dans-Instruct-CoreCurriculum-12b_bfloat16_c50db5ba880b7edc0efd32a7f3b9d2f051c3f4a6_True,PocketDoc/Dans-Instruct-CoreCurriculum-12b,c50db5ba880b7edc0efd32a7f3b9d2f051c3f4a6,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,9.40282371026575,TRUE,IFEval,0.219145201398955,21.9145201398955,BBH,0.378873907524027,13.23256495304,MATH Level 5,0.0490936555891239,4.90936555891239,GPQA,0.282718120805369,4.36241610738255,MUSR,0.4095625,9.56197916666667,MMLU-PRO,0.121924867021277,2.4360963356974,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-01,0,Removed,"",0,12,1.5885381520372 -PocketDoc/Dans-PersonalityEngine-V1.1.0-12b_bfloat16_e58b4d12f79522209478fed022b65675a18b877f_True,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b,e58b4d12f79522209478fed022b65675a18b877f,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,26.1385999215711,TRUE,IFEval,0.707467297880734,70.7467297880734,BBH,0.536104624319959,33.666618823463,MATH Level 5,0.0506042296072508,5.06042296072508,GPQA,0.286912751677852,4.92170022371365,MUSR,0.458677083333333,17.3013020833333,MMLU-PRO,0.326213430851064,25.1348256501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b (Merge),apache-2.0,11,6.124,2.11734611148732 +PocketDoc/Dans-PersonalityEngine-V1.1.0-12b_bfloat16_e58b4d12f79522209478fed022b65675a18b877f_True,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b,e58b4d12f79522209478fed022b65675a18b877f,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,26.1385999215711,TRUE,IFEval,0.707467297880734,70.7467297880734,BBH,0.536104624319959,33.666618823463,MATH Level 5,0.0506042296072508,5.06042296072508,GPQA,0.286912751677852,4.92170022371365,MUSR,0.458677083333333,17.3013020833333,MMLU-PRO,0.326213430851064,25.1348256501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,PocketDoc/Dans-PersonalityEngine-V1.1.0-12b (Merge),apache-2.0,12,6.124,2.11734611148732 PocketDoc/Dans-PersonalityEngine-v1.0.0-8b_bfloat16_c64612e1eee1ddb3aa064a25eba8921ec3d94325_True,PocketDoc/Dans-PersonalityEngine-v1.0.0-8b,c64612e1eee1ddb3aa064a25eba8921ec3d94325,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.7794202230361,TRUE,IFEval,0.498190357141274,49.8190357141274,BBH,0.473255442591494,25.6879597690821,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.285234899328859,4.6979865771812,MUSR,0.35415625,3.93619791666667,MMLU-PRO,0.306515957446809,22.9462174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-08,2024-10-08,1,PocketDoc/Dans-PersonalityEngine-v1.0.0-8b (Merge),apache-2.0,4,8.03,0.900974258409386 PranavHarshan/LaMistral-V4_bfloat16_b373c2a1ab08823b6b119899f807793c96ef7888_True,PranavHarshan/LaMistral-V4,b373c2a1ab08823b6b119899f807793c96ef7888,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.2107651768593,TRUE,IFEval,0.623861354539289,62.3861354539289,BBH,0.518425534258647,31.0913486817948,MATH Level 5,0.0687311178247734,6.87311178247734,GPQA,0.328020134228188,10.4026845637584,MUSR,0.364291666666667,5.63645833333333,MMLU-PRO,0.359873670212766,28.8748522458629,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-01,2024-10-05,1,PranavHarshan/LaMistral-V4 (Merge),apache-2.0,1,8.03,0.697232370090008 PranavHarshan/MedNarra-X1_bfloat16_9fe294e7fd69ec56f0b7fa1a23759eed070f44bf_False,PranavHarshan/MedNarra-X1,9fe294e7fd69ec56f0b7fa1a23759eed070f44bf,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.128681543434,FALSE,IFEval,0.43384331351924,43.384331351924,BBH,0.463716681797742,23.5234951323421,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.307885906040268,7.71812080536913,MUSR,0.35403125,2.45390625,MMLU-PRO,0.343085106382979,27.0094562647754,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-08,2024-10-09,1,PranavHarshan/MedNarra-X1 (Merge),"",0,8.03,0.676160938867545 @@ -742,7 +752,7 @@ PrimeIntellect/INTELLECT-1-Instruct_bfloat16_a672cbe91f9bd4df58f90619ca3c2acb2eb PuxAI/LUA_model_float16_f098319bc21c8710652f75febe0d8a110058458f_False,PuxAI/LUA_model,f098319bc21c8710652f75febe0d8a110058458f,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,5.14872374821187,FALSE,IFEval,0.228213362766349,22.8213362766349,BBH,0.287677810298844,1.8156684085008,MATH Level 5,0,0,GPQA,0.26006711409396,1.34228187919463,MUSR,0.348385416666667,3.54817708333333,MMLU-PRO,0.112283909574468,1.36487884160756,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-18,0,PuxAI/LUA_model,"",0,3.693,0.630092113903009 PygmalionAI/pygmalion-6b_float16_2a0d74449c8fbf0378194e95f64aa92e16297294_False,PygmalionAI/pygmalion-6b,2a0d74449c8fbf0378194e95f64aa92e16297294,float16,fine-tunedondomain-specificdatasets,Original,GPTJForCausalLM,5.3923596589092,FALSE,IFEval,0.20910406610017,20.910406610017,BBH,0.3198894464386,5.08957714398891,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.249161073825503,0,MUSR,0.368354166666667,3.7109375,MMLU-PRO,0.118351063829787,2.03900709219858,TRUE,FALSE,FALSE,FALSE,TRUE,2023-01-07,2024-06-12,0,PygmalionAI/pygmalion-6b,creativeml-openrail-m,736,6,31.9231192804799 Q-bert/MetaMath-1B_float16_da62756f069aba78d07d4c76108e246cb91dbc35_True,Q-bert/MetaMath-1B,da62756f069aba78d07d4c76108e246cb91dbc35,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.3242479106733,TRUE,IFEval,0.530039184918239,53.0039184918239,BBH,0.345068636779295,8.43461064483256,MATH Level 5,0,0,GPQA,0.251677852348993,0.223713646532442,MUSR,0.328916666666667,0.78125,MMLU-PRO,0.14951795212766,5.50199468085107,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-30,0,Removed,"",0,1.236,0.465027993931676 -Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1416,32.764,10.2103897762396 +Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1425,32.764,10.2103897762396 Qwen/Qwen1.5-0.5B_bfloat16_8f445e3628f3500ee69f24e1303c9f10f5342a39_False,Qwen/Qwen1.5-0.5B,8f445e3628f3500ee69f24e1303c9f10f5342a39,bfloat16,pretrained,Original,Qwen2ForCausalLM,5.13701708767239,FALSE,IFEval,0.17056077873376,17.056077873376,BBH,0.315353865914256,5.03547583679937,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.254194630872483,0.559284116331097,MUSR,0.361625,4.303125,MMLU-PRO,0.130734707446809,3.41496749408983,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-13,0,Qwen/Qwen1.5-0.5B,other,147,0.62,0.978737373550742 Qwen/Qwen1.5-0.5B-Chat_bfloat16_4d14e384a4b037942bb3f3016665157c8bcb70ea_True,Qwen/Qwen1.5-0.5B-Chat,4d14e384a4b037942bb3f3016665157c8bcb70ea,bfloat16,chatmodels,Original,Qwen2ForCausalLM,5.56486903979377,TRUE,IFEval,0.180727137328954,18.0727137328954,BBH,0.316666215203671,4.31803263693806,MATH Level 5,0,0,GPQA,0.269295302013423,2.57270693512304,MUSR,0.383708333333333,6.06354166666667,MMLU-PRO,0.121259973404255,2.36221926713948,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-31,2024-06-12,0,Qwen/Qwen1.5-0.5B-Chat,other,75,0.62,0.54974439031725 Qwen/Qwen1.5-1.8B_bfloat16_7846de7ed421727b318d6605a0bfab659da2c067_False,Qwen/Qwen1.5-1.8B,7846de7ed421727b318d6605a0bfab659da2c067,bfloat16,pretrained,Original,Qwen2ForCausalLM,9.18137570437486,FALSE,IFEval,0.215423963971152,21.5423963971152,BBH,0.347612155836631,9.75990158772794,MATH Level 5,0.0264350453172205,2.64350453172205,GPQA,0.305369127516779,7.38255033557047,MUSR,0.360510416666667,3.96380208333333,MMLU-PRO,0.188164893617021,9.79609929078014,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-22,2024-06-13,0,Qwen/Qwen1.5-1.8B,other,44,1.837,0.948870786599621 @@ -766,40 +776,40 @@ Qwen/Qwen2-1.5B-Instruct_bfloat16_ba1cf1846d7df0a0591d6c00649f57e798519da8_True, Qwen/Qwen2-57B-A14B_bfloat16_973e466c39ba76372a2ae464dbca0af3f5a5a2a9_False,Qwen/Qwen2-57B-A14B,973e466c39ba76372a2ae464dbca0af3f5a5a2a9,bfloat16,pretrained,Original,Qwen2MoeForCausalLM,25.0338731324107,FALSE,IFEval,0.311269653408512,31.1269653408512,BBH,0.561820493868417,38.8759890503419,MATH Level 5,0.186555891238671,18.6555891238671,GPQA,0.306208053691275,7.49440715883669,MUSR,0.417375,10.5385416666667,MMLU-PRO,0.491605718085106,43.5117464539007,TRUE,FALSE,TRUE,FALSE,TRUE,2024-05-22,2024-06-13,0,Qwen/Qwen2-57B-A14B,apache-2.0,48,57.409,107.031477464734 Qwen/Qwen2-57B-A14B-Instruct_bfloat16_5ea455a449e61a92a5b194ee06be807647d3e8b5_True,Qwen/Qwen2-57B-A14B-Instruct,5ea455a449e61a92a5b194ee06be807647d3e8b5,bfloat16,chatmodels,Original,Qwen2MoeForCausalLM,29.780722801392,TRUE,IFEval,0.63377837471243,63.377837471243,BBH,0.588760696353205,41.7859177348425,MATH Level 5,0.0876132930513595,8.76132930513595,GPQA,0.331375838926175,10.8501118568233,MUSR,0.436135416666667,14.18359375,MMLU-PRO,0.457529920212766,39.7255466903073,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-04,2024-08-14,1,Qwen/Qwen2-57B-A14B,apache-2.0,78,57.409,42.5062475032037 Qwen/Qwen2-72B_bfloat16_87993795c78576318087f70b43fbf530eb7789e7_False,Qwen/Qwen2-72B,87993795c78576318087f70b43fbf530eb7789e7,bfloat16,pretrained,Original,Qwen2ForCausalLM,35.4818471661096,FALSE,IFEval,0.382361024304401,38.2361024304401,BBH,0.661734029856643,51.8561311869552,MATH Level 5,0.312688821752266,31.2688821752266,GPQA,0.394295302013423,19.2393736017897,MUSR,0.470364583333333,19.72890625,MMLU-PRO,0.573055186170213,52.5616873522459,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-26,0,Qwen/Qwen2-72B,other,194,72.706,64.0622792398665 -Qwen/Qwen2-72B-Instruct_bfloat16_1af63c698f59c4235668ec9c1395468cb7cd7e79_False,Qwen/Qwen2-72B-Instruct,1af63c698f59c4235668ec9c1395468cb7cd7e79,bfloat16,chatmodels,Original,Qwen2ForCausalLM,42.9143041555209,FALSE,IFEval,0.7989168738946,79.89168738946,BBH,0.697730968386067,57.483009118763,MATH Level 5,0.376888217522659,37.6888217522659,GPQA,0.37248322147651,16.331096196868,MUSR,0.456010416666667,17.16796875,MMLU-PRO,0.540309175531915,48.9232417257683,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-28,2024-06-26,1,Qwen/Qwen2-72B,other,691,72.706,37.5539744227 +Qwen/Qwen2-72B-Instruct_bfloat16_1af63c698f59c4235668ec9c1395468cb7cd7e79_False,Qwen/Qwen2-72B-Instruct,1af63c698f59c4235668ec9c1395468cb7cd7e79,bfloat16,chatmodels,Original,Qwen2ForCausalLM,42.9143041555209,FALSE,IFEval,0.7989168738946,79.89168738946,BBH,0.697730968386067,57.483009118763,MATH Level 5,0.376888217522659,37.6888217522659,GPQA,0.37248322147651,16.331096196868,MUSR,0.456010416666667,17.16796875,MMLU-PRO,0.540309175531915,48.9232417257683,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-28,2024-06-26,1,Qwen/Qwen2-72B,other,692,72.706,37.5539744227 Qwen/Qwen2-7B_bfloat16_453ed1575b739b5b03ce3758b23befdb0967f40e_False,Qwen/Qwen2-7B,453ed1575b739b5b03ce3758b23befdb0967f40e,bfloat16,pretrained,Original,Qwen2ForCausalLM,23.9377502573001,FALSE,IFEval,0.31486677571067,31.486677571067,BBH,0.531531595001889,34.7111362027534,MATH Level 5,0.204682779456193,20.4682779456193,GPQA,0.304530201342282,7.27069351230425,MUSR,0.443916666666667,14.3229166666667,MMLU-PRO,0.418301196808511,35.3667996453901,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-04,2024-06-09,0,Qwen/Qwen2-7B,apache-2.0,147,7.616,1.28058225557584 Qwen/Qwen2-7B-Instruct_bfloat16_41c66b0be1c3081f13defc6bdf946c2ef240d6a6_True,Qwen/Qwen2-7B-Instruct,41c66b0be1c3081f13defc6bdf946c2ef240d6a6,bfloat16,chatmodels,Original,Qwen2ForCausalLM,24.9029516291134,TRUE,IFEval,0.567907596288958,56.7907596288958,BBH,0.554478156379319,37.8083909231017,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.297818791946309,6.3758389261745,MUSR,0.392791666666667,7.365625,MMLU-PRO,0.384724069148936,31.6360076832151,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-04,2024-06-12,1,Qwen/Qwen2-7B,apache-2.0,604,7.616,1.04203898585749 Qwen/Qwen2-Math-72B-Instruct_bfloat16_5c267882f3377bcfc35882f8609098a894eeeaa8_True,Qwen/Qwen2-Math-72B-Instruct,5c267882f3377bcfc35882f8609098a894eeeaa8,bfloat16,chatmodels,Original,Qwen2ForCausalLM,35.1508663678517,TRUE,IFEval,0.569381463405985,56.9381463405985,BBH,0.634337660025181,47.9601995073491,MATH Level 5,0.381419939577039,38.1419939577039,GPQA,0.368288590604027,15.7718120805369,MUSR,0.451697916666667,15.72890625,MMLU-PRO,0.427277260638298,36.364140070922,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-08,2024-08-19,0,Qwen/Qwen2-Math-72B-Instruct,other,87,72.706,12.1682476948271 Qwen/Qwen2-Math-7B_bfloat16_47a44ff4136da8960adbab02b2326787086bcf6c_True,Qwen/Qwen2-Math-7B,47a44ff4136da8960adbab02b2326787086bcf6c,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,11.9413924471103,TRUE,IFEval,0.26870481433707,26.870481433707,BBH,0.386954741074792,14.0644944888713,MATH Level 5,0.243202416918429,24.3202416918429,GPQA,0.263422818791946,1.78970917225951,MUSR,0.359333333333333,2.41666666666667,MMLU-PRO,0.11968085106383,2.18676122931442,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-08,2024-08-19,0,Qwen/Qwen2-Math-7B,apache-2.0,13,7.616,1.5630360629051 -Qwen/Qwen2-VL-72B-Instruct_bfloat16_f400120e59a6196b024298b7d09fb517f742db7d_True,Qwen/Qwen2-VL-72B-Instruct,f400120e59a6196b024298b7d09fb517f742db7d,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,37.9127528860119,TRUE,IFEval,0.598232689264485,59.8232689264485,BBH,0.694628729233868,56.3112338791251,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.38758389261745,18.34451901566,MUSR,0.44921875,15.8856770833333,MMLU-PRO,0.57172539893617,52.41393321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-10-20,1,Qwen/Qwen2-VL-72B-Instruct (Merge),other,231,73.406,27.2497165156002 -Qwen/Qwen2-VL-7B-Instruct_bfloat16_51c47430f97dd7c74aa1fa6825e68a813478097f_True,Qwen/Qwen2-VL-7B-Instruct,51c47430f97dd7c74aa1fa6825e68a813478097f,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,24.2148096194201,TRUE,IFEval,0.459921896124505,45.9921896124505,BBH,0.546450715906999,35.8771031449895,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.319630872483222,9.2841163310962,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-28,2024-10-20,1,Qwen/Qwen2-VL-7B-Instruct (Merge),apache-2.0,978,8.291,1.05438228472396 +Qwen/Qwen2-VL-72B-Instruct_bfloat16_f400120e59a6196b024298b7d09fb517f742db7d_True,Qwen/Qwen2-VL-72B-Instruct,f400120e59a6196b024298b7d09fb517f742db7d,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,37.9127528860119,TRUE,IFEval,0.598232689264485,59.8232689264485,BBH,0.694628729233868,56.3112338791251,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.38758389261745,18.34451901566,MUSR,0.44921875,15.8856770833333,MMLU-PRO,0.57172539893617,52.41393321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-10-20,1,Qwen/Qwen2-VL-72B-Instruct (Merge),other,233,73.406,27.2497165156002 +Qwen/Qwen2-VL-7B-Instruct_bfloat16_51c47430f97dd7c74aa1fa6825e68a813478097f_True,Qwen/Qwen2-VL-7B-Instruct,51c47430f97dd7c74aa1fa6825e68a813478097f,bfloat16,multimodal,Original,Qwen2VLForConditionalGeneration,24.2148096194201,TRUE,IFEval,0.459921896124505,45.9921896124505,BBH,0.546450715906999,35.8771031449895,MATH Level 5,0.0619335347432024,6.19335347432024,GPQA,0.319630872483222,9.2841163310962,MUSR,0.4375,13.5541666666667,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-28,2024-10-20,1,Qwen/Qwen2-VL-7B-Instruct (Merge),apache-2.0,981,8.291,1.05438228472396 Qwen/Qwen2.5-0.5B_bfloat16_2630d3d2321bc1f1878f702166d1b2af019a7310_False,Qwen/Qwen2.5-0.5B,2630d3d2321bc1f1878f702166d1b2af019a7310,bfloat16,pretrained,Original,Qwen2ForCausalLM,6.31089339476025,FALSE,IFEval,0.162717146061339,16.271714606134,BBH,0.327481481511966,6.95396163488226,MATH Level 5,0.0249244712990937,2.49244712990937,GPQA,0.246644295302013,0,MUSR,0.343333333333333,2.08333333333333,MMLU-PRO,0.190575132978723,10.0639036643026,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-0.5B,apache-2.0,147,0.5,1.16534262881835 -Qwen/Qwen2.5-0.5B-Instruct_bfloat16_a8b602d9dafd3a75d382e62757d83d89fca3be54_True,Qwen/Qwen2.5-0.5B-Instruct,a8b602d9dafd3a75d382e62757d83d89fca3be54,bfloat16,chatmodels,Original,Qwen2ForCausalLM,8.14064731927608,TRUE,IFEval,0.307122878407071,30.7122878407071,BBH,0.334072921493727,8.43486361058883,MATH Level 5,0,0,GPQA,0.25755033557047,1.00671140939597,MUSR,0.332885416666667,0.944010416666666,MMLU-PRO,0.169714095744681,7.74601063829787,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-19,1,Qwen/Qwen2.5-0.5B,apache-2.0,151,0.5,0.63082445281977 -Qwen/Qwen2.5-0.5B-Instruct_float16_7ae557604adf67be50417f59c2c2f167def9a775_True,Qwen/Qwen2.5-0.5B-Instruct,7ae557604adf67be50417f59c2c2f167def9a775,float16,chatmodels,Original,Qwen2ForCausalLM,8.38297184669106,TRUE,IFEval,0.315291205113543,31.5291205113543,BBH,0.332191642954914,8.16950226818277,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.3341875,1.3734375,MMLU-PRO,0.171958111702128,7.99534574468085,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-0.5B,apache-2.0,151,0.494,0.618575974583338 +Qwen/Qwen2.5-0.5B-Instruct_bfloat16_a8b602d9dafd3a75d382e62757d83d89fca3be54_True,Qwen/Qwen2.5-0.5B-Instruct,a8b602d9dafd3a75d382e62757d83d89fca3be54,bfloat16,chatmodels,Original,Qwen2ForCausalLM,8.14064731927608,TRUE,IFEval,0.307122878407071,30.7122878407071,BBH,0.334072921493727,8.43486361058883,MATH Level 5,0,0,GPQA,0.25755033557047,1.00671140939597,MUSR,0.332885416666667,0.944010416666666,MMLU-PRO,0.169714095744681,7.74601063829787,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-19,1,Qwen/Qwen2.5-0.5B,apache-2.0,152,0.5,0.63082445281977 +Qwen/Qwen2.5-0.5B-Instruct_float16_7ae557604adf67be50417f59c2c2f167def9a775_True,Qwen/Qwen2.5-0.5B-Instruct,7ae557604adf67be50417f59c2c2f167def9a775,float16,chatmodels,Original,Qwen2ForCausalLM,8.38297184669106,TRUE,IFEval,0.315291205113543,31.5291205113543,BBH,0.332191642954914,8.16950226818277,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.3341875,1.3734375,MMLU-PRO,0.171958111702128,7.99534574468085,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-0.5B,apache-2.0,152,0.494,0.618575974583338 Qwen/Qwen2.5-1.5B_bfloat16_e5dfabbcffd9b0c7b31d89b82c5a6b72e663f32c_False,Qwen/Qwen2.5-1.5B,e5dfabbcffd9b0c7b31d89b82c5a6b72e663f32c,bfloat16,pretrained,Original,Qwen2ForCausalLM,13.8023486940494,FALSE,IFEval,0.267430417957686,26.7430417957686,BBH,0.407795094513661,16.6604651676919,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.285234899328859,4.6979865771812,MUSR,0.35759375,5.26588541666667,MMLU-PRO,0.285488696808511,20.6098552009456,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-1.5B,apache-2.0,48,1.5,1.24850101000351 -Qwen/Qwen2.5-1.5B-Instruct_bfloat16_5fee7c4ed634dc66c6e318c8ac2897b8b9154536_True,Qwen/Qwen2.5-1.5B-Instruct,5fee7c4ed634dc66c6e318c8ac2897b8b9154536,bfloat16,chatmodels,Original,Qwen2ForCausalLM,15.0317176008589,TRUE,IFEval,0.447556926732182,44.7556926732182,BBH,0.428898274042291,19.809786497359,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.255872483221477,0.782997762863532,MUSR,0.3663125,3.1890625,MMLU-PRO,0.279920212765957,19.9911347517731,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-1.5B,apache-2.0,256,1.5,0.687189331195425 +Qwen/Qwen2.5-1.5B-Instruct_bfloat16_5fee7c4ed634dc66c6e318c8ac2897b8b9154536_True,Qwen/Qwen2.5-1.5B-Instruct,5fee7c4ed634dc66c6e318c8ac2897b8b9154536,bfloat16,chatmodels,Original,Qwen2ForCausalLM,15.0317176008589,TRUE,IFEval,0.447556926732182,44.7556926732182,BBH,0.428898274042291,19.809786497359,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.255872483221477,0.782997762863532,MUSR,0.3663125,3.1890625,MMLU-PRO,0.279920212765957,19.9911347517731,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-1.5B,apache-2.0,257,1.5,0.687189331195425 Qwen/Qwen2.5-14B_bfloat16_83a1904df002b00bc8db6f877821cb77dbb363b0_False,Qwen/Qwen2.5-14B,83a1904df002b00bc8db6f877821cb77dbb363b0,bfloat16,pretrained,Original,Qwen2ForCausalLM,31.7496528240654,FALSE,IFEval,0.369446402212795,36.9446402212795,BBH,0.616051493531774,45.0783124049849,MATH Level 5,0.277945619335347,27.7945619335347,GPQA,0.381711409395973,17.5615212527964,MUSR,0.450239583333333,15.91328125,MMLU-PRO,0.52485039893617,47.2055998817967,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-14B,apache-2.0,47,14.77,5.58592135172473 Qwen/Qwen2.5-14B-Instruct_bfloat16_f55224c616ca27d4bcf28969a156de12c98981cf_True,Qwen/Qwen2.5-14B-Instruct,f55224c616ca27d4bcf28969a156de12c98981cf,bfloat16,chatmodels,Original,Qwen2ForCausalLM,32.1830727842617,TRUE,IFEval,0.815777692079239,81.5777692079239,BBH,0.639045370590622,48.3607066128271,MATH Level 5,0,0,GPQA,0.322147651006711,9.61968680089485,MUSR,0.4100625,10.1578125,MMLU-PRO,0.490442154255319,43.3824615839244,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-14B,apache-2.0,145,14.77,1.7736503203376 Qwen/Qwen2.5-32B_bfloat16_ff23665d01c3665be5fdb271d18a62090b65c06d_False,Qwen/Qwen2.5-32B,ff23665d01c3665be5fdb271d18a62090b65c06d,bfloat16,pretrained,Original,Qwen2ForCausalLM,37.9827910715109,FALSE,IFEval,0.407664995545154,40.7664995545154,BBH,0.677052244872651,53.954752851332,MATH Level 5,0.354984894259819,35.4984894259819,GPQA,0.411912751677852,21.5883668903803,MUSR,0.497833333333333,22.6958333333333,MMLU-PRO,0.580535239361702,53.3928043735225,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-32B,apache-2.0,58,32.764,5.87488554274725 -Qwen/Qwen2.5-32B-Instruct_bfloat16_70e8dfb9ad18a7d499f765fe206ff065ed8ca197_True,Qwen/Qwen2.5-32B-Instruct,70e8dfb9ad18a7d499f765fe206ff065ed8ca197,bfloat16,chatmodels,Original,Qwen2ForCausalLM,36.174184974139,TRUE,IFEval,0.834612162395777,83.4612162395777,BBH,0.691252508013434,56.4893482615939,MATH Level 5,0,0,GPQA,0.338087248322148,11.744966442953,MUSR,0.426125,13.4989583333333,MMLU-PRO,0.566655585106383,51.8506205673759,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-32B,apache-2.0,156,32.764,5.75248317034287 +Qwen/Qwen2.5-32B-Instruct_bfloat16_70e8dfb9ad18a7d499f765fe206ff065ed8ca197_True,Qwen/Qwen2.5-32B-Instruct,70e8dfb9ad18a7d499f765fe206ff065ed8ca197,bfloat16,chatmodels,Original,Qwen2ForCausalLM,36.174184974139,TRUE,IFEval,0.834612162395777,83.4612162395777,BBH,0.691252508013434,56.4893482615939,MATH Level 5,0,0,GPQA,0.338087248322148,11.744966442953,MUSR,0.426125,13.4989583333333,MMLU-PRO,0.566655585106383,51.8506205673759,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-32B,apache-2.0,158,32.764,5.75248317034287 Qwen/Qwen2.5-3B_bfloat16_e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34_False,Qwen/Qwen2.5-3B,e4aa5ac50aa507415cda96cc99eb77ad0a3d2d34,bfloat16,pretrained,Original,Qwen2ForCausalLM,17.1083089890835,FALSE,IFEval,0.268954152759124,26.8954152759124,BBH,0.461247534101163,24.3042417263717,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.297818791946309,6.3758389261745,MUSR,0.430333333333333,11.7583333333333,MMLU-PRO,0.3203125,24.4791666666667,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-27,0,Qwen/Qwen2.5-3B,other,45,3.086,3.81050747400589 Qwen/Qwen2.5-3B-Instruct_bfloat16_82f42baa094a9600e39ccd80d34058aeeb3abbc1_True,Qwen/Qwen2.5-3B-Instruct,82f42baa094a9600e39ccd80d34058aeeb3abbc1,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.0313443188007,TRUE,IFEval,0.647491987925371,64.7491987925372,BBH,0.469276665604885,25.8013939440886,MATH Level 5,0,0,GPQA,0.272651006711409,3.02013422818792,MUSR,0.396791666666667,7.565625,MMLU-PRO,0.325465425531915,25.0517139479905,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,1,Qwen/Qwen2.5-3B,other,120,3,1.38847430558096 Qwen/Qwen2.5-72B_bfloat16_587cc4061cf6a7cc0d429d05c109447e5cf063af_False,Qwen/Qwen2.5-72B,587cc4061cf6a7cc0d429d05c109447e5cf063af,bfloat16,pretrained,Original,Qwen2ForCausalLM,38.3656148716295,FALSE,IFEval,0.413710067066495,41.3710067066495,BBH,0.679732067069485,54.6150578016369,MATH Level 5,0.386706948640483,38.6706948640483,GPQA,0.405201342281879,20.6935123042506,MUSR,0.477125,19.640625,MMLU-PRO,0.596825132978723,55.2027925531915,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-72B,other,49,72.706,18.0919265899938 -Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,629,72.706,33.0067683243991 +Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,632,72.706,33.0067683243991 Qwen/Qwen2.5-7B_bfloat16_57597c00770845ceba45271ba1b24c94bbcc7baf_False,Qwen/Qwen2.5-7B,57597c00770845ceba45271ba1b24c94bbcc7baf,bfloat16,pretrained,Original,Qwen2ForCausalLM,24.9869343450417,FALSE,IFEval,0.337447971382598,33.7447971382598,BBH,0.541630376778862,35.8134732875478,MATH Level 5,0.188821752265861,18.8821752265861,GPQA,0.324664429530201,9.95525727069351,MUSR,0.442427083333333,14.13671875,MMLU-PRO,0.436502659574468,37.3891843971631,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-15,2024-09-19,0,Qwen/Qwen2.5-7B,apache-2.0,87,7.616,3.02796087914288 -Qwen/Qwen2.5-7B-Instruct_bfloat16_52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac_True,Qwen/Qwen2.5-7B-Instruct,52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.8667753266146,TRUE,IFEval,0.7585251576927,75.85251576927,BBH,0.53942319682991,34.8921167587655,MATH Level 5,0,0,GPQA,0.291107382550336,5.48098434004475,MUSR,0.40203125,8.45390625,MMLU-PRO,0.428690159574468,36.5211288416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-7B,apache-2.0,372,7.616,2.16827148311528 +Qwen/Qwen2.5-7B-Instruct_bfloat16_52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac_True,Qwen/Qwen2.5-7B-Instruct,52e20a6f5f475e5c8f6a8ebda4ae5fa6b1ea22ac,bfloat16,chatmodels,Original,Qwen2ForCausalLM,26.8667753266146,TRUE,IFEval,0.7585251576927,75.85251576927,BBH,0.53942319682991,34.8921167587655,MATH Level 5,0,0,GPQA,0.291107382550336,5.48098434004475,MUSR,0.40203125,8.45390625,MMLU-PRO,0.428690159574468,36.5211288416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-18,1,Qwen/Qwen2.5-7B,apache-2.0,373,7.616,2.16827148311528 Qwen/Qwen2.5-Coder-14B_bfloat16_1db30eb5ec86a6e51d8981818ee2910370b3010d_True,Qwen/Qwen2.5-Coder-14B,1db30eb5ec86a6e51d8981818ee2910370b3010d,bfloat16,pretrained,Original,Qwen2ForCausalLM,24.7661116962997,TRUE,IFEval,0.347265256186917,34.7265256186917,BBH,0.586486009174123,40.523002115363,MATH Level 5,0.221299093655589,22.1299093655589,GPQA,0.292785234899329,5.70469798657718,MUSR,0.387364583333333,6.38723958333334,MMLU-PRO,0.452127659574468,39.1252955082742,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-08,2024-11-12,1,Qwen/Qwen2.5-Coder-14B (Merge),apache-2.0,22,14.77,3.63262520075326 -Qwen/Qwen2.5-Coder-14B-Instruct_bfloat16_1a62978099f9b19f72fdd191988ff958abb18561_True,Qwen/Qwen2.5-Coder-14B-Instruct,1a62978099f9b19f72fdd191988ff958abb18561,bfloat16,chatmodels,Original,Qwen2ForCausalLM,31.1787254167968,TRUE,IFEval,0.690756082749327,69.0756082749327,BBH,0.614029642366133,44.2200182156684,MATH Level 5,0.268126888217523,26.8126888217523,GPQA,0.304530201342282,7.27069351230425,MUSR,0.391458333333333,7.03229166666667,MMLU-PRO,0.393949468085106,32.6610520094563,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-11-12,1,Qwen/Qwen2.5-Coder-14B-Instruct (Merge),apache-2.0,62,14.77,1.38321406525897 +Qwen/Qwen2.5-Coder-14B-Instruct_bfloat16_1a62978099f9b19f72fdd191988ff958abb18561_True,Qwen/Qwen2.5-Coder-14B-Instruct,1a62978099f9b19f72fdd191988ff958abb18561,bfloat16,chatmodels,Original,Qwen2ForCausalLM,31.1787254167968,TRUE,IFEval,0.690756082749327,69.0756082749327,BBH,0.614029642366133,44.2200182156684,MATH Level 5,0.268126888217523,26.8126888217523,GPQA,0.304530201342282,7.27069351230425,MUSR,0.391458333333333,7.03229166666667,MMLU-PRO,0.393949468085106,32.6610520094563,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-11-12,1,Qwen/Qwen2.5-Coder-14B-Instruct (Merge),apache-2.0,63,14.77,1.38321406525897 Qwen/Qwen2.5-Coder-32B_float16_2e12b5f7bc878d424d222e224ed40aee564ec45f_False,Qwen/Qwen2.5-Coder-32B,2e12b5f7bc878d424d222e224ed40aee564ec45f,float16,pretrained,Original,Qwen2ForCausalLM,33.2120108702677,FALSE,IFEval,0.436341130422834,43.6341130422834,BBH,0.640395506550809,48.5112134061417,MATH Level 5,0.305891238670695,30.5891238670695,GPQA,0.346476510067114,12.8635346756152,MUSR,0.4528125,15.8682291666667,MMLU-PRO,0.530252659574468,47.8058510638298,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-08,2024-12-10,1,Qwen/Qwen2.5-Coder-32B (Merge),apache-2.0,91,32,4.6902502672998 -Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1364,32,4.69438966297979 +Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1368,32,4.69438966297979 Qwen/Qwen2.5-Coder-7B_bfloat16_097b213c52760d22753af1aa5cbdba94b5c99506_True,Qwen/Qwen2.5-Coder-7B,097b213c52760d22753af1aa5cbdba94b5c99506,bfloat16,pretrained,Original,Qwen2ForCausalLM,19.2094905389622,TRUE,IFEval,0.344592348302504,34.4592348302504,BBH,0.485564055342148,28.4389441152555,MATH Level 5,0.191842900302115,19.1842900302115,GPQA,0.259228187919463,1.23042505592841,MUSR,0.344854166666667,2.1734375,MMLU-PRO,0.367935505319149,29.7706117021277,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-21,1,Qwen/Qwen2.5-Coder-7B (Merge),apache-2.0,83,7.616,2.30176716800796 -Qwen/Qwen2.5-Coder-7B-Instruct_bfloat16_3030861ab8e72c6155e1821631bf977ef40d3e5b_True,Qwen/Qwen2.5-Coder-7B-Instruct,3030861ab8e72c6155e1821631bf977ef40d3e5b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,22.4254329651823,TRUE,IFEval,0.610147741326347,61.0147741326347,BBH,0.500797698622455,28.9385040453791,MATH Level 5,0.033987915407855,3.3987915407855,GPQA,0.291946308724832,5.59284116331097,MUSR,0.407270833333333,9.47552083333333,MMLU-PRO,0.335189494680851,26.1321660756501,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,371,7.616,1.77985748125157 -Qwen/Qwen2.5-Coder-7B-Instruct_float16_f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5_True,Qwen/Qwen2.5-Coder-7B-Instruct,f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5,float16,chatmodels,Original,Qwen2ForCausalLM,22.5245158164521,TRUE,IFEval,0.614718945730661,61.4718945730661,BBH,0.499904855031131,28.7265779689503,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.293624161073826,5.8165548098434,MUSR,0.4099375,9.87552083333333,MMLU-PRO,0.335438829787234,26.1598699763593,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,371,7.616,0.697647347897138 +Qwen/Qwen2.5-Coder-7B-Instruct_bfloat16_3030861ab8e72c6155e1821631bf977ef40d3e5b_True,Qwen/Qwen2.5-Coder-7B-Instruct,3030861ab8e72c6155e1821631bf977ef40d3e5b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,22.4254329651823,TRUE,IFEval,0.610147741326347,61.0147741326347,BBH,0.500797698622455,28.9385040453791,MATH Level 5,0.033987915407855,3.3987915407855,GPQA,0.291946308724832,5.59284116331097,MUSR,0.407270833333333,9.47552083333333,MMLU-PRO,0.335189494680851,26.1321660756501,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,373,7.616,1.77985748125157 +Qwen/Qwen2.5-Coder-7B-Instruct_float16_f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5_True,Qwen/Qwen2.5-Coder-7B-Instruct,f784f10a7b2aac91bd26e6dbe7dccce691cd4ac5,float16,chatmodels,Original,Qwen2ForCausalLM,22.5245158164521,TRUE,IFEval,0.614718945730661,61.4718945730661,BBH,0.499904855031131,28.7265779689503,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.293624161073826,5.8165548098434,MUSR,0.4099375,9.87552083333333,MMLU-PRO,0.335438829787234,26.1598699763593,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-11-07,1,Qwen/Qwen2.5-Coder-7B-Instruct (Merge),apache-2.0,373,7.616,0.697647347897138 Qwen/Qwen2.5-Math-72B-Instruct_bfloat16_3743c8fd46b002d105c1d28d180f1e531df1d40f_True,Qwen/Qwen2.5-Math-72B-Instruct,3743c8fd46b002d105c1d28d180f1e531df1d40f,bfloat16,chatmodels,Original,Qwen2ForCausalLM,29.6476372762452,TRUE,IFEval,0.400346635815193,40.0346635815193,BBH,0.645226663780376,48.9660960294212,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.331375838926175,10.8501118568233,MUSR,0.447270833333333,16.3421875,MMLU-PRO,0.481216755319149,42.3574172576832,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-29,2,Qwen/Qwen2.5-72B,other,22,72.706,28.6768849752573 Qwen/Qwen2.5-Math-7B_bfloat16_8daf1d676c3f24ddec5a99c5cff00a5c0e1c441c_True,Qwen/Qwen2.5-Math-7B,8daf1d676c3f24ddec5a99c5cff00a5c0e1c441c,bfloat16,continuouslypretrained,Original,Qwen2ForCausalLM,17.8366571562897,TRUE,IFEval,0.245998395368733,24.5998395368733,BBH,0.445463937284094,22.0087606795866,MATH Level 5,0.305135951661631,30.5135951661631,GPQA,0.293624161073826,5.8165548098434,MUSR,0.37809375,4.99505208333333,MMLU-PRO,0.271775265957447,19.0861406619385,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-09-21,1,Qwen/Qwen2.5-7B,apache-2.0,20,7.616,1.33972974562764 -Qwen/Qwen2.5-Math-7B-Instruct_bfloat16_b3b4c5794bf4b68c1978bb3525afc5e0d0d6fcc4_True,Qwen/Qwen2.5-Math-7B-Instruct,b3b4c5794bf4b68c1978bb3525afc5e0d0d6fcc4,bfloat16,chatmodels,Original,Qwen2ForCausalLM,16.5063129078039,TRUE,IFEval,0.263583957233474,26.3583957233474,BBH,0.438762734452786,21.489765755272,MATH Level 5,0.265105740181269,26.5105740181269,GPQA,0.261744966442953,1.56599552572707,MUSR,0.364729166666667,2.89114583333333,MMLU-PRO,0.281998005319149,20.2220005910165,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-19,2024-09-19,2,Qwen/Qwen2.5-7B,apache-2.0,42,7,1.13926656088631 +Qwen/Qwen2.5-Math-7B-Instruct_bfloat16_b3b4c5794bf4b68c1978bb3525afc5e0d0d6fcc4_True,Qwen/Qwen2.5-Math-7B-Instruct,b3b4c5794bf4b68c1978bb3525afc5e0d0d6fcc4,bfloat16,chatmodels,Original,Qwen2ForCausalLM,16.5063129078039,TRUE,IFEval,0.263583957233474,26.3583957233474,BBH,0.438762734452786,21.489765755272,MATH Level 5,0.265105740181269,26.5105740181269,GPQA,0.261744966442953,1.56599552572707,MUSR,0.364729166666667,2.89114583333333,MMLU-PRO,0.281998005319149,20.2220005910165,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-19,2024-09-19,2,Qwen/Qwen2.5-7B,apache-2.0,43,7,1.13926656088631 RESMPDEV/Qwen2-Wukong-0.5B_bfloat16_52c58a4aa3d0b44c363c5761fa658243f5c53943_True,RESMPDEV/Qwen2-Wukong-0.5B,52c58a4aa3d0b44c363c5761fa658243f5c53943,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,4.95036347711133,TRUE,IFEval,0.185423565029677,18.5423565029677,BBH,0.308451428837168,4.19666315993673,MATH Level 5,0,0,GPQA,0.236577181208054,0,MUSR,0.352479166666667,3.3265625,MMLU-PRO,0.132729388297872,3.63659869976359,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-06-30,0,RESMPDEV/Qwen2-Wukong-0.5B,apache-2.0,6,0.63,0.987269093125126 -RLHFlow/ArmoRM-Llama3-8B-v0.1_bfloat16_eb2676d20da2f2d41082289d23c59b9f7427f955_True,RLHFlow/ArmoRM-Llama3-8B-v0.1,eb2676d20da2f2d41082289d23c59b9f7427f955,bfloat16,chatmodels,Original,LlamaForRewardModelWithGating,4.70548740930265,TRUE,IFEval,0.189670075399939,18.9670075399939,BBH,0.287646744678814,1.74944787031375,MATH Level 5,0,0,GPQA,0.249161073825503,0,MUSR,0.394802083333333,6.65026041666667,MMLU-PRO,0.107795877659574,0.866208628841606,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-23,2024-10-08,0,RLHFlow/ArmoRM-Llama3-8B-v0.1,llama3,161,7.511,0.92352291228196 +RLHFlow/ArmoRM-Llama3-8B-v0.1_bfloat16_eb2676d20da2f2d41082289d23c59b9f7427f955_True,RLHFlow/ArmoRM-Llama3-8B-v0.1,eb2676d20da2f2d41082289d23c59b9f7427f955,bfloat16,chatmodels,Original,LlamaForRewardModelWithGating,4.70548740930265,TRUE,IFEval,0.189670075399939,18.9670075399939,BBH,0.287646744678814,1.74944787031375,MATH Level 5,0,0,GPQA,0.249161073825503,0,MUSR,0.394802083333333,6.65026041666667,MMLU-PRO,0.107795877659574,0.866208628841606,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-23,2024-10-08,0,RLHFlow/ArmoRM-Llama3-8B-v0.1,llama3,162,7.511,0.92352291228196 RLHFlow/LLaMA3-iterative-DPO-final_bfloat16_40b73bd07a019795837f80579fe95470484ca82b_True,RLHFlow/LLaMA3-iterative-DPO-final,40b73bd07a019795837f80579fe95470484ca82b,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.6363431297776,TRUE,IFEval,0.53401086893886,53.401086893886,BBH,0.505825718273373,29.7877602720978,MATH Level 5,0,0,GPQA,0.283557046979866,4.47427293064877,MUSR,0.367270833333333,5.07552083333334,MMLU-PRO,0.325714760638298,25.0794178486998,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-17,2024-06-26,0,RLHFlow/LLaMA3-iterative-DPO-final,llama3,40,8.03,1.89274652696707 RWKV/rwkv-raven-14b_float16_359c0649b4f1d10a26ebea32908035bc00d152ee_False,RWKV/rwkv-raven-14b,359c0649b4f1d10a26ebea32908035bc00d152ee,float16,fine-tunedondomain-specificdatasets,Original,RwkvForCausalLM,3.88505660140927,FALSE,IFEval,0.0768372363107666,7.68372363107666,BBH,0.33070411765529,6.76376506130334,MATH Level 5,0,0,GPQA,0.229026845637584,0,MUSR,0.395145833333333,7.19322916666667,MMLU-PRO,0.115026595744681,1.66962174940898,FALSE,FALSE,FALSE,FALSE,FALSE,2023-05-05,2024-07-08,0,RWKV/rwkv-raven-14b,"",55,14,1.59062906993106 Rakuten/RakutenAI-7B_float16_c687b10cbf1aa6c34868904b62ecfcef2e0946bf_False,Rakuten/RakutenAI-7B,c687b10cbf1aa6c34868904b62ecfcef2e0946bf,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,11.5469783767466,FALSE,IFEval,0.155597148898257,15.5597148898257,BBH,0.431490526136154,20.9820523129145,MATH Level 5,0.0196374622356495,1.96374622356495,GPQA,0.289429530201342,5.2572706935123,MUSR,0.3738125,4.65989583333333,MMLU-PRO,0.287732712765957,20.8591903073286,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-18,2024-09-06,0,Rakuten/RakutenAI-7B,apache-2.0,46,7.373,0.641848681233742 @@ -833,7 +843,7 @@ Sakalti/Saba2-14B-Preview_float16_e8a44ff1844a15780aab1d60f670e07a17b8ccb8_False Sakalti/Sailor-japanese_float16__False,Sakalti/Sailor-japanese,"",float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,4.46774965709104,FALSE,IFEval,0.160468667579799,16.0468667579799,BBH,0.291258360296278,1.72179128807351,MATH Level 5,0,0,GPQA,0.253355704697987,0.447427293064876,MUSR,0.391177083333333,6.76380208333334,MMLU-PRO,0.116439494680851,1.82661052009456,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-22,0,Removed,"",0,0.494,1.73631652384882 Sakalti/llama-3-yanyuedao-8b-instruct_bfloat16_d36d76a88f6af38e923be426623ed1211e7099d8_False,Sakalti/llama-3-yanyuedao-8b-instruct,d36d76a88f6af38e923be426623ed1211e7099d8,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,13.7721958190546,FALSE,IFEval,0.218571168942849,21.8571168942849,BBH,0.434978490552475,20.593160052038,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.290268456375839,5.36912751677852,MUSR,0.419854166666667,10.7151041666667,MMLU-PRO,0.291057180851064,21.2285756501182,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-13,2024-12-13,1,Sakalti/llama-3-yanyuedao-8b-instruct (Merge),llama3,0,8,0.747158859660416 Sakalti/magro-7B_float16_db8d1d3aa647ac59884448d23eef35187839f123_False,Sakalti/magro-7B,db8d1d3aa647ac59884448d23eef35187839f123,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,12.3825524996845,FALSE,IFEval,0.134390084974534,13.4390084974534,BBH,0.418552648596624,19.5488837610594,MATH Level 5,0.020392749244713,2.0392749244713,GPQA,0.295302013422819,6.04026845637584,MUSR,0.445989583333333,13.6153645833333,MMLU-PRO,0.276512632978723,19.6125147754137,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-11,2024-12-12,2,mistralai/Mistral-7B-v0.1,mit,1,7,0.452276006033254 -Sakalti/ultiima-32B_float16_843652316df8b2b02d829325fbe4607ccf262ef4_False,Sakalti/ultiima-32B,843652316df8b2b02d829325fbe4607ccf262ef4,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,44.3206398268785,FALSE,IFEval,0.685435754908088,68.5435754908088,BBH,0.703728578279788,58.112446786766,MATH Level 5,0.431268882175227,43.1268882175227,GPQA,0.380872483221477,17.4496644295302,MUSR,0.499479166666667,24.1348958333333,MMLU-PRO,0.591007313829787,54.5563682033097,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,Sakalti/ultiima-32B (Merge),"",1,16.382,5.25580190082621 +Sakalti/ultiima-32B_float16_843652316df8b2b02d829325fbe4607ccf262ef4_False,Sakalti/ultiima-32B,843652316df8b2b02d829325fbe4607ccf262ef4,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,44.3206398268785,FALSE,IFEval,0.685435754908088,68.5435754908088,BBH,0.703728578279788,58.112446786766,MATH Level 5,0.431268882175227,43.1268882175227,GPQA,0.380872483221477,17.4496644295302,MUSR,0.499479166666667,24.1348958333333,MMLU-PRO,0.591007313829787,54.5563682033097,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,Sakalti/ultiima-32B (Merge),"",2,16.382,5.25580190082621 Salesforce/LLaMA-3-8B-SFR-Iterative-DPO-R_bfloat16_ad7d1aed82eb6d8ca4b3aad627ff76f72ab34f70_True,Salesforce/LLaMA-3-8B-SFR-Iterative-DPO-R,ad7d1aed82eb6d8ca4b3aad627ff76f72ab34f70,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.0297653902418,TRUE,IFEval,0.381562033183065,38.1562033183065,BBH,0.501195046966693,29.1502893497656,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.287751677852349,5.03355704697987,MUSR,0.363333333333333,5.55,MMLU-PRO,0.317237367021277,24.1374852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-09,2024-07-02,0,Salesforce/LLaMA-3-8B-SFR-Iterative-DPO-R,llama3,76,8.03,0.857392430518302 SanjiWatsuki/Kunoichi-DPO-v2-7B_float16_5278247beb482c4fceff2294570236d68b74d132_True,SanjiWatsuki/Kunoichi-DPO-v2-7B,5278247beb482c4fceff2294570236d68b74d132,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,20.5564548887298,TRUE,IFEval,0.543103410063077,54.3103410063077,BBH,0.441559245086928,20.9034724841238,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.296140939597315,6.15212527964205,MUSR,0.418833333333333,11.0875,MMLU-PRO,0.310671542553192,23.4079491725768,TRUE,FALSE,FALSE,FALSE,FALSE,2024-01-13,2024-06-28,0,SanjiWatsuki/Kunoichi-DPO-v2-7B,cc-by-nc-4.0,82,7.242,1.20820684318841 SanjiWatsuki/Silicon-Maid-7B_bfloat16_4e43d81f3fff1091df7cb2d85e9e306d25235701_True,SanjiWatsuki/Silicon-Maid-7B,4e43d81f3fff1091df7cb2d85e9e306d25235701,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,19.4498598838105,TRUE,IFEval,0.536783512192095,53.6783512192095,BBH,0.412797283100907,16.6927467535864,MATH Level 5,0.0672205438066465,6.72205438066465,GPQA,0.290268456375839,5.36912751677852,MUSR,0.418833333333333,11.0875,MMLU-PRO,0.308344414893617,23.1493794326241,TRUE,TRUE,FALSE,FALSE,FALSE,2023-12-27,2024-09-08,0,SanjiWatsuki/Silicon-Maid-7B,cc-by-4.0,104,7.242,0.606163302282549 @@ -841,10 +851,12 @@ Sao10K/Fimbulvetr-11B-v2_float16_b2dcd534dc3a53ff84e60a53b87816185169be19_True,S Sao10K/L3-70B-Euryale-v2.1_bfloat16_36ad832b771cd783ea7ad00ed39e61f679b1a7c6_True,Sao10K/L3-70B-Euryale-v2.1,36ad832b771cd783ea7ad00ed39e61f679b1a7c6,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.3480147060313,TRUE,IFEval,0.738441778924365,73.8441778924365,BBH,0.647132281126872,48.7011867294481,MATH Level 5,0.208459214501511,20.8459214501511,GPQA,0.331375838926175,10.8501118568233,MUSR,0.420916666666667,12.2479166666667,MMLU-PRO,0.510388962765958,45.598773640662,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-11,2024-07-01,0,Sao10K/L3-70B-Euryale-v2.1,cc-by-nc-4.0,124,70.554,8.61834854619988 Sao10K/L3-70B-Euryale-v2.1_float16_36ad832b771cd783ea7ad00ed39e61f679b1a7c6_True,Sao10K/L3-70B-Euryale-v2.1,36ad832b771cd783ea7ad00ed39e61f679b1a7c6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.4732526687288,TRUE,IFEval,0.728100329348351,72.8100329348351,BBH,0.650277899274504,49.1930030798986,MATH Level 5,0.224320241691843,22.4320241691843,GPQA,0.331375838926175,10.8501118568233,MUSR,0.419583333333333,12.0479166666667,MMLU-PRO,0.509557845744681,45.5064273049645,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-11,2024-06-26,0,Sao10K/L3-70B-Euryale-v2.1,cc-by-nc-4.0,124,70.554,8.61645431985954 Sao10K/L3-8B-Lunaris-v1_bfloat16_8479c2a7ee119c935b9a02c921cc2a85b698dfe8_True,Sao10K/L3-8B-Lunaris-v1,8479c2a7ee119c935b9a02c921cc2a85b698dfe8,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,25.6283363857046,TRUE,IFEval,0.68945730661312,68.945730661312,BBH,0.523529928251542,32.1143484550954,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.301174496644295,6.82326621923937,MUSR,0.372666666666667,5.55,MMLU-PRO,0.378740026595745,30.9711140661939,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-26,2024-07-22,0,Sao10K/L3-8B-Lunaris-v1,llama3,96,8.03,0.660498638520832 -Sao10K/L3-8B-Stheno-v3.2_bfloat16_4bb828f6e1b1efd648c39b1ad682c44ff260f018_True,Sao10K/L3-8B-Stheno-v3.2,4bb828f6e1b1efd648c39b1ad682c44ff260f018,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.9095698218306,TRUE,IFEval,0.687284183743578,68.7284183743578,BBH,0.522778637171633,32.021597924075,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.310402684563758,8.05369127516779,MUSR,0.379364583333333,6.45390625,MMLU-PRO,0.376828457446809,30.7587174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-05,2024-06-30,0,Sao10K/L3-8B-Stheno-v3.2,cc-by-nc-4.0,255,8.03,0.891672233627461 +Sao10K/L3-8B-Stheno-v3.2_bfloat16_4bb828f6e1b1efd648c39b1ad682c44ff260f018_True,Sao10K/L3-8B-Stheno-v3.2,4bb828f6e1b1efd648c39b1ad682c44ff260f018,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.9095698218306,TRUE,IFEval,0.687284183743578,68.7284183743578,BBH,0.522778637171633,32.021597924075,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.310402684563758,8.05369127516779,MUSR,0.379364583333333,6.45390625,MMLU-PRO,0.376828457446809,30.7587174940898,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-05,2024-06-30,0,Sao10K/L3-8B-Stheno-v3.2,cc-by-nc-4.0,256,8.03,0.891672233627461 Sao10K/L3-8B-Stheno-v3.3-32K_bfloat16_1a59d163e079c7e7f1542553d085853119960f0c_True,Sao10K/L3-8B-Stheno-v3.3-32K,1a59d163e079c7e7f1542553d085853119960f0c,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,12.5870405203853,TRUE,IFEval,0.460371813454966,46.0371813454966,BBH,0.384401292300821,13.5120089831975,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.256711409395973,0.894854586129753,MUSR,0.372541666666667,4.06770833333333,MMLU-PRO,0.189577792553192,9.95308806146572,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-22,2024-06-26,0,Sao10K/L3-8B-Stheno-v3.3-32K,cc-by-nc-4.0,52,8.03,1.46863224607195 Sao10K/MN-12B-Lyra-v3_bfloat16_da76fa39d128ca84065427189bb228f2dfc6b8a3_True,Sao10K/MN-12B-Lyra-v3,da76fa39d128ca84065427189bb228f2dfc6b8a3,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,19.3964568922766,TRUE,IFEval,0.448606364446336,44.8606364446336,BBH,0.480395436039724,25.8709633830725,MATH Level 5,0.0793051359516616,7.93051359516616,GPQA,0.277684563758389,3.69127516778523,MUSR,0.40190625,9.03828125,MMLU-PRO,0.324883643617021,24.9870715130024,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-27,2024-09-03,0,Sao10K/MN-12B-Lyra-v3,cc-by-nc-4.0,34,12.248,2.08466477138094 +Saxo/Linkbricks-Horizon-AI-Korean-Superb-22B_bfloat16_4fb08002ca40d2fdfbf1334049e8e1264daf50c1_True,Saxo/Linkbricks-Horizon-AI-Korean-Superb-22B,4fb08002ca40d2fdfbf1334049e8e1264daf50c1,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,28.8155478487289,TRUE,IFEval,0.676667907817923,67.6667907817923,BBH,0.56255395689276,36.578023822519,MATH Level 5,0.20619335347432,20.619335347432,GPQA,0.326342281879195,10.1789709172259,MUSR,0.390770833333333,5.94635416666667,MMLU-PRO,0.387134308510638,31.9038120567376,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-08,2024-12-25,1,mistralai/Mistral-Small-Instruct-2409,apache-2.0,0,11.124,1.01349684362914 Saxo/Linkbricks-Horizon-AI-Korean-Superb-27B_bfloat16_0b4cf265801f8ee050a54eea7ee51d3142e98c74_False,Saxo/Linkbricks-Horizon-AI-Korean-Superb-27B,0b4cf265801f8ee050a54eea7ee51d3142e98c74,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,38.3242071739626,FALSE,IFEval,0.776760107625545,77.6760107625545,BBH,0.651834568511945,50.60725661581,MATH Level 5,0.26963746223565,26.963746223565,GPQA,0.35989932885906,14.6532438478747,MUSR,0.479135416666667,19.5252604166667,MMLU-PRO,0.464677526595745,40.519725177305,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-16,2024-11-17,2,google/gemma-2-27b,apache-2.0,1,27.227,3.88846900552202 +Saxo/Linkbricks-Horizon-AI-Superb-27B_bfloat16_b1bffefa2c1c36436275abae3b9bc018f9ea1908_True,Saxo/Linkbricks-Horizon-AI-Superb-27B,b1bffefa2c1c36436275abae3b9bc018f9ea1908,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,33.5504554567316,TRUE,IFEval,0.730223584533482,73.0223584533482,BBH,0.618624552892505,45.6943239100436,MATH Level 5,0.157099697885196,15.7099697885196,GPQA,0.357382550335571,14.3176733780761,MUSR,0.465,18.5583333333333,MMLU-PRO,0.406000664893617,34.0000738770686,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-04,2024-12-25,2,google/gemma-2-27b,apache-2.0,0,13.614,4.62461246194147 SeaLLMs/SeaLLM-7B-v2_bfloat16_35c5464399144a14915733dc690c4a74e1f71b16_False,SeaLLMs/SeaLLM-7B-v2,35c5464399144a14915733dc690c4a74e1f71b16,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,18.1160373143562,FALSE,IFEval,0.367123676290022,36.7123676290022,BBH,0.490210079545832,27.4381594015709,MATH Level 5,0.0823262839879154,8.23262839879154,GPQA,0.278523489932886,3.80313199105145,MUSR,0.406958333333333,9.36979166666667,MMLU-PRO,0.308261303191489,23.1401447990544,TRUE,FALSE,FALSE,FALSE,FALSE,2024-01-29,2024-09-17,0,SeaLLMs/SeaLLM-7B-v2,other,65,7.376,0.63489301124129 SeaLLMs/SeaLLM-7B-v2.5_bfloat16_a961daf713dcb31e3253ebe40d43ea5fb7a84099_True,SeaLLMs/SeaLLM-7B-v2.5,a961daf713dcb31e3253ebe40d43ea5fb7a84099,bfloat16,fine-tunedondomain-specificdatasets,Original,GemmaForCausalLM,18.9304673292228,TRUE,IFEval,0.452153619064083,45.2153619064083,BBH,0.498020295943528,28.7381539301028,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.276006711409396,3.4675615212528,MUSR,0.420322916666667,11.60703125,MMLU-PRO,0.3203125,24.4791666666667,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-03,2024-07-29,0,SeaLLMs/SeaLLM-7B-v2.5,other,49,8.538,1.10097672185204 SeaLLMs/SeaLLMs-v3-7B-Chat_bfloat16_67ef6dfd0a5df7af4be7a325786105a2ba4cbaf7_True,SeaLLMs/SeaLLMs-v3-7B-Chat,67ef6dfd0a5df7af4be7a325786105a2ba4cbaf7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,23.884404819428,TRUE,IFEval,0.437665394486629,43.7665394486629,BBH,0.526640628459536,33.8016227223784,MATH Level 5,0.166163141993958,16.6163141993958,GPQA,0.298657718120805,6.48769574944072,MUSR,0.417375,10.471875,MMLU-PRO,0.389461436170213,32.1623817966903,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-03,2024-07-29,0,SeaLLMs/SeaLLMs-v3-7B-Chat,other,46,7.616,0.842853124695207 @@ -882,11 +894,13 @@ Syed-Hasan-8503/Phi-3-mini-4K-instruct-cpo-simpo_bfloat16_2896ef357be81fd433c178 T145/KRONOS-8B-V2_bfloat16_8a004e1e51aa24574ba961613fe9698df30bd9a0_True,T145/KRONOS-8B-V2,8a004e1e51aa24574ba961613fe9698df30bd9a0,bfloat16,chatmodels,Original,LlamaForCausalLM,25.0497936461037,TRUE,IFEval,0.518024397487555,51.8024397487555,BBH,0.513268555595521,30.6749071378466,MATH Level 5,0.226586102719033,22.6586102719033,GPQA,0.298657718120805,6.48769574944072,MUSR,0.382864583333333,8.25807291666667,MMLU-PRO,0.373753324468085,30.4170360520095,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-08,2024-12-13,1,T145/KRONOS-8B-V2 (Merge),llama3.1,1,8,0.684995365601827 T145/KRONOS-8B-V3_bfloat16_75b0ff936de5caa98a6b9680bafeeb92d4b9abaa_True,T145/KRONOS-8B-V3,75b0ff936de5caa98a6b9680bafeeb92d4b9abaa,bfloat16,chatmodels,Original,LlamaForCausalLM,25.3465711884425,TRUE,IFEval,0.547475143729748,54.7475143729748,BBH,0.511865544689898,30.2910989848355,MATH Level 5,0.236404833836858,23.6404833836858,GPQA,0.288590604026846,5.14541387024609,MUSR,0.392229166666667,7.82864583333334,MMLU-PRO,0.373836436170213,30.4262706855792,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-18,2024-12-18,1,T145/KRONOS-8B-V3 (Merge),"",1,4.015,0.700782263383934 T145/KRONOS-8B-V4_bfloat16_f9faad008b866745fd60755e558f7a06d3a59da4_True,T145/KRONOS-8B-V4,f9faad008b866745fd60755e558f7a06d3a59da4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.5992309430025,TRUE,IFEval,0.788949986037048,78.8949986037048,BBH,0.509247003484674,30.1406194721162,MATH Level 5,0.185800604229607,18.5800604229607,GPQA,0.289429530201342,5.2572706935123,MUSR,0.382958333333333,7.76979166666667,MMLU-PRO,0.378573803191489,30.9526447990544,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,T145/KRONOS-8B-V4 (Merge),"",1,4.015,0.695259465116396 -T145/KRONOS-8B-V5_bfloat16_67a69b38a382a7cebe2d8d7b52aeafab6ff89a29_True,T145/KRONOS-8B-V5,67a69b38a382a7cebe2d8d7b52aeafab6ff89a29,bfloat16,chatmodels,Original,LlamaForCausalLM,25.4340192861369,TRUE,IFEval,0.540505857790662,54.0505857790662,BBH,0.508865159896917,30.1736822166472,MATH Level 5,0.219033232628399,21.9033232628399,GPQA,0.290268456375839,5.36912751677852,MUSR,0.40546875,10.4502604166667,MMLU-PRO,0.375914228723404,30.6571365248227,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-20,1,T145/KRONOS-8B-V5 (Merge),"",2,4.015,0.690409073100682 +T145/KRONOS-8B-V5_bfloat16_67a69b38a382a7cebe2d8d7b52aeafab6ff89a29_True,T145/KRONOS-8B-V5,67a69b38a382a7cebe2d8d7b52aeafab6ff89a29,bfloat16,chatmodels,Original,LlamaForCausalLM,25.4340192861369,TRUE,IFEval,0.540505857790662,54.0505857790662,BBH,0.508865159896917,30.1736822166472,MATH Level 5,0.219033232628399,21.9033232628399,GPQA,0.290268456375839,5.36912751677852,MUSR,0.40546875,10.4502604166667,MMLU-PRO,0.375914228723404,30.6571365248227,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-20,1,T145/KRONOS-8B-V5 (Merge),"",1,4.015,0.690409073100682 T145/KRONOS-8B-V6_bfloat16_7afd2483e81c58ad3865a9cac6f2e66afe1d1f78_True,T145/KRONOS-8B-V6,7afd2483e81c58ad3865a9cac6f2e66afe1d1f78,bfloat16,chatmodels,Original,LlamaForCausalLM,24.4866603152291,TRUE,IFEval,0.702246705408317,70.2246705408317,BBH,0.503360614949941,29.6592864185256,MATH Level 5,0.0551359516616314,5.51359516616314,GPQA,0.279362416107383,3.91498881431767,MUSR,0.412104166666667,9.81302083333333,MMLU-PRO,0.35014960106383,27.7944001182033,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-20,1,T145/KRONOS-8B-V6 (Merge),"",1,4.015,0.719828308044664 +T145/KRONOS-8B-V7_bfloat16_422458ab11c4a8bb502fd8681551f9b54d7e6162_True,T145/KRONOS-8B-V7,422458ab11c4a8bb502fd8681551f9b54d7e6162,bfloat16,chatmodels,Original,LlamaForCausalLM,14.5277265195895,TRUE,IFEval,0.352910278062208,35.2910278062208,BBH,0.452621944393916,23.8901731388557,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.266778523489933,2.23713646532438,MUSR,0.367114583333333,4.02265625,MMLU-PRO,0.269697473404255,18.855274822695,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-25,0,Removed,"",0,4.015,0.727073711442984 T145/Llama-3.1-8B-Instruct-Zeus_bfloat16_672f9f1d4256f999b4513061c5406f60bfda2949_True,T145/Llama-3.1-8B-Instruct-Zeus,672f9f1d4256f999b4513061c5406f60bfda2949,bfloat16,chatmodels,Original,LlamaForCausalLM,29.587053709442,TRUE,IFEval,0.794120710825055,79.4120710825055,BBH,0.51739824399963,31.3889907284783,MATH Level 5,0.191842900302115,19.1842900302115,GPQA,0.301174496644295,6.82326621923937,MUSR,0.397625,8.56979166666666,MMLU-PRO,0.389295212765957,32.1439125295508,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-28,2024-11-28,1,T145/Llama-3.1-8B-Instruct-Zeus (Merge),apache-2.0,0,8.03,0.694684704446944 T145/Llama-3.1-8B-Zeus_bfloat16_712ff76aa966b0a9c5c65a074b2eb2b2cb56de86_True,T145/Llama-3.1-8B-Zeus,712ff76aa966b0a9c5c65a074b2eb2b2cb56de86,bfloat16,chatmodels,Original,LlamaForCausalLM,9.01349989790302,TRUE,IFEval,0.351761104979233,35.1761104979233,BBH,0.367117534844685,10.5608077568321,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.26510067114094,2.01342281879195,MUSR,0.331583333333333,1.58125,MMLU-PRO,0.133228058510638,3.69200650118203,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-28,0,Removed,"",0,8.03,0.731717749121906 T145/Meta-Llama-3.1-8B-Instruct-TIES_bfloat16_62a8c4f6e02a2e18f79688877fa925dcac8096aa_True,T145/Meta-Llama-3.1-8B-Instruct-TIES,62a8c4f6e02a2e18f79688877fa925dcac8096aa,bfloat16,chatmodels,Original,LlamaForCausalLM,24.812945035541,TRUE,IFEval,0.542354286626152,54.2354286626152,BBH,0.507011138556476,29.7742634799406,MATH Level 5,0.200151057401813,20.0151057401813,GPQA,0.294463087248322,5.92841163310962,MUSR,0.384291666666667,8.03645833333334,MMLU-PRO,0.377992021276596,30.8880023640662,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-22,1,T145/Meta-Llama-3.1-8B-Instruct-TIES (Merge),"",1,4.015,0.684712012934721 +T145/ZEUS-8B-V10_bfloat16_94b750b9de63df6391bb42d304a3dabea259b178_True,T145/ZEUS-8B-V10,94b750b9de63df6391bb42d304a3dabea259b178,bfloat16,chatmodels,Original,LlamaForCausalLM,30.1934569847742,TRUE,IFEval,0.770665168419793,77.0665168419793,BBH,0.526975827044266,32.6950476722608,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.324664429530201,9.95525727069351,MUSR,0.38978125,9.08932291666667,MMLU-PRO,0.390375664893617,32.2639627659575,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-24,2024-12-24,1,T145/ZEUS-8B-V10 (Merge),"",2,4.015,0.683466588983542 T145/ZEUS-8B-V2_bfloat16_8f874a61fe651717afaf484e3a556a0c11b7f292_True,T145/ZEUS-8B-V2,8f874a61fe651717afaf484e3a556a0c11b7f292,bfloat16,chatmodels,Original,LlamaForCausalLM,30.067952754747,TRUE,IFEval,0.802938425599631,80.2938425599631,BBH,0.519440545574716,31.6055927750739,MATH Level 5,0.211480362537764,21.1480362537764,GPQA,0.302013422818792,6.93512304250559,MUSR,0.391020833333333,8.24427083333333,MMLU-PRO,0.389627659574468,32.1808510638298,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-01,1,T145/ZEUS-8B-V2 (Merge),"",2,8.03,0.695717516485473 T145/ZEUS-8B-V2L1_bfloat16_c2d7f009c769f7ebdef00412ad85f2d3bdea9869_False,T145/ZEUS-8B-V2L1,c2d7f009c769f7ebdef00412ad85f2d3bdea9869,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,20.0348610358661,FALSE,IFEval,0.31918864169293,31.918864169293,BBH,0.501348537526027,28.6942082065513,MATH Level 5,0.128398791540786,12.8398791540786,GPQA,0.312919463087248,8.38926174496644,MUSR,0.388197916666667,9.05807291666666,MMLU-PRO,0.363779920212766,29.3088800236407,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-02,0,Removed,"",0,8.03,0.744636958690887 T145/ZEUS-8B-V2L2_bfloat16_d3ae250942e4b749c2d545a48f08a93a659a9b6e_True,T145/ZEUS-8B-V2L2,d3ae250942e4b749c2d545a48f08a93a659a9b6e,bfloat16,chatmodels,Original,LlamaForCausalLM,29.8855739004236,TRUE,IFEval,0.802064078866297,80.2064078866297,BBH,0.520284366540213,32.0175092945529,MATH Level 5,0.198640483383686,19.8640483383686,GPQA,0.299496644295302,6.59955257270694,MUSR,0.39746875,8.58359375,MMLU-PRO,0.388380984042553,32.0423315602837,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-03,0,Removed,"",0,8.03,0.704039554036526 @@ -897,9 +911,9 @@ T145/ZEUS-8B-V7_bfloat16_dbaa3828be77d925f40ecf3762b90ec4ad70e6d9_True,T145/ZEUS T145/ZEUS-8B-V8_bfloat16_c7da6c67926ddaff25602bfd1b9941d9822c1387_True,T145/ZEUS-8B-V8,c7da6c67926ddaff25602bfd1b9941d9822c1387,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2109530522113,TRUE,IFEval,0.791397935256231,79.1397935256231,BBH,0.50645104198647,29.3940309567592,MATH Level 5,0.132175226586103,13.2175226586103,GPQA,0.287751677852349,5.03355704697987,MUSR,0.421375,11.8052083333333,MMLU-PRO,0.37608045212766,30.6756057919622,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-12,2024-12-12,1,T145/ZEUS-8B-V8 (Merge),llama3.1,1,8,0.660013974860776 T145/ZEUS-8B-V9_bfloat16_10b386571ad34d115433419d30b61746ef4d9735_True,T145/ZEUS-8B-V9,10b386571ad34d115433419d30b61746ef4d9735,bfloat16,chatmodels,Original,LlamaForCausalLM,25.8271249353926,TRUE,IFEval,0.555143685421349,55.5143685421349,BBH,0.520725634647775,31.8505495278181,MATH Level 5,0.211480362537764,21.1480362537764,GPQA,0.291107382550336,5.48098434004475,MUSR,0.394927083333333,8.73255208333333,MMLU-PRO,0.390126329787234,32.2362588652482,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,T145/ZEUS-8B-V9 (Merge),"",1,4.015,0.673209944939504 T145/qwen-2.5-3B-merge-test_bfloat16_0d5f82d841f811fbf1ee07bfbf7c6eb1de812840_True,T145/qwen-2.5-3B-merge-test,0d5f82d841f811fbf1ee07bfbf7c6eb1de812840,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.1541505180996,TRUE,IFEval,0.575101840893274,57.5101840893274,BBH,0.484248874772039,27.8893413136761,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.285234899328859,4.6979865771812,MUSR,0.400729166666667,8.29114583333333,MMLU-PRO,0.328956117021277,25.4395685579196,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-16,0,Removed,"",0,3.397,0.783956586523256 -THUDM/glm-4-9b_bfloat16_99a140996f9d4f197842fb6b1aab217a42e27ef3_False,THUDM/glm-4-9b,99a140996f9d4f197842fb6b1aab217a42e27ef3,bfloat16,pretrained,Original,ChatGLMModelM,18.0067317317162,FALSE,IFEval,0.142608279365417,14.2608279365417,BBH,0.552836814166527,35.8112835812089,MATH Level 5,0,0,GPQA,0.316275167785235,8.83668903803132,MUSR,0.438583333333333,14.1895833333333,MMLU-PRO,0.414478058510638,34.942006501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-04,0,THUDM/glm-4-9b,other,114,9,1.67244683755118 -THUDM/glm-4-9b-chat_bfloat16_04419001bc63e05e70991ade6da1f91c4aeec278_True,THUDM/glm-4-9b-chat,04419001bc63e05e70991ade6da1f91c4aeec278,bfloat16,chatmodels,Original,ChatGLMModelM,10.9734772970452,TRUE,IFEval,0,0,BBH,0.473638842910357,25.2051836744402,MATH Level 5,0,0,GPQA,0.313758389261745,8.50111856823266,MUSR,0.399427083333333,8.06171875,MMLU-PRO,0.316655585106383,24.0728427895981,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-09,0,THUDM/glm-4-9b-chat,other,648,9,0.247134508492731 -THUDM/glm-4-9b-chat-1m_bfloat16_0aa722c7e0745dd21453427dd44c257dd253304f_True,THUDM/glm-4-9b-chat-1m,0aa722c7e0745dd21453427dd44c257dd253304f,bfloat16,chatmodels,Original,ChatGLMModel,8.92251018653198,TRUE,IFEval,0,0,BBH,0.418005782183303,17.1080285081681,MATH Level 5,0,0,GPQA,0.303691275167785,7.15883668903803,MUSR,0.379458333333333,5.23229166666667,MMLU-PRO,0.316323138297872,24.0359042553192,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-10-09,0,THUDM/glm-4-9b-chat-1m,other,181,9.484,0.205669954986166 +THUDM/glm-4-9b_bfloat16_99a140996f9d4f197842fb6b1aab217a42e27ef3_False,THUDM/glm-4-9b,99a140996f9d4f197842fb6b1aab217a42e27ef3,bfloat16,pretrained,Original,ChatGLMModelM,18.0067317317162,FALSE,IFEval,0.142608279365417,14.2608279365417,BBH,0.552836814166527,35.8112835812089,MATH Level 5,0,0,GPQA,0.316275167785235,8.83668903803132,MUSR,0.438583333333333,14.1895833333333,MMLU-PRO,0.414478058510638,34.942006501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-04,0,THUDM/glm-4-9b,other,115,9,1.67244683755118 +THUDM/glm-4-9b-chat_bfloat16_04419001bc63e05e70991ade6da1f91c4aeec278_True,THUDM/glm-4-9b-chat,04419001bc63e05e70991ade6da1f91c4aeec278,bfloat16,chatmodels,Original,ChatGLMModelM,10.9734772970452,TRUE,IFEval,0,0,BBH,0.473638842910357,25.2051836744402,MATH Level 5,0,0,GPQA,0.313758389261745,8.50111856823266,MUSR,0.399427083333333,8.06171875,MMLU-PRO,0.316655585106383,24.0728427895981,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-07-09,0,THUDM/glm-4-9b-chat,other,649,9,0.247134508492731 +THUDM/glm-4-9b-chat-1m_bfloat16_0aa722c7e0745dd21453427dd44c257dd253304f_True,THUDM/glm-4-9b-chat-1m,0aa722c7e0745dd21453427dd44c257dd253304f,bfloat16,chatmodels,Original,ChatGLMModel,8.92251018653198,TRUE,IFEval,0,0,BBH,0.418005782183303,17.1080285081681,MATH Level 5,0,0,GPQA,0.303691275167785,7.15883668903803,MUSR,0.379458333333333,5.23229166666667,MMLU-PRO,0.316323138297872,24.0359042553192,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-04,2024-10-09,0,THUDM/glm-4-9b-chat-1m,other,182,9.484,0.205669954986166 TIGER-Lab/MAmmoTH2-7B-Plus_bfloat16_3ed578d8dda09787137e363a0dc32e3a8ed908de_True,TIGER-Lab/MAmmoTH2-7B-Plus,3ed578d8dda09787137e363a0dc32e3a8ed908de,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,21.4698622596292,TRUE,IFEval,0.557466411344123,55.7466411344123,BBH,0.423469498880191,18.9259532275557,MATH Level 5,0.175981873111782,17.5981873111782,GPQA,0.280201342281879,4.0268456375839,MUSR,0.412354166666667,10.1109375,MMLU-PRO,0.301695478723404,22.4106087470449,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-06,2024-06-27,0,TIGER-Lab/MAmmoTH2-7B-Plus,mit,7,7.242,0.552663350555736 TTTXXX01/Mistral-7B-Base-SimPO2-5e-7_bfloat16_7a271e3061165f4e1abfe26715c04e20c2ac935e_True,TTTXXX01/Mistral-7B-Base-SimPO2-5e-7,7a271e3061165f4e1abfe26715c04e20c2ac935e,bfloat16,chatmodels,Original,MistralForCausalLM,16.3796884014764,TRUE,IFEval,0.439189129288067,43.9189129288067,BBH,0.431955150148828,20.6926273825575,MATH Level 5,0.0241691842900302,2.41691842900302,GPQA,0.297818791946309,6.3758389261745,MUSR,0.360416666666667,5.25208333333333,MMLU-PRO,0.276595744680851,19.6217494089835,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-30,2024-09-01,2,mistralai/Mistral-7B-v0.1,apache-2.0,0,7.242,0.522996132267287 TeeZee/DoubleBagel-57B-v1.0_bfloat16_6e10dc1fb5223d1b045dc2a19c9c267a574e520f_True,TeeZee/DoubleBagel-57B-v1.0,6e10dc1fb5223d1b045dc2a19c9c267a574e520f,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,8.54410296272912,TRUE,IFEval,0.233633425976409,23.3633425976409,BBH,0.325078559362514,5.52278169826115,MATH Level 5,0,0,GPQA,0.276006711409396,3.4675615212528,MUSR,0.431489583333333,13.6028645833333,MMLU-PRO,0.147772606382979,5.30806737588653,TRUE,TRUE,FALSE,FALSE,FALSE,2024-08-05,2024-08-10,1,TeeZee/DoubleBagel-57B-v1.0 (Merge),apache-2.0,1,56.703,9.36864747817259 @@ -923,10 +937,10 @@ Tijmen2/cosmosage-v3_bfloat16_e6d4b4e6868fcf113ab5261d71c7214a1f7fbb0c_True,Tijm TinyLlama/TinyLlama-1.1B-Chat-v0.1_float16_7abc14e7779eabc3a028bc695342869d0410dea2_False,TinyLlama/TinyLlama-1.1B-Chat-v0.1,7abc14e7779eabc3a028bc695342869d0410dea2,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,3.85687240027727,FALSE,IFEval,0.147854359765422,14.7854359765422,BBH,0.308352947486801,3.36301067393934,MATH Level 5,0,0,GPQA,0.229026845637584,0,MUSR,0.359239583333333,3.90494791666667,MMLU-PRO,0.109790558510638,1.08783983451537,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-16,2024-12-02,0,TinyLlama/TinyLlama-1.1B-Chat-v0.1,apache-2.0,53,1.1,0.0910952097470587 TinyLlama/TinyLlama-1.1B-Chat-v0.5_bfloat16_5c9e70dd07f5234bf6bf6a2425fffeecd5a6020b_False,TinyLlama/TinyLlama-1.1B-Chat-v0.5,5c9e70dd07f5234bf6bf6a2425fffeecd5a6020b,bfloat16,chatmodels,Original,LlamaForCausalLM,4.07581143646604,FALSE,IFEval,0.163366534129443,16.3366534129443,BBH,0.31050469159357,3.40769093756971,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.248322147651007,0,MUSR,0.366125,3.565625,MMLU-PRO,0.109624335106383,1.06937056737589,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-20,2024-10-23,0,TinyLlama/TinyLlama-1.1B-Chat-v0.5,apache-2.0,8,1.1,0.0949638317549067 TinyLlama/TinyLlama-1.1B-Chat-v0.6_bfloat16_bf9ae1c8bf026667e6f810768de259bb4a7f4777_True,TinyLlama/TinyLlama-1.1B-Chat-v0.6,bf9ae1c8bf026667e6f810768de259bb4a7f4777,bfloat16,chatmodels,Original,LlamaForCausalLM,4.09286641277805,TRUE,IFEval,0.157421197976923,15.7421197976923,BBH,0.306697665616683,3.39037070951253,MATH Level 5,0.00377643504531722,0.377643504531722,GPQA,0.258389261744966,1.11856823266219,MUSR,0.34221875,2.27734375,MMLU-PRO,0.114860372340426,1.6511524822695,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-20,2024-10-23,0,TinyLlama/TinyLlama-1.1B-Chat-v0.6,apache-2.0,91,1.1,0.430347260938312 -TinyLlama/TinyLlama-1.1B-Chat-v1.0_float16_fe8a4ea1ffedaf415f4da2f062534de366a451e6_False,TinyLlama/TinyLlama-1.1B-Chat-v1.0,fe8a4ea1ffedaf415f4da2f062534de366a451e6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.71815455158305,FALSE,IFEval,0.0595763684800773,5.95763684800773,BBH,0.310356286749101,4.0133968484868,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.25,0,MUSR,0.351520833333333,4.30677083333334,MMLU-PRO,0.110123005319149,1.12477836879433,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-30,2024-08-04,0,TinyLlama/TinyLlama-1.1B-Chat-v1.0,apache-2.0,1107,1.1,0.268441454812413 +TinyLlama/TinyLlama-1.1B-Chat-v1.0_float16_fe8a4ea1ffedaf415f4da2f062534de366a451e6_False,TinyLlama/TinyLlama-1.1B-Chat-v1.0,fe8a4ea1ffedaf415f4da2f062534de366a451e6,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,2.71815455158305,FALSE,IFEval,0.0595763684800773,5.95763684800773,BBH,0.310356286749101,4.0133968484868,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.25,0,MUSR,0.351520833333333,4.30677083333334,MMLU-PRO,0.110123005319149,1.12477836879433,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-30,2024-08-04,0,TinyLlama/TinyLlama-1.1B-Chat-v1.0,apache-2.0,1109,1.1,0.268441454812413 TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T_bfloat16_59f6f375b26bde864a6ca194a9a3044570490064_False,TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T,59f6f375b26bde864a6ca194a9a3044570490064,bfloat16,pretrained,Original,LlamaForCausalLM,5.16737751670247,FALSE,IFEval,0.227663710067066,22.7663710067067,BBH,0.307118843826727,3.54709338950808,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.25251677852349,0.335570469798655,MUSR,0.33803125,2.18723958333333,MMLU-PRO,0.112034574468085,1.33717494089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-28,2024-11-27,0,TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T,apache-2.0,164,1.1,0.165797879432131 TinyLlama/TinyLlama_v1.1_bfloat16_ff3c701f2424c7625fdefb9dd470f45ef18b02d6_False,TinyLlama/TinyLlama_v1.1,ff3c701f2424c7625fdefb9dd470f45ef18b02d6,bfloat16,pretrained,Original,LlamaForCausalLM,4.72384891003899,FALSE,IFEval,0.200061392660363,20.0061392660363,BBH,0.302370180450761,3.21030104971281,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.245805369127517,0,MUSR,0.36996875,3.97942708333333,MMLU-PRO,0.104886968085106,0.542996453900708,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-09,2024-06-12,0,TinyLlama/TinyLlama_v1.1,apache-2.0,80,1.1,0.248928618602363 -Trappu/Magnum-Picaro-0.7-v2-12b_bfloat16_2ffc46cde49eb823f5588990bd6b848cd505271e_False,Trappu/Magnum-Picaro-0.7-v2-12b,2ffc46cde49eb823f5588990bd6b848cd505271e,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.4783017974636,FALSE,IFEval,0.300278815764394,30.0278815764394,BBH,0.550666191882885,35.7462331985544,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.322986577181208,9.73154362416107,MUSR,0.47271875,19.5565104166667,MMLU-PRO,0.358045212765957,28.6716903073286,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-11,2024-09-12,1,Trappu/Magnum-Picaro-0.7-v2-12b (Merge),"",7,12.248,1.67495885513732 +Trappu/Magnum-Picaro-0.7-v2-12b_bfloat16_2ffc46cde49eb823f5588990bd6b848cd505271e_False,Trappu/Magnum-Picaro-0.7-v2-12b,2ffc46cde49eb823f5588990bd6b848cd505271e,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.4783017974636,FALSE,IFEval,0.300278815764394,30.0278815764394,BBH,0.550666191882885,35.7462331985544,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.322986577181208,9.73154362416107,MUSR,0.47271875,19.5565104166667,MMLU-PRO,0.358045212765957,28.6716903073286,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-12,0,Removed,"",0,12.248,1.67495885513732 Trappu/Nemo-Picaro-12B_float16_d65bf383d744998ae93a5589ec886532bb7e18eb_False,Trappu/Nemo-Picaro-12B,d65bf383d744998ae93a5589ec886532bb7e18eb,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,21.3247281984241,FALSE,IFEval,0.257713976692953,25.7713976692953,BBH,0.548958612599755,35.9731352844479,MATH Level 5,0.0823262839879154,8.23262839879154,GPQA,0.327181208053691,10.2908277404922,MUSR,0.47259375,18.7408854166667,MMLU-PRO,0.36045545212766,28.9394946808511,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-10,2024-09-22,2,royallab/MN-LooseCannon-12B-v2 (Merge),apache-2.0,1,12.248,1.8410278639878 Tremontaine/L3-12B-Lunaris-v1_bfloat16_7be236530a835416ebca712d51d661c4488a45de_True,Tremontaine/L3-12B-Lunaris-v1,7be236530a835416ebca712d51d661c4488a45de,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.5024308317828,TRUE,IFEval,0.690931173730147,69.0931173730147,BBH,0.523021723724401,32.1807456461844,MATH Level 5,0.0891238670694864,8.91238670694864,GPQA,0.309563758389262,7.94183445190157,MUSR,0.367364583333333,4.05390625,MMLU-PRO,0.37749335106383,30.8325945626478,FALSE,FALSE,FALSE,FALSE,FALSE,2024-07-14,2024-07-15,1,Tremontaine/L3-12B-Lunaris-v1 (Merge),"",2,11.52,1.14096394871727 Tsunami-th/Tsunami-0.5-7B-Instruct_bfloat16_10706336513d54c4e8962f54653f25941c4031f4_True,Tsunami-th/Tsunami-0.5-7B-Instruct,10706336513d54c4e8962f54653f25941c4031f4,bfloat16,chatmodels,Original,Qwen2ForCausalLM,28.0434107087801,TRUE,IFEval,0.740015381410214,74.0015381410214,BBH,0.552369427738073,36.1382541870034,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.308724832214765,7.82997762863535,MUSR,0.42571875,12.21484375,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-11,2024-10-12,1,Tsunami-th/Tsunami-0.5-7B-Instruct (Merge),apache-2.0,0,7.616,1.0900527971612 @@ -935,7 +949,7 @@ Tsunami-th/Tsunami-1.0-14B-Instruct_bfloat16_b468814b5242acbe6294226db71bc19dead Tsunami-th/Tsunami-1.0-7B-Instruct_bfloat16_34d0f8da8ce6b0de50a269eef622ff2e93e5c059_True,Tsunami-th/Tsunami-1.0-7B-Instruct,34d0f8da8ce6b0de50a269eef622ff2e93e5c059,bfloat16,chatmodels,Original,Qwen2ForCausalLM,28.7623077837889,TRUE,IFEval,0.730872972601586,73.0872972601586,BBH,0.549071195618326,35.8572427497732,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.312919463087248,8.38926174496644,MUSR,0.44928125,15.76015625,MMLU-PRO,0.442403590425532,38.0448433806147,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-28,2024-10-28,1,Tsunami-th/Tsunami-1.0-7B-Instruct (Merge),apache-2.0,1,7.616,1.98139950611626 UCLA-AGI/Gemma-2-9B-It-SPPO-Iter1_bfloat16_33cfd6919f22efc38f71e9d21a7e697afb418e6b_True,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter1,33cfd6919f22efc38f71e9d21a7e697afb418e6b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,21.0881686855902,TRUE,IFEval,0.308221075634871,30.8221075634871,BBH,0.596893476270551,41.8092296200635,MATH Level 5,0,0,GPQA,0.336409395973154,11.5212527964206,MUSR,0.4099375,10.0755208333333,MMLU-PRO,0.390708111702128,32.3009013002364,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-09-21,0,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter1,gemma,3,9.242,2.94265823851697 UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2_bfloat16_b7590721d92bf6e0606e3dbc1ca2c229b7c534b4_True,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2,b7590721d92bf6e0606e3dbc1ca2c229b7c534b4,bfloat16,chatmodels,Original,Gemma2ForCausalLM,21.2161444866379,TRUE,IFEval,0.31001963678595,31.001963678595,BBH,0.598988087742128,42.1698338017458,MATH Level 5,0,0,GPQA,0.334731543624161,11.2975391498881,MUSR,0.4139375,10.9421875,MMLU-PRO,0.386968085106383,31.8853427895981,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-08-07,0,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2,gemma,2,9.242,2.7164617984263 -UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3_bfloat16_2261f2a03b2e15de13a18da52590c237ecf5f188_True,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3,2261f2a03b2e15de13a18da52590c237ecf5f188,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,21.4671799758725,TRUE,IFEval,0.316714096375395,31.6714096375395,BBH,0.600708022926803,42.5367522410743,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.416604166666667,11.3421875,MMLU-PRO,0.382563164893617,31.3959072104019,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-07-31,0,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3,gemma,118,9.242,2.81515014948886 +UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3_bfloat16_2261f2a03b2e15de13a18da52590c237ecf5f188_True,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3,2261f2a03b2e15de13a18da52590c237ecf5f188,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,21.4671799758725,TRUE,IFEval,0.316714096375395,31.6714096375395,BBH,0.600708022926803,42.5367522410743,MATH Level 5,0,0,GPQA,0.338926174496644,11.8568232662192,MUSR,0.416604166666667,11.3421875,MMLU-PRO,0.382563164893617,31.3959072104019,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-29,2024-07-31,0,UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3,gemma,119,9.242,2.81515014948886 UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter1_bfloat16_2076437f65776aeb9686c95f1f41515f70c4db27_True,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter1,2076437f65776aeb9686c95f1f41515f70c4db27,bfloat16,chatmodels,Original,LlamaForCausalLM,24.6400773055141,TRUE,IFEval,0.72989889049943,72.989889049943,BBH,0.505789069108271,29.489353188072,MATH Level 5,0.107250755287009,10.7250755287009,GPQA,0.26761744966443,2.3489932885906,MUSR,0.356791666666667,2.165625,MMLU-PRO,0.37109375,30.1215277777778,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-25,2024-09-21,0,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter1,apache-2.0,1,8.03,0.701228912473034 UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2_bfloat16_730c7207d4b538feeb3c2e6d6f6a6ba8615a9be3_True,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2,730c7207d4b538feeb3c2e6d6f6a6ba8615a9be3,bfloat16,chatmodels,Original,LlamaForCausalLM,23.927649495929,TRUE,IFEval,0.698874541771389,69.8874541771389,BBH,0.508869627885296,29.8694493280916,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.266778523489933,2.23713646532438,MUSR,0.359427083333333,1.99505208333334,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-25,2024-08-07,0,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2,apache-2.0,0,8,0.656766723762742 UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3_bfloat16_f73dafc2923acd56f115f21f76e9d14f8d19a63e_True,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,f73dafc2923acd56f115f21f76e9d14f8d19a63e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.4793983222734,TRUE,IFEval,0.683412235091779,68.3412235091779,BBH,0.50795799761689,29.7396835804407,MATH Level 5,0.0830815709969789,8.30815709969789,GPQA,0.26510067114094,2.01342281879195,MUSR,0.3660625,3.09114583333333,MMLU-PRO,0.364444813829787,29.3827570921986,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-25,2024-07-02,0,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,apache-2.0,77,8.03,8.20181186822828 @@ -982,7 +996,7 @@ ValiantLabs/Llama3.2-3B-Enigma_float16_ca6adf3a289ce47c7598139e7a312e2b4b3708ce_ ValiantLabs/Llama3.2-3B-Esper2_float16_64a2c619a2e1680ab42945fcf5b75a5242cab3a1_False,ValiantLabs/Llama3.2-3B-Esper2,64a2c619a2e1680ab42945fcf5b75a5242cab3a1,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,10.7302971407332,FALSE,IFEval,0.274974844523642,27.4974844523642,BBH,0.380826113903661,13.8517329079134,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.27013422818792,2.68456375838927,MUSR,0.354958333333333,4.03645833333333,MMLU-PRO,0.225731382978723,13.9701536643026,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-03,2024-10-09,1,meta-llama/Llama-3.2-3B-Instruct,llama3.2,3,3.213,0.73888435001663 ValiantLabs/Llama3.2-3B-ShiningValiant2_float16_1336e200485675c9b92baae17831eab17c601803_False,ValiantLabs/Llama3.2-3B-ShiningValiant2,1336e200485675c9b92baae17831eab17c601803,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2144620627591,FALSE,IFEval,0.262510139762497,26.2510139762497,BBH,0.422593253378702,18.9127087830015,MATH Level 5,0.0717522658610272,7.17522658610272,GPQA,0.280201342281879,4.0268456375839,MUSR,0.386645833333333,8.59739583333334,MMLU-PRO,0.282912234042553,20.3235815602837,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-27,2024-11-05,1,meta-llama/Llama-3.2-3B-Instruct,llama3.2,3,3.213,2.85629887818233 Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24_float16_c0b57cf6d4444b35fc5cec0525ff5eef32af22c9_True,Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24,c0b57cf6d4444b35fc5cec0525ff5eef32af22c9,float16,chatmodels,Original,LlamaForCausalLM,24.8388385724359,TRUE,IFEval,0.643145742186288,64.3145742186288,BBH,0.527224269970207,32.6694172942473,MATH Level 5,0.186555891238671,18.6555891238671,GPQA,0.24496644295302,0,MUSR,0.375395833333333,5.09114583333334,MMLU-PRO,0.354720744680851,28.302304964539,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-21,1,Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24 (Merge),apache-2.0,26,8.03,0.856611700315968 -Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24_float16_6abd887cb631f705042c9e8085615fe4d76e9779_True,Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24,6abd887cb631f705042c9e8085615fe4d76e9779,float16,chatmodels,Original,MistralForCausalLM,24.4031363985684,TRUE,IFEval,0.599931515046743,59.9931515046743,BBH,0.521230905282762,31.4144091133763,MATH Level 5,0.134441087613293,13.4441087613293,GPQA,0.291107382550336,5.48098434004475,MUSR,0.407302083333333,9.44609375,MMLU-PRO,0.339760638297872,26.6400709219858,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-21,1,Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24 (Merge),apache-2.0,96,12.248,1.72079181191147 +Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24_float16_6abd887cb631f705042c9e8085615fe4d76e9779_True,Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24,6abd887cb631f705042c9e8085615fe4d76e9779,float16,chatmodels,Original,MistralForCausalLM,24.4031363985684,TRUE,IFEval,0.599931515046743,59.9931515046743,BBH,0.521230905282762,31.4144091133763,MATH Level 5,0.134441087613293,13.4441087613293,GPQA,0.291107382550336,5.48098434004475,MUSR,0.407302083333333,9.44609375,MMLU-PRO,0.339760638297872,26.6400709219858,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-20,2024-09-21,1,Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24 (Merge),apache-2.0,97,12.248,1.72079181191147 Weyaxi/Bagel-Hermes-2x34B_bfloat16_44fddd32d7dcafc0fa670fd87a2e129310640aac_True,Weyaxi/Bagel-Hermes-2x34B,44fddd32d7dcafc0fa670fd87a2e129310640aac,bfloat16,chatmodels,Original,MixtralForCausalLM,25.4728041623161,TRUE,IFEval,0.543153277747488,54.3153277747488,BBH,0.491665556322855,27.4090314454288,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.328020134228188,10.4026845637584,MUSR,0.451666666666667,15.625,MMLU-PRO,0.458859707446809,39.8733008274232,TRUE,FALSE,TRUE,FALSE,FALSE,2024-01-12,2024-10-28,0,Weyaxi/Bagel-Hermes-2x34B,apache-2.0,16,60.814,9.81516791030478 Weyaxi/Bagel-Hermes-34B-Slerp_bfloat16_dcdcc17a2c650a95bc27129a3ddbf261dffed37f_False,Weyaxi/Bagel-Hermes-34B-Slerp,dcdcc17a2c650a95bc27129a3ddbf261dffed37f,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,27.2090932781494,FALSE,IFEval,0.460272078086145,46.0272078086145,BBH,0.592190360586005,41.9570474805579,MATH Level 5,0.0581570996978852,5.81570996978852,GPQA,0.334731543624161,11.2975391498881,MUSR,0.462208333333333,17.009375,MMLU-PRO,0.470329122340426,41.1476802600473,TRUE,TRUE,FALSE,FALSE,FALSE,2024-01-12,2024-08-30,0,Weyaxi/Bagel-Hermes-34B-Slerp,apache-2.0,1,34.389,3.02137549848606 Weyaxi/Einstein-v4-7B_bfloat16_7eecd9833b8a012e23ac1df789884888b047baa0_True,Weyaxi/Einstein-v4-7B,7eecd9833b8a012e23ac1df789884888b047baa0,bfloat16,chatmodels,Original,MistralForCausalLM,16.7682521716074,TRUE,IFEval,0.470812998399801,47.0812998399802,BBH,0.384946996927418,14.3044514172073,MATH Level 5,0.0196374622356496,1.96374622356496,GPQA,0.281879194630873,4.25055928411633,MUSR,0.468166666666667,19.0208333333333,MMLU-PRO,0.225897606382979,13.9886229314421,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-22,2024-06-26,1,mistralai/Mistral-7B-v0.1,other,47,7.242,0.667754010854814 @@ -1025,7 +1039,7 @@ ZeroXClem/Qwen2.5-7B-HomerCreative-Mix_bfloat16_6849553db73428ca67823a06f5cfeea6 ZeroXClem/Qwen2.5-7B-Qandora-CySec_bfloat16_6c8b513dbc61a9f704210d26124244f19f3bc4cc_True,ZeroXClem/Qwen2.5-7B-Qandora-CySec,6c8b513dbc61a9f704210d26124244f19f3bc4cc,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,30.9535098871614,TRUE,IFEval,0.677317295886027,67.7317295886027,BBH,0.549002266368929,36.2648981658979,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.300335570469799,6.71140939597315,MUSR,0.428604166666667,13.4088541666667,MMLU-PRO,0.448470744680851,38.7189716312057,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-12,2024-11-12,1,ZeroXClem/Qwen2.5-7B-Qandora-CySec (Merge),apache-2.0,3,7.616,0.682080291831643 ZeusLabs/L3-Aethora-15B-V2_bfloat16_2c601f116c37dd912c89357dbdbef879a637997e_True,ZeusLabs/L3-Aethora-15B-V2,2c601f116c37dd912c89357dbdbef879a637997e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.6735374098962,TRUE,IFEval,0.720806349375213,72.0806349375213,BBH,0.50109104654637,28.9685046953127,MATH Level 5,0.0793051359516616,7.93051359516616,GPQA,0.287751677852349,5.03355704697987,MUSR,0.387083333333333,6.25208333333334,MMLU-PRO,0.349983377659575,27.7759308510638,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-27,2024-06-27,1,ZeusLabs/L3-Aethora-15B-V2 (Merge),cc-by-sa-4.0,40,15.01,2.377668733892 ZhangShenao/SELM-Llama-3-8B-Instruct-iter-3_bfloat16_9c95ccdeceed14a3c2881bc495101a1acca1385f_True,ZhangShenao/SELM-Llama-3-8B-Instruct-iter-3,9c95ccdeceed14a3c2881bc495101a1acca1385f,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,23.6527060288546,TRUE,IFEval,0.690281785662043,69.0281785662043,BBH,0.504608939077051,29.0785308840227,MATH Level 5,0.0626888217522659,6.26888217522659,GPQA,0.258389261744966,1.11856823266219,MUSR,0.384510416666667,5.49713541666667,MMLU-PRO,0.378324468085106,30.9249408983452,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-25,2024-07-02,3,meta-llama/Meta-Llama-3-8B-Instruct,mit,5,8.03,0.655590932177198 -aaditya/Llama3-OpenBioLLM-70B_bfloat16_5f79deaf38bc5f662943d304d59cb30357e8e5bd_True,aaditya/Llama3-OpenBioLLM-70B,5f79deaf38bc5f662943d304d59cb30357e8e5bd,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.0041966456474,TRUE,IFEval,0.759674330775675,75.9674330775675,BBH,0.639887237548552,47.1470746771679,MATH Level 5,0.198640483383686,19.8640483383686,GPQA,0.322986577181208,9.73154362416107,MUSR,0.44171875,14.3481770833333,MMLU-PRO,0.486702127659575,42.9669030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-24,2024-08-30,2,meta-llama/Meta-Llama-3-70B,llama3,358,70,9.6570223229552 +aaditya/Llama3-OpenBioLLM-70B_bfloat16_5f79deaf38bc5f662943d304d59cb30357e8e5bd_True,aaditya/Llama3-OpenBioLLM-70B,5f79deaf38bc5f662943d304d59cb30357e8e5bd,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,35.0041966456474,TRUE,IFEval,0.759674330775675,75.9674330775675,BBH,0.639887237548552,47.1470746771679,MATH Level 5,0.198640483383686,19.8640483383686,GPQA,0.322986577181208,9.73154362416107,MUSR,0.44171875,14.3481770833333,MMLU-PRO,0.486702127659575,42.9669030732861,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-24,2024-08-30,2,meta-llama/Meta-Llama-3-70B,llama3,359,70,9.6570223229552 abacusai/Dracarys-72B-Instruct_bfloat16_10cabc4beb57a69df51533f65e39a7ad22821370_True,abacusai/Dracarys-72B-Instruct,10cabc4beb57a69df51533f65e39a7ad22821370,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,42.7100419445772,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.694406639208498,56.9355201000337,MATH Level 5,0.356495468277946,35.6495468277946,GPQA,0.390939597315436,18.7919463087248,MUSR,0.455822916666667,16.8111979166667,MMLU-PRO,0.545628324468085,49.5142582742317,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-14,2024-08-16,0,abacusai/Dracarys-72B-Instruct,other,20,72.706,12.3834640727275 abacusai/Liberated-Qwen1.5-14B_float16_cc0fa5102bfee821bb5e49f082731ccb9d1fedf1_True,abacusai/Liberated-Qwen1.5-14B,cc0fa5102bfee821bb5e49f082731ccb9d1fedf1,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,19.866148278783,TRUE,IFEval,0.36310212458499,36.310212458499,BBH,0.494800091746719,28.0209059996855,MATH Level 5,0.121601208459215,12.1601208459215,GPQA,0.283557046979866,4.47427293064877,MUSR,0.41746875,10.3169270833333,MMLU-PRO,0.351230053191489,27.9144503546099,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-05,2024-09-05,0,abacusai/Liberated-Qwen1.5-14B,other,21,14,4.07731190007935 abacusai/Llama-3-Smaug-8B_bfloat16_fe54a7d42160d3d8fcc3289c8c411fd9dd5e8357_True,abacusai/Llama-3-Smaug-8B,fe54a7d42160d3d8fcc3289c8c411fd9dd5e8357,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.9670574419879,TRUE,IFEval,0.486675354725462,48.6675354725462,BBH,0.493071276966717,27.8803741894159,MATH Level 5,0.0793051359516616,7.93051359516616,GPQA,0.248322147651007,0,MUSR,0.36225,5.04791666666666,MMLU-PRO,0.318484042553192,24.2760047281324,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-19,2024-07-02,0,abacusai/Llama-3-Smaug-8B,llama2,87,8.03,0.910218264650151 @@ -1054,7 +1068,7 @@ akjindal53244/Llama-3.1-Storm-8B_float16_df21b06dcf534b026dd301a44a521d7253c8b94 alcholjung/llama3_medical_tuned_float16_62bd457b6fe961a42a631306577e622c83876cb6_False,alcholjung/llama3_medical_tuned,62bd457b6fe961a42a631306577e622c83876cb6,float16,fine-tunedondomain-specificdatasets,Adapter,?,11.3060714020907,FALSE,IFEval,0.0105664082412443,1.05664082412443,BBH,0.451294319166093,23.2650890249695,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.286073825503356,4.80984340044743,MUSR,0.466020833333333,16.8526041666667,MMLU-PRO,0.294630984042553,21.625664893617,FALSE,FALSE,FALSE,FALSE,FALSE,2024-08-14,2024-08-14,0,alcholjung/llama3_medical_tuned,"",0,16.061,0.910721097346861 allenai/Llama-3.1-Tulu-3-70B_bfloat16_c4280450c0cd91a2fb6f41a25c6a1662c6966b01_True,allenai/Llama-3.1-Tulu-3-70B,c4280450c0cd91a2fb6f41a25c6a1662c6966b01,bfloat16,chatmodels,Original,LlamaForCausalLM,41.1988568717258,TRUE,IFEval,0.829116743573718,82.9116743573718,BBH,0.616362649619995,45.3655686174063,MATH Level 5,0.382175226586103,38.2175226586103,GPQA,0.373322147651007,16.4429530201342,MUSR,0.494833333333333,23.7541666666667,MMLU-PRO,0.464511303191489,40.5012559101655,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B (Merge),llama3.1,44,70.554,36.5930504800871 allenai/Llama-3.1-Tulu-3-70B_float16_c4280450c0cd91a2fb6f41a25c6a1662c6966b01_True,allenai/Llama-3.1-Tulu-3-70B,c4280450c0cd91a2fb6f41a25c6a1662c6966b01,float16,chatmodels,Original,LlamaForCausalLM,41.4545274065984,TRUE,IFEval,0.837934458348294,83.7934458348294,BBH,0.615684716955611,45.259480995205,MATH Level 5,0.382930513595166,38.2930513595166,GPQA,0.373322147651007,16.4429530201342,MUSR,0.498802083333333,24.3169270833333,MMLU-PRO,0.465591755319149,40.6213061465721,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B (Merge),llama3.1,44,70.554,38.022026223354 -allenai/Llama-3.1-Tulu-3-70B-DPO_bfloat16_6ea110f39fb660573111892a1381d3be3f826f80_True,allenai/Llama-3.1-Tulu-3-70B-DPO,6ea110f39fb660573111892a1381d3be3f826f80,bfloat16,chatmodels,Original,LlamaForCausalLM,41.2047774579198,TRUE,IFEval,0.828192529155973,82.8192529155973,BBH,0.61462036269585,45.0471809195084,MATH Level 5,0.38821752265861,38.821752265861,GPQA,0.375838926174497,16.7785234899329,MUSR,0.492260416666667,23.39921875,MMLU-PRO,0.463264627659575,40.3627364066194,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B-DPO (Merge),llama3.1,7,70,36.8007490331295 +allenai/Llama-3.1-Tulu-3-70B-DPO_bfloat16_6ea110f39fb660573111892a1381d3be3f826f80_True,allenai/Llama-3.1-Tulu-3-70B-DPO,6ea110f39fb660573111892a1381d3be3f826f80,bfloat16,chatmodels,Original,LlamaForCausalLM,41.2047774579198,TRUE,IFEval,0.828192529155973,82.8192529155973,BBH,0.61462036269585,45.0471809195084,MATH Level 5,0.38821752265861,38.821752265861,GPQA,0.375838926174497,16.7785234899329,MUSR,0.492260416666667,23.39921875,MMLU-PRO,0.463264627659575,40.3627364066194,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B-DPO (Merge),llama3.1,8,70,36.8007490331295 allenai/Llama-3.1-Tulu-3-70B-SFT_bfloat16_f58ab66db3a1c5dd805c6d3420b2b4f5aef30041_True,allenai/Llama-3.1-Tulu-3-70B-SFT,f58ab66db3a1c5dd805c6d3420b2b4f5aef30041,bfloat16,chatmodels,Original,LlamaForCausalLM,38.7226108999501,TRUE,IFEval,0.805061680784762,80.5061680784762,BBH,0.595143780058093,42.0239839490646,MATH Level 5,0.324018126888218,32.4018126888218,GPQA,0.344798657718121,12.6398210290828,MUSR,0.502614583333333,24.4934895833333,MMLU-PRO,0.462433510638298,40.270390070922,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-18,2024-11-27,1,allenai/Llama-3.1-Tulu-3-70B-SFT (Merge),llama3.1,4,70.554,27.3383271895368 allenai/Llama-3.1-Tulu-3-8B_bfloat16_63b75e0dd6eac3725319f869716b9b70c16a6a65_True,allenai/Llama-3.1-Tulu-3-8B,63b75e0dd6eac3725319f869716b9b70c16a6a65,bfloat16,chatmodels,Original,LlamaForCausalLM,26.0349980816721,TRUE,IFEval,0.826668794354535,82.6668794354535,BBH,0.404983310273191,16.671812993248,MATH Level 5,0.196374622356495,19.6374622356495,GPQA,0.298657718120805,6.48769574944072,MUSR,0.41746875,10.4502604166667,MMLU-PRO,0.28266289893617,20.2958776595745,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-21,1,allenai/Llama-3.1-Tulu-3-8B (Merge),llama3.1,108,8.03,0.703774148994329 allenai/Llama-3.1-Tulu-3-8B_float16_50fef8756a9a4ca2010587d128aebb3a18ec897d_True,allenai/Llama-3.1-Tulu-3-8B,50fef8756a9a4ca2010587d128aebb3a18ec897d,float16,chatmodels,Original,LlamaForCausalLM,25.8832245109219,TRUE,IFEval,0.825469753587149,82.5469753587149,BBH,0.40608256120952,16.8580520694028,MATH Level 5,0.188821752265861,18.8821752265861,GPQA,0.296979865771812,6.26398210290828,MUSR,0.41746875,10.5169270833333,MMLU-PRO,0.282081117021277,20.2312352245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-20,2024-11-28,1,allenai/Llama-3.1-Tulu-3-8B (Merge),llama3.1,108,8.03,0.701232116583257 @@ -1154,7 +1168,7 @@ allknowingroger/Yunconglong-13B-slerp_bfloat16_dead687b7342d875bd8ac73bfcd34b88a allknowingroger/limyClown-7B-slerp_bfloat16_732a1ed0c2c7007297ad9d9797793073825f65ca_False,allknowingroger/limyClown-7B-slerp,732a1ed0c2c7007297ad9d9797793073825f65ca,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,19.7038886947961,FALSE,IFEval,0.401745147320221,40.1745147320221,BBH,0.514751731705597,31.9314661071385,MATH Level 5,0.0687311178247734,6.87311178247734,GPQA,0.281040268456376,4.13870246085012,MUSR,0.4293125,12.4640625,MMLU-PRO,0.303773271276596,22.6414745862884,TRUE,TRUE,FALSE,FALSE,FALSE,2024-03-23,2024-06-26,1,allknowingroger/limyClown-7B-slerp (Merge),apache-2.0,0,7.242,0.610050396647597 allknowingroger/llama3-Jallabi-40B-s_float16_a86d8cc3530fb466245b2cac55f25c28d0bd8c22_False,allknowingroger/llama3-Jallabi-40B-s,a86d8cc3530fb466245b2cac55f25c28d0bd8c22,float16,basemergesandmoerges,Original,LlamaForCausalLM,5.02970163690686,FALSE,IFEval,0.192068156934711,19.2068156934711,BBH,0.325224241985263,5.95791156295821,MATH Level 5,0,0,GPQA,0.23741610738255,0,MUSR,0.374958333333333,4.03645833333333,MMLU-PRO,0.108793218085106,0.977024231678486,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-19,0,Removed,"",0,18.769,0.979574739798707 allknowingroger/llama3AnFeng-40B_float16_5995441962287970ffc98ad9b292e14420bf49ca_False,allknowingroger/llama3AnFeng-40B,5995441962287970ffc98ad9b292e14420bf49ca,float16,basemergesandmoerges,Original,LlamaForCausalLM,9.23799437810072,FALSE,IFEval,0.174207768720329,17.4207768720329,BBH,0.379408044766034,12.4769961857253,MATH Level 5,0,0,GPQA,0.306208053691275,7.49440715883669,MUSR,0.394,7.15,MMLU-PRO,0.197972074468085,10.8857860520095,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-09-19,0,Removed,"",0,39.971,4.06346810125561 -allura-org/MS-Meadowlark-22B_bfloat16_6eb2f6bee66dbffa1b17397e75a7380ed4f9d0ac_True,allura-org/MS-Meadowlark-22B,6eb2f6bee66dbffa1b17397e75a7380ed4f9d0ac,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,26.3930298651709,TRUE,IFEval,0.669698621878837,66.9698621878837,BBH,0.516257693321777,30.2965804466696,MATH Level 5,0.141238670694864,14.1238670694864,GPQA,0.325503355704698,10.0671140939597,MUSR,0.384260416666667,5.53255208333333,MMLU-PRO,0.382313829787234,31.3682033096927,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-18,2024-10-24,1,allura-org/MS-Meadowlark-22B (Merge),other,9,22.247,2.89590158379718 +allura-org/MS-Meadowlark-22B_bfloat16_6eb2f6bee66dbffa1b17397e75a7380ed4f9d0ac_True,allura-org/MS-Meadowlark-22B,6eb2f6bee66dbffa1b17397e75a7380ed4f9d0ac,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,26.3930298651709,TRUE,IFEval,0.669698621878837,66.9698621878837,BBH,0.516257693321777,30.2965804466696,MATH Level 5,0.141238670694864,14.1238670694864,GPQA,0.325503355704698,10.0671140939597,MUSR,0.384260416666667,5.53255208333333,MMLU-PRO,0.382313829787234,31.3682033096927,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-18,2024-10-24,1,allura-org/MS-Meadowlark-22B (Merge),other,10,22.247,2.89590158379718 allura-org/MoE-Girl-1BA-7BT_bfloat16_ecfac73ab9e7f2ee006d6a2ad9c8e86a85deab2b_True,allura-org/MoE-Girl-1BA-7BT,ecfac73ab9e7f2ee006d6a2ad9c8e86a85deab2b,bfloat16,fine-tunedondomain-specificdatasets,Original,OlmoeForCausalLM,6.39021099096268,TRUE,IFEval,0.270503375488149,27.0503375488149,BBH,0.313917536326241,4.8423440285205,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.258389261744966,1.11856823266219,MUSR,0.343552083333333,1.47734375,MMLU-PRO,0.121758643617021,2.41762706855792,TRUE,FALSE,TRUE,FALSE,FALSE,2024-10-08,2024-10-10,1,allenai/OLMoE-1B-7B-0924,apache-2.0,14,6.919,3.20115464710205 aloobun/Meta-Llama-3-7B-28Layers_bfloat16_9822e6b8d4de0c0f2964d299f6fcef72385a0341_False,aloobun/Meta-Llama-3-7B-28Layers,9822e6b8d4de0c0f2964d299f6fcef72385a0341,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.1365160784577,FALSE,IFEval,0.196364534989384,19.6364534989384,BBH,0.443749701425339,22.0965302513435,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.294463087248322,5.92841163310962,MUSR,0.358927083333333,5.79921875,MMLU-PRO,0.315990691489362,23.9989657210402,TRUE,TRUE,FALSE,FALSE,FALSE,2024-05-10,2024-06-26,1,aloobun/Meta-Llama-3-7B-28Layers (Merge),llama3,0,7.158,0.809358294835876 aloobun/d-SmolLM2-360M_bfloat16_2a1d82b4cbcdfdff3c2cfcd171435c5f01b8de43_False,aloobun/d-SmolLM2-360M,2a1d82b4cbcdfdff3c2cfcd171435c5f01b8de43,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,6.00783726880815,FALSE,IFEval,0.209703586483863,20.9703586483863,BBH,0.319578440563683,4.76282074716569,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.253355704697987,0.447427293064876,MUSR,0.3980625,7.7578125,MMLU-PRO,0.116938164893617,1.882018321513,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-20,2024-11-26,0,aloobun/d-SmolLM2-360M,apache-2.0,1,0.362,0.370123277612295 @@ -1179,13 +1193,13 @@ anthracite-org/magnum-v4-27b_bfloat16_50a14716bdeb6a9376b9377df31ab1497864f3f9_F anthracite-org/magnum-v4-9b_bfloat16_e9db6cb80f02ca2e2db4538ef59f7a30f69a849d_False,anthracite-org/magnum-v4-9b,e9db6cb80f02ca2e2db4538ef59f7a30f69a849d,bfloat16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,23.7738183884644,FALSE,IFEval,0.350262858105383,35.0262858105383,BBH,0.533642399193156,33.2704044364764,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.347315436241611,12.9753914988814,MUSR,0.451572916666667,15.6466145833333,MMLU-PRO,0.395279255319149,32.8088061465721,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-20,2024-10-23,0,anthracite-org/magnum-v4-9b,gemma,14,9.242,2.55632615106111 apple/DCLM-7B_bfloat16_c85bfa168f999ce27e954808bc005a2748fda5c5_False,apple/DCLM-7B,c85bfa168f999ce27e954808bc005a2748fda5c5,bfloat16,pretrained,Original,OpenLMModel,13.9869771215513,FALSE,IFEval,0.217272392806642,21.7272392806642,BBH,0.423214236681842,19.7609349747722,MATH Level 5,0.0294561933534743,2.94561933534743,GPQA,0.315436241610738,8.7248322147651,MUSR,0.392072916666667,7.30911458333333,MMLU-PRO,0.31108710106383,23.4541223404255,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-11,2024-08-16,0,apple/DCLM-7B,apple-ascl,828,7,0.629955551509212 appvoid/arco-2_float16_9bec3c42c5bb557eb218513f4fe26c4edc803f0f_False,appvoid/arco-2,9bec3c42c5bb557eb218513f4fe26c4edc803f0f,float16,basemergesandmoerges,Original,LlamaForCausalLM,4.94827908660223,FALSE,IFEval,0.199137178242618,19.9137178242619,BBH,0.314566762748308,4.05915006958283,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.239093959731544,0,MUSR,0.35359375,4.19921875,MMLU-PRO,0.111619015957447,1.29100177304964,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-22,2024-12-23,0,appvoid/arco-2,apache-2.0,7,0.257,0.158147024487816 -arcee-ai/Arcee-Nova_bfloat16_ec3bfe88b83f81481daa04b6789c1e0d32827dc5_True,arcee-ai/Arcee-Nova,ec3bfe88b83f81481daa04b6789c1e0d32827dc5,bfloat16,chatmodels,Original,Qwen2ForCausalLM,43.9023352264525,TRUE,IFEval,0.790748547188128,79.0748547188128,BBH,0.694196965855899,56.7409875395207,MATH Level 5,0.429003021148036,42.9003021148036,GPQA,0.38506711409396,18.0089485458613,MUSR,0.456166666666667,17.2208333333333,MMLU-PRO,0.545212765957447,49.468085106383,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-09-19,0,arcee-ai/Arcee-Nova,other,48,72.706,11.4932935647508 +arcee-ai/Arcee-Nova_bfloat16_ec3bfe88b83f81481daa04b6789c1e0d32827dc5_True,arcee-ai/Arcee-Nova,ec3bfe88b83f81481daa04b6789c1e0d32827dc5,bfloat16,chatmodels,Original,Qwen2ForCausalLM,43.9023352264525,TRUE,IFEval,0.790748547188128,79.0748547188128,BBH,0.694196965855899,56.7409875395207,MATH Level 5,0.429003021148036,42.9003021148036,GPQA,0.38506711409396,18.0089485458613,MUSR,0.456166666666667,17.2208333333333,MMLU-PRO,0.545212765957447,49.468085106383,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-09-19,0,arcee-ai/Arcee-Nova,other,49,72.706,11.4932935647508 arcee-ai/Arcee-Spark_bfloat16_3fe368ea5fd32bc4a8d1bcf42510416f7fa28668_True,arcee-ai/Arcee-Spark,3fe368ea5fd32bc4a8d1bcf42510416f7fa28668,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,25.5364556314038,TRUE,IFEval,0.562087483432847,56.2087483432847,BBH,0.548947419856745,37.1385224558447,MATH Level 5,0.123111782477341,12.3111782477341,GPQA,0.307046979865772,7.60626398210291,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.382230718085106,31.3589686761229,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-22,2024-06-26,0,arcee-ai/Arcee-Spark,apache-2.0,86,7.616,1.09853282777225 arcee-ai/Arcee-Spark_float16_3fe368ea5fd32bc4a8d1bcf42510416f7fa28668_True,arcee-ai/Arcee-Spark,3fe368ea5fd32bc4a8d1bcf42510416f7fa28668,float16,chatmodels,Original,Qwen2ForCausalLM,25.4431687473776,TRUE,IFEval,0.571829412625168,57.1829412625168,BBH,0.548086411471413,36.9243904358649,MATH Level 5,0.11404833836858,11.404833836858,GPQA,0.306208053691275,7.49440715883669,MUSR,0.400760416666667,8.39505208333334,MMLU-PRO,0.381316489361702,31.2573877068558,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-22,2024-06-26,0,arcee-ai/Arcee-Spark,apache-2.0,86,7.616,1.13604019364973 arcee-ai/Llama-3.1-SuperNova-Lite_bfloat16_76246ca4448c1a11787daee0958b60ab27f17774_True,arcee-ai/Llama-3.1-SuperNova-Lite,76246ca4448c1a11787daee0958b60ab27f17774,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,30.0424065786489,TRUE,IFEval,0.801739384832245,80.1739384832245,BBH,0.515199211510482,31.5723402129807,MATH Level 5,0.173716012084592,17.3716012084592,GPQA,0.306208053691275,7.49440715883669,MUSR,0.416322916666667,11.6736979166667,MMLU-PRO,0.387716090425532,31.9684544917258,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-10,2024-09-17,2,meta-llama/Meta-Llama-3.1-8B,llama3,182,8.03,0.855993385011881 arcee-ai/Llama-Spark_bfloat16_6d74a617fbb17a1ada08528f2673c89f84fb062e_True,arcee-ai/Llama-Spark,6d74a617fbb17a1ada08528f2673c89f84fb062e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,24.9224332761527,TRUE,IFEval,0.791073241222179,79.1073241222179,BBH,0.505350414574998,29.7702537002086,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.299496644295302,6.59955257270694,MUSR,0.359333333333333,2.61666666666667,MMLU-PRO,0.372091090425532,30.2323433806147,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-08-08,0,arcee-ai/Llama-Spark,llama3,26,8.03,0.830714101745732 arcee-ai/SuperNova-Medius_bfloat16_e34fafcac2801be1ae5c7eb744e191a08119f2af_True,arcee-ai/SuperNova-Medius,e34fafcac2801be1ae5c7eb744e191a08119f2af,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,33.8924710529695,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.637728446311571,48.0050146271633,MATH Level 5,0.153323262839879,15.3323262839879,GPQA,0.333053691275168,11.0738255033557,MUSR,0.423270833333333,12.2755208333333,MMLU-PRO,0.503490691489362,44.8322990543735,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-02,2024-10-22,1,arcee-ai/SuperNova-Medius (Merge),apache-2.0,196,14.77,5.86781166745177 -arcee-ai/Virtuoso-Small_bfloat16_ca5dec1c6351ba6f2f0c59e609b94628a29c1459_True,arcee-ai/Virtuoso-Small,ca5dec1c6351ba6f2f0c59e609b94628a29c1459,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,39.4283232965703,TRUE,IFEval,0.793521190441362,79.3521190441362,BBH,0.651763312945478,50.3998463118999,MATH Level 5,0.342900302114804,34.2900302114804,GPQA,0.336409395973154,11.5212527964206,MUSR,0.43390625,14.43828125,MMLU-PRO,0.519115691489362,46.5684101654846,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-03,1,arcee-ai/Virtuoso-Small (Merge),apache-2.0,39,14.77,1.51431412160642 +arcee-ai/Virtuoso-Small_bfloat16_ca5dec1c6351ba6f2f0c59e609b94628a29c1459_True,arcee-ai/Virtuoso-Small,ca5dec1c6351ba6f2f0c59e609b94628a29c1459,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,39.4283232965703,TRUE,IFEval,0.793521190441362,79.3521190441362,BBH,0.651763312945478,50.3998463118999,MATH Level 5,0.342900302114804,34.2900302114804,GPQA,0.336409395973154,11.5212527964206,MUSR,0.43390625,14.43828125,MMLU-PRO,0.519115691489362,46.5684101654846,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-03,1,arcee-ai/Virtuoso-Small (Merge),apache-2.0,41,14.77,1.51431412160642 arcee-ai/raspberry-3B_bfloat16_66bf1346c060bbfe1f1b98cd22e7a26ada69cf70_True,arcee-ai/raspberry-3B,66bf1346c060bbfe1f1b98cd22e7a26ada69cf70,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,15.5380031214432,TRUE,IFEval,0.315416428409952,31.5416428409952,BBH,0.42689280188827,19.5282344009925,MATH Level 5,0.0845921450151058,8.45921450151058,GPQA,0.277684563758389,3.69127516778523,MUSR,0.412322916666667,9.40703125,MMLU-PRO,0.285405585106383,20.6006205673759,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-05,2024-10-07,1,Qwen/Qwen2.5-3B,other,37,3.086,1.03652651773508 argilla/notus-7b-v1_bfloat16_30172203a2d41cb487bf7e2b92a821080783b2c9_True,argilla/notus-7b-v1,30172203a2d41cb487bf7e2b92a821080783b2c9,bfloat16,chatmodels,Original,MistralForCausalLM,18.4113211888546,TRUE,IFEval,0.508207112683236,50.8207112683236,BBH,0.45118574073815,22.7471119611614,MATH Level 5,0.0279456193353474,2.79456193353474,GPQA,0.289429530201342,5.2572706935123,MUSR,0.336416666666667,6.58541666666667,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-16,2024-06-27,2,mistralai/Mistral-7B-v0.1,mit,122,7.242,0.667908131155709 argilla/notux-8x7b-v1_bfloat16_0b29f9afcbae2ab4c5085638d8f5a7f6d44c6b17_True,argilla/notux-8x7b-v1,0b29f9afcbae2ab4c5085638d8f5a7f6d44c6b17,bfloat16,chatmodels,Original,MixtralForCausalLM,24.4282310956467,TRUE,IFEval,0.542229063329743,54.2229063329743,BBH,0.536330416451635,34.7580616829018,MATH Level 5,0.0966767371601208,9.66767371601208,GPQA,0.308724832214765,7.82997762863535,MUSR,0.41759375,10.5325520833333,MMLU-PRO,0.366023936170213,29.5582151300237,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-12,2024-06-12,2,mistralai/Mixtral-8x7B-v0.1,apache-2.0,165,46.703,21.3908445719779 @@ -1214,6 +1228,7 @@ bamec66557/MISCHIEVOUS-12B-Mix_III_IV_V_bfloat16_651323f625a3b0f982bd0ca294b7293 bamec66557/MISCHIEVOUS-12B-Mix_III_ex_V_bfloat16_3af16a4f7be269c0483ba7ff3c7ea70c5843a44d_False,bamec66557/MISCHIEVOUS-12B-Mix_III_ex_V,3af16a4f7be269c0483ba7ff3c7ea70c5843a44d,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,23.7952538160544,FALSE,IFEval,0.431620322965288,43.1620322965288,BBH,0.544892689125407,34.8686348943506,MATH Level 5,0.131419939577039,13.1419939577039,GPQA,0.320469798657718,9.39597315436242,MUSR,0.419791666666667,12.7739583333333,MMLU-PRO,0.364860372340426,29.4289302600473,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-17,2024-12-18,1,bamec66557/MISCHIEVOUS-12B-Mix_III_ex_V (Merge),apache-2.0,0,6.124,1.07950239643296 bamec66557/MISCHIEVOUS-12B-Mix_Neo_bfloat16_a3f902a40e0e6a1b7abdefe70e8cd14929deddc9_True,bamec66557/MISCHIEVOUS-12B-Mix_Neo,a3f902a40e0e6a1b7abdefe70e8cd14929deddc9,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,25.8007316140612,TRUE,IFEval,0.624960659937854,62.4960659937854,BBH,0.507757472871752,30.3606897425242,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.316275167785235,8.83668903803132,MUSR,0.415020833333333,11.6442708333333,MMLU-PRO,0.368517287234043,29.8352541371158,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,bamec66557/MISCHIEVOUS-12B-Mix_Neo (Merge),apache-2.0,1,6.124,1.00545013428172 bamec66557/Mistral-Nemo-VICIOUS_MESH-12B-2407_bfloat16_5e11cfae129186b2479fb01211d565a16eed1f02_True,bamec66557/Mistral-Nemo-VICIOUS_MESH-12B-2407,5e11cfae129186b2479fb01211d565a16eed1f02,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,27.2681193004847,TRUE,IFEval,0.670572968612171,67.0572968612171,BBH,0.515596428572409,31.3566073935338,MATH Level 5,0.123867069486405,12.3867069486405,GPQA,0.315436241610738,8.7248322147651,MUSR,0.430989583333333,14.3403645833333,MMLU-PRO,0.367686170212766,29.7429078014184,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-22,2024-12-22,1,bamec66557/Mistral-Nemo-VICIOUS_MESH-12B-2407 (Merge),apache-2.0,2,6.124,1.95466791866422 +bamec66557/NameLess-12B-prob_bfloat16_eb53d01a5d573356c16b6235679e84567f599e33_True,bamec66557/NameLess-12B-prob,eb53d01a5d573356c16b6235679e84567f599e33,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,26.9372864818212,TRUE,IFEval,0.660231519036157,66.0231519036157,BBH,0.51581410191513,31.3557280590341,MATH Level 5,0.111027190332326,11.1027190332326,GPQA,0.314597315436242,8.61297539149888,MUSR,0.433625,14.703125,MMLU-PRO,0.368434175531915,29.8260195035461,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,0,bamec66557/NameLess-12B-prob,apache-2.0,0,6.124,0.961466441708975 bamec66557/VICIOUS_MESH-12B_bfloat16_4a0a2cf1eca5766badb8ff2853e15f045de71a92_False,bamec66557/VICIOUS_MESH-12B,4a0a2cf1eca5766badb8ff2853e15f045de71a92,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.7302307814069,FALSE,IFEval,0.373093392199364,37.3093392199364,BBH,0.543602252458766,34.3725160302973,MATH Level 5,0.129909365558912,12.9909365558912,GPQA,0.328020134228188,10.4026845637584,MUSR,0.410489583333333,11.54453125,MMLU-PRO,0.367852393617021,29.7613770685579,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-18,0,Removed,"",0,6.124,2.21832596940297 bamec66557/VICIOUS_MESH-12B-0.1v_bfloat16_14e82cd2858767003bed53db1c0de82f6c7dd9bf_False,bamec66557/VICIOUS_MESH-12B-0.1v,14e82cd2858767003bed53db1c0de82f6c7dd9bf,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.3991009779179,FALSE,IFEval,0.365749544541816,36.5749544541816,BBH,0.541227600452917,34.1302381345742,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.324664429530201,9.95525727069351,MUSR,0.415822916666667,11.0111979166667,MMLU-PRO,0.36826795212766,29.8075502364066,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-18,0,Removed,"",0,6.124,1.07445876466654 bamec66557/VICIOUS_MESH-12B-0.X.ver_bfloat16_93bdb2c1d5644217e5f5e9bcbf669b18e3b05851_False,bamec66557/VICIOUS_MESH-12B-0.X.ver,93bdb2c1d5644217e5f5e9bcbf669b18e3b05851,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.6279499130824,FALSE,IFEval,0.377564861234857,37.7564861234857,BBH,0.541624689936422,34.0892473853206,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.321308724832215,9.50782997762864,MUSR,0.419822916666667,12.8778645833333,MMLU-PRO,0.367104388297872,29.6782653664303,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-18,0,Removed,"",0,6.124,2.23600826848483 @@ -1303,8 +1318,8 @@ cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated_bfloat16_d50be5f22c cognitivecomputations/dolphin-2.9.2-qwen2-72b_bfloat16_e79582577c2bf2af304221af0e8308b7e7d46ca1_True,cognitivecomputations/dolphin-2.9.2-qwen2-72b,e79582577c2bf2af304221af0e8308b7e7d46ca1,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,35.7452923179215,TRUE,IFEval,0.634377895096123,63.4377895096123,BBH,0.629636493958407,47.6961737282619,MATH Level 5,0.20619335347432,20.619335347432,GPQA,0.36996644295302,15.9955257270693,MUSR,0.452072916666667,17.0424479166667,MMLU-PRO,0.547124335106383,49.680481678487,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-27,2024-10-20,1,Qwen/Qwen2-72B,other,132,72,25.1155535276709 cognitivecomputations/dolphin-2.9.2-qwen2-7b_bfloat16_c443c4eb5138ed746ac49ed98bf3c183dc5380ac_True,cognitivecomputations/dolphin-2.9.2-qwen2-7b,c443c4eb5138ed746ac49ed98bf3c183dc5380ac,bfloat16,chatmodels,Original,Qwen2ForCausalLM,21.1839653570505,TRUE,IFEval,0.353459930761491,35.3459930761491,BBH,0.489382637591956,27.9148749532555,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.290268456375839,5.36912751677852,MUSR,0.419145833333333,11.6598958333333,MMLU-PRO,0.405086436170213,33.8984929078014,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-24,2024-07-10,1,Qwen/Qwen2-7B,apache-2.0,63,7.616,1.27919726982431 cognitivecomputations/dolphin-2.9.3-Yi-1.5-34B-32k_bfloat16_ff4eee6438194a670a95dff3118b5231eb568610_True,cognitivecomputations/dolphin-2.9.3-Yi-1.5-34B-32k,ff4eee6438194a670a95dff3118b5231eb568610,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,27.0732064143377,TRUE,IFEval,0.363926603633914,36.3926603633914,BBH,0.604699553777323,43.4064756523518,MATH Level 5,0.165407854984894,16.5407854984894,GPQA,0.343120805369128,12.4161073825503,MUSR,0.431052083333333,13.3481770833333,MMLU-PRO,0.463015292553192,40.3350325059102,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-23,2024-07-27,1,01-ai/Yi-1.5-34B-32k,apache-2.0,18,34,3.24526052711179 -cognitivecomputations/dolphin-2.9.3-mistral-7B-32k_bfloat16_4f4273ee8e7930dd64e2c6121c79d12546b883e2_True,cognitivecomputations/dolphin-2.9.3-mistral-7B-32k,4f4273ee8e7930dd64e2c6121c79d12546b883e2,bfloat16,chatmodels,Original,MistralForCausalLM,19.3738721831618,TRUE,IFEval,0.412636249595518,41.2636249595518,BBH,0.48125401481062,26.9063538917805,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.285234899328859,4.6979865771812,MUSR,0.464260416666667,17.9325520833333,MMLU-PRO,0.282081117021277,20.2312352245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-25,2024-07-04,1,mistralai/Mistral-7B-v0.3,apache-2.0,46,7.248,0.600082580420255 -cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b_bfloat16_7b535c900688fc836fbeebaeb7133910b09bafda_True,cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b,7b535c900688fc836fbeebaeb7133910b09bafda,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,24.6829041548415,TRUE,IFEval,0.560089451544125,56.0089451544125,BBH,0.548036918314418,36.0827586591529,MATH Level 5,0.0566465256797583,5.66465256797583,GPQA,0.315436241610738,8.7248322147651,MUSR,0.442989583333333,15.20703125,MMLU-PRO,0.337682845744681,26.4092050827423,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-23,2024-07-26,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,91,12.248,1.37514248165786 +cognitivecomputations/dolphin-2.9.3-mistral-7B-32k_bfloat16_4f4273ee8e7930dd64e2c6121c79d12546b883e2_True,cognitivecomputations/dolphin-2.9.3-mistral-7B-32k,4f4273ee8e7930dd64e2c6121c79d12546b883e2,bfloat16,chatmodels,Original,MistralForCausalLM,19.3738721831618,TRUE,IFEval,0.412636249595518,41.2636249595518,BBH,0.48125401481062,26.9063538917805,MATH Level 5,0.0521148036253777,5.21148036253777,GPQA,0.285234899328859,4.6979865771812,MUSR,0.464260416666667,17.9325520833333,MMLU-PRO,0.282081117021277,20.2312352245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-25,2024-07-04,1,mistralai/Mistral-7B-v0.3,apache-2.0,48,7.248,0.600082580420255 +cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b_bfloat16_7b535c900688fc836fbeebaeb7133910b09bafda_True,cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b,7b535c900688fc836fbeebaeb7133910b09bafda,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,24.6829041548415,TRUE,IFEval,0.560089451544125,56.0089451544125,BBH,0.548036918314418,36.0827586591529,MATH Level 5,0.0566465256797583,5.66465256797583,GPQA,0.315436241610738,8.7248322147651,MUSR,0.442989583333333,15.20703125,MMLU-PRO,0.337682845744681,26.4092050827423,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-23,2024-07-26,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,92,12.248,1.37514248165786 cognitivecomputations/dolphin-2.9.4-gemma2-2b_bfloat16_5c0854beb88a6711221771d1b13d51f733e6ca06_True,cognitivecomputations/dolphin-2.9.4-gemma2-2b,5c0854beb88a6711221771d1b13d51f733e6ca06,bfloat16,chatmodels,Original,Gemma2ForCausalLM,9.79744097359818,TRUE,IFEval,0.0895512794939649,8.95512794939649,BBH,0.408131874110552,17.3676325443774,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.284395973154362,4.58612975391499,MUSR,0.41796875,10.9127604166667,MMLU-PRO,0.210521941489362,12.2802157210402,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-24,2024-08-25,1,google/gemma-2-2b,gemma,34,2.614,1.51124801123075 cognitivecomputations/dolphin-2.9.4-llama3.1-8b_bfloat16_7b73d1b7760bf9abac168de3d388b30d1ca1a138_True,cognitivecomputations/dolphin-2.9.4-llama3.1-8b,7b73d1b7760bf9abac168de3d388b30d1ca1a138,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,6.95562754717428,TRUE,IFEval,0.275723967960567,27.5723967960567,BBH,0.352362638508326,8.97208868892153,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.263422818791946,1.78970917225951,MUSR,0.323614583333333,0.618489583333333,MMLU-PRO,0.123670212765957,2.63002364066194,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-04,2024-09-17,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,92,8.03,1.75631302244174 collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2_bfloat16_2560556d655d0ecaefec10f579c92292d65fb28b_False,collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2,2560556d655d0ecaefec10f579c92292d65fb28b,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.9516353382294,FALSE,IFEval,0.380887157187374,38.0887157187374,BBH,0.46480279544899,23.6485031761083,MATH Level 5,0.0574018126888218,5.74018126888218,GPQA,0.333053691275168,11.0738255033557,MUSR,0.343427083333333,1.59505208333333,MMLU-PRO,0.348071808510638,27.5635342789598,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-06-27,0,Removed,"",0,8.03,0.705789134715541 @@ -1318,7 +1333,7 @@ cyberagent/calm3-22b-chat_bfloat16_055922aa0f0fb1fbfbc97a2e31134532485ee99b_True darkc0de/BuddyGlassNeverSleeps_float16_f8849498f02c94b68ef0308a7bf6637264949a7d_False,darkc0de/BuddyGlassNeverSleeps,f8849498f02c94b68ef0308a7bf6637264949a7d,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.8458178279584,FALSE,IFEval,0.423901913589276,42.3901913589276,BBH,0.497722816536468,28.4779534944187,MATH Level 5,0.0641993957703927,6.41993957703927,GPQA,0.294463087248322,5.92841163310962,MUSR,0.399270833333333,8.60885416666667,MMLU-PRO,0.345246010638298,27.2495567375887,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-16,2024-09-16,1,darkc0de/BuddyGlassNeverSleeps (Merge),"",2,8.03,1.35414877415844 darkc0de/BuddyGlass_v0.3_Xortron7MethedUpSwitchedUp_bfloat16_57367fefe01c7d9653c303b28449b416fc777d93_False,darkc0de/BuddyGlass_v0.3_Xortron7MethedUpSwitchedUp,57367fefe01c7d9653c303b28449b416fc777d93,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,22.2653148564924,FALSE,IFEval,0.435842453578727,43.5842453578727,BBH,0.524308799865672,31.869311081858,MATH Level 5,0.124622356495468,12.4622356495468,GPQA,0.298657718120805,6.48769574944072,MUSR,0.414333333333333,9.49166666666667,MMLU-PRO,0.367270611702128,29.6967346335697,FALSE,FALSE,FALSE,FALSE,FALSE,2024-09-10,2024-09-15,1,darkc0de/BuddyGlass_v0.3_Xortron7MethedUpSwitchedUp (Merge),"",2,0.007,0.898182046260927 databricks/dbrx-instruct_bfloat16_c0a9245908c187da8f43a81e538e67ff360904ea_True,databricks/dbrx-instruct,c0a9245908c187da8f43a81e538e67ff360904ea,bfloat16,chatmodels,Original,DbrxForCausalLM,25.1990102724432,TRUE,IFEval,0.541579675261639,54.1579675261639,BBH,0.542896079693439,35.9638196035936,MATH Level 5,0.0687311178247734,6.87311178247734,GPQA,0.341442953020134,12.1923937360179,MUSR,0.426927083333333,12.19921875,MMLU-PRO,0.36826795212766,29.8075502364066,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,databricks/dbrx-instruct,other,1106,131.597,47.95802727312 -databricks/dolly-v1-6b_bfloat16_c9a85b3a322b402e20c839c702c725afe0cb454d_False,databricks/dolly-v1-6b,c9a85b3a322b402e20c839c702c725afe0cb454d,bfloat16,pretrained,Original,GPTJForCausalLM,6.91829112647551,FALSE,IFEval,0.222443117594649,22.2443117594649,BBH,0.31720895287747,4.7813091701327,MATH Level 5,0.0151057401812689,1.51057401812689,GPQA,0.264261744966443,1.90156599552573,MUSR,0.400416666666667,8.11875,MMLU-PRO,0.126579122340426,2.95323581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2023-03-23,2024-06-12,0,databricks/dolly-v1-6b,cc-by-nc-4.0,310,6,0.660779912276233 +databricks/dolly-v1-6b_bfloat16_c9a85b3a322b402e20c839c702c725afe0cb454d_False,databricks/dolly-v1-6b,c9a85b3a322b402e20c839c702c725afe0cb454d,bfloat16,pretrained,Original,GPTJForCausalLM,6.91829112647551,FALSE,IFEval,0.222443117594649,22.2443117594649,BBH,0.31720895287747,4.7813091701327,MATH Level 5,0.0151057401812689,1.51057401812689,GPQA,0.264261744966443,1.90156599552573,MUSR,0.400416666666667,8.11875,MMLU-PRO,0.126579122340426,2.95323581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2023-03-23,2024-06-12,0,databricks/dolly-v1-6b,cc-by-nc-4.0,311,6,0.660779912276233 databricks/dolly-v2-12b_bfloat16_19308160448536e378e3db21a73a751579ee7fdd_False,databricks/dolly-v2-12b,19308160448536e378e3db21a73a751579ee7fdd,bfloat16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,6.3830238203141,FALSE,IFEval,0.235507342739487,23.5507342739487,BBH,0.331997316737713,6.37789413745296,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.240771812080537,0,MUSR,0.37390625,5.50494791666667,MMLU-PRO,0.112865691489362,1.42952127659574,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-11,2024-06-12,0,databricks/dolly-v2-12b,mit,1952,12,1.39711946227966 databricks/dolly-v2-3b_bfloat16_f6c9be08f16fe4d3a719bee0a4a7c7415b5c65df_False,databricks/dolly-v2-3b,f6c9be08f16fe4d3a719bee0a4a7c7415b5c65df,bfloat16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,5.46118895807585,FALSE,IFEval,0.224715975833012,22.4715975833012,BBH,0.307927859615448,3.32476895654539,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.260906040268456,1.45413870246085,MUSR,0.33378125,3.22265625,MMLU-PRO,0.114527925531915,1.61421394799054,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-13,2024-06-12,0,databricks/dolly-v2-3b,mit,287,3,0.758084484077729 databricks/dolly-v2-7b_bfloat16_d632f0c8b75b1ae5b26b250d25bfba4e99cb7c6f_False,databricks/dolly-v2-7b,d632f0c8b75b1ae5b26b250d25bfba4e99cb7c6f,bfloat16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,5.57183177390665,FALSE,IFEval,0.200985607078108,20.0985607078108,BBH,0.317306281220703,5.44989251281721,MATH Level 5,0.00981873111782478,0.981873111782478,GPQA,0.268456375838926,2.46085011185682,MUSR,0.355302083333333,2.77942708333333,MMLU-PRO,0.114943484042553,1.66038711583924,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-13,2024-06-12,0,databricks/dolly-v2-7b,mit,148,7,0.830205993546681 @@ -1351,7 +1366,7 @@ djuna/MN-Chinofun-12B-2_bfloat16_d2aab6837c2ad2dfebb18b15549affd9dd2b8723_True,d djuna/MN-Chinofun-12B-3_bfloat16_fa64c9bc66221946d7425c4eea93828900083d84_True,djuna/MN-Chinofun-12B-3,fa64c9bc66221946d7425c4eea93828900083d84,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,18.1628671753124,TRUE,IFEval,0.305274449571581,30.5274449571581,BBH,0.53478574603334,34.2191964654497,MATH Level 5,0.0868580060422961,8.68580060422961,GPQA,0.265939597315436,2.12527964205817,MUSR,0.419791666666667,10.9072916666667,MMLU-PRO,0.302609707446809,22.5121897163121,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-05,1,djuna/MN-Chinofun-12B-3 (Merge),"",2,12.248,1.2077394247819 djuna/Q2.5-Partron-7B_bfloat16_3a6d3cca23c0e1c6bcba38887fc819729d5d16cf_True,djuna/Q2.5-Partron-7B,3a6d3cca23c0e1c6bcba38887fc819729d5d16cf,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,27.0772475093642,TRUE,IFEval,0.732121881053383,73.2121881053383,BBH,0.541847485072639,35.2572653166736,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.297818791946309,6.3758389261745,MUSR,0.416541666666667,11.0677083333333,MMLU-PRO,0.42827460106383,36.4749556737589,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-08,2024-11-08,1,djuna/Q2.5-Partron-7B (Merge),"",0,7.613,1.33476263935491 djuna/Q2.5-Veltha-14B_bfloat16_fd0c348618e5c8198b769d2f5ff1e3a810e007e7_True,djuna/Q2.5-Veltha-14B,fd0c348618e5c8198b769d2f5ff1e3a810e007e7,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,39.2088375386575,TRUE,IFEval,0.829166611258128,82.9166611258129,BBH,0.648421390292023,49.7524323992886,MATH Level 5,0.280211480362538,28.0211480362538,GPQA,0.359060402684564,14.5413870246085,MUSR,0.419427083333333,12.26171875,MMLU-PRO,0.52983710106383,47.7596778959811,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-22,2024-12-22,1,djuna/Q2.5-Veltha-14B (Merge),"",6,7.383,1.60674495472774 -djuna/Q2.5-Veltha-14B-0.5_bfloat16_db20da90002d4b1285f61e2648c4fdbec44e02e7_True,djuna/Q2.5-Veltha-14B-0.5,db20da90002d4b1285f61e2648c4fdbec44e02e7,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,39.9632353122728,TRUE,IFEval,0.77958261856319,77.958261856319,BBH,0.652302668830836,50.3181259857034,MATH Level 5,0.338368580060423,33.8368580060423,GPQA,0.368288590604027,15.7718120805369,MUSR,0.43390625,14.1716145833333,MMLU-PRO,0.529504654255319,47.7227393617021,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-22,2024-12-22,1,djuna/Q2.5-Veltha-14B-0.5 (Merge),"",6,7.383,1.47146139865559 +djuna/Q2.5-Veltha-14B-0.5_bfloat16_db20da90002d4b1285f61e2648c4fdbec44e02e7_True,djuna/Q2.5-Veltha-14B-0.5,db20da90002d4b1285f61e2648c4fdbec44e02e7,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,39.9632353122728,TRUE,IFEval,0.77958261856319,77.958261856319,BBH,0.652302668830836,50.3181259857034,MATH Level 5,0.338368580060423,33.8368580060423,GPQA,0.368288590604027,15.7718120805369,MUSR,0.43390625,14.1716145833333,MMLU-PRO,0.529504654255319,47.7227393617021,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-22,2024-12-22,1,djuna/Q2.5-Veltha-14B-0.5 (Merge),"",7,7.383,1.47146139865559 djuna-test-lab/TEST-L3.2-ReWish-3B_bfloat16_0cb7d434c4647faed475f17d74e9047007cd3782_True,djuna-test-lab/TEST-L3.2-ReWish-3B,0cb7d434c4647faed475f17d74e9047007cd3782,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,22.4455124376377,TRUE,IFEval,0.636775976630895,63.6775976630895,BBH,0.449540552927623,22.0667004324223,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.283557046979866,4.47427293064877,MUSR,0.37775,7.91875,MMLU-PRO,0.312583111702128,23.6203457446808,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-23,2024-10-24,1,djuna-test-lab/TEST-L3.2-ReWish-3B (Merge),"",1,3.213,0.640630900962079 djuna-test-lab/TEST-L3.2-ReWish-3B-ties-w-base_bfloat16_ebab6c0266ae7846b2bb9a595a2651a23b031372_True,djuna-test-lab/TEST-L3.2-ReWish-3B-ties-w-base,ebab6c0266ae7846b2bb9a595a2651a23b031372,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,22.4201168576137,TRUE,IFEval,0.635252241829457,63.5252241829457,BBH,0.449540552927623,22.0667004324223,MATH Level 5,0.129154078549849,12.9154078549849,GPQA,0.283557046979866,4.47427293064877,MUSR,0.37775,7.91875,MMLU-PRO,0.312583111702128,23.6203457446808,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-23,2024-10-23,1,djuna-test-lab/TEST-L3.2-ReWish-3B-ties-w-base (Merge),"",0,3.213,1.28137393932878 dnhkng/RYS-Medium_bfloat16_de09a79e6b2efdcc97490a37b770764e62749fd0_False,dnhkng/RYS-Medium,de09a79e6b2efdcc97490a37b770764e62749fd0,bfloat16,continuouslypretrained,Original,Phi3ForCausalLM,25.9442272761267,FALSE,IFEval,0.440613128720683,44.0613128720683,BBH,0.628472687243283,47.7342013248615,MATH Level 5,0.0777945619335348,7.77945619335348,GPQA,0.328020134228188,10.4026845637584,MUSR,0.406927083333333,8.73255208333333,MMLU-PRO,0.432596409574468,36.9551566193854,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-17,2024-07-17,0,dnhkng/RYS-Medium,mit,3,18.731,2.1363783500494 @@ -1379,7 +1394,7 @@ dwikitheduck/gen-inst-1_bfloat16_73180b0a57469bbd12f7d037a1cc25e53c252ad6_True,d dwikitheduck/gen-try1_bfloat16_9c2cab728518e179e5d8891f3f9775515f15cea2_True,dwikitheduck/gen-try1,9c2cab728518e179e5d8891f3f9775515f15cea2,bfloat16,chatmodels,Original,Qwen2ForCausalLM,34.8300526812901,TRUE,IFEval,0.752205259821718,75.2205259821718,BBH,0.635851093347073,47.4131290314286,MATH Level 5,0.135196374622357,13.5196374622357,GPQA,0.341442953020134,12.1923937360179,MUSR,0.4415625,14.9619791666667,MMLU-PRO,0.511053856382979,45.6726507092199,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-11,2024-11-12,1,dwikitheduck/gen-try1 (Merge),apache-2.0,0,14.77,1.58308055537674 dwikitheduck/gen-try1-notemp_bfloat16_391925b02f6cd60e7c4ef1321fe89a92d6b9fdf0_False,dwikitheduck/gen-try1-notemp,391925b02f6cd60e7c4ef1321fe89a92d6b9fdf0,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,29.6691847174093,FALSE,IFEval,0.26270961050014,26.270961050014,BBH,0.626267088306491,45.7490926695055,MATH Level 5,0.27416918429003,27.416918429003,GPQA,0.354026845637584,13.8702460850112,MUSR,0.471416666666667,17.9270833333333,MMLU-PRO,0.521027260638298,46.7808067375887,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-11-13,0,Removed,"",0,14.77,1.89560587957928 dzakwan/dzakwan-MoE-4x7b-Beta_float16_e89f82f2afa1961335de5a6d6d05bd850d1d61d9_False,dzakwan/dzakwan-MoE-4x7b-Beta,e89f82f2afa1961335de5a6d6d05bd850d1d61d9,float16,basemergesandmoerges,Original,MixtralForCausalLM,20.7567149364237,FALSE,IFEval,0.444260118707252,44.4260118707252,BBH,0.514044131159397,32.0742084654425,MATH Level 5,0.0770392749244713,7.70392749244713,GPQA,0.286073825503356,4.80984340044743,MUSR,0.426739583333333,12.1091145833333,MMLU-PRO,0.310754654255319,23.4171838061466,TRUE,TRUE,TRUE,FALSE,FALSE,2024-05-26,2024-08-05,1,dzakwan/dzakwan-MoE-4x7b-Beta (Merge),apache-2.0,0,24.154,1.45602830651712 -ehristoforu/Falcon3-MoE-2x7B-Insruct_bfloat16_d7c85f436d22685010165483ba966d6ee2336cc8_True,ehristoforu/Falcon3-MoE-2x7B-Insruct,d7c85f436d22685010165483ba966d6ee2336cc8,bfloat16,pretrained,Original,MixtralForCausalLM,35.1570771392653,TRUE,IFEval,0.7642954028644,76.42954028644,BBH,0.564789641564995,38.0671542210182,MATH Level 5,0.321752265861027,32.1752265861027,GPQA,0.312080536912752,8.27740492170022,MUSR,0.484041666666667,21.6052083333333,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,TRUE,FALSE,FALSE,2024-12-22,2024-12-22,1,ehristoforu/Falcon3-MoE-2x7B-Insruct (Merge),other,0,6.701,1.63621070635266 +ehristoforu/Falcon3-MoE-2x7B-Insruct_bfloat16_d7c85f436d22685010165483ba966d6ee2336cc8_True,ehristoforu/Falcon3-MoE-2x7B-Insruct,d7c85f436d22685010165483ba966d6ee2336cc8,bfloat16,pretrained,Original,MixtralForCausalLM,35.1570771392653,TRUE,IFEval,0.7642954028644,76.42954028644,BBH,0.564789641564995,38.0671542210182,MATH Level 5,0.321752265861027,32.1752265861027,GPQA,0.312080536912752,8.27740492170022,MUSR,0.484041666666667,21.6052083333333,MMLU-PRO,0.409491356382979,34.3879284869976,TRUE,FALSE,TRUE,FALSE,FALSE,2024-12-22,2024-12-22,1,ehristoforu/Falcon3-MoE-2x7B-Insruct (Merge),other,1,6.701,1.63621070635266 ehristoforu/Gemma2-9B-it-psy10k-mental_health_float16_4adc2d61d530d23026493d29e6191e06cf549fc6_True,ehristoforu/Gemma2-9B-it-psy10k-mental_health,4adc2d61d530d23026493d29e6191e06cf549fc6,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,26.7644935055422,TRUE,IFEval,0.588665851052984,58.8665851052984,BBH,0.553937694402764,35.5660094986327,MATH Level 5,0.137462235649547,13.7462235649547,GPQA,0.337248322147651,11.6331096196868,MUSR,0.408604166666667,9.3421875,MMLU-PRO,0.382895611702128,31.4328457446809,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-07-31,4,google/gemma-2-9b,apache-2.0,1,9.242,2.27683018291986 ehristoforu/Gemma2-9b-it-train6_float16_e72bf00b427c22c48b468818cf75300a373a0c8a_True,ehristoforu/Gemma2-9b-it-train6,e72bf00b427c22c48b468818cf75300a373a0c8a,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,28.8975315532327,TRUE,IFEval,0.702521531757958,70.2521531757958,BBH,0.58980925791336,40.9876253015965,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.328859060402685,10.5145413870246,MUSR,0.408416666666667,9.65208333333334,MMLU-PRO,0.394198803191489,32.6887559101655,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-22,2024-07-31,8,google/gemma-2-9b,apache-2.0,2,9.242,1.99368347439621 ehristoforu/HappyLlama1_float16_9bee1c404de70fc0ebe3cbcd2af2303a313a24be_True,ehristoforu/HappyLlama1,9bee1c404de70fc0ebe3cbcd2af2303a313a24be,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,26.0430329547881,TRUE,IFEval,0.736268656054824,73.6268656054824,BBH,0.499573230974285,28.4997734070813,MATH Level 5,0.101208459214502,10.1208459214502,GPQA,0.283557046979866,4.47427293064877,MUSR,0.4286875,11.2526041666667,MMLU-PRO,0.354554521276596,28.2838356973995,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-29,2024-11-30,1,voidful/Llama-3.2-8B-Instruct,apache-2.0,0,8.03,0.714360642416245 @@ -1439,26 +1454,26 @@ google/codegemma-1.1-2b_bfloat16_9d69e500da236427eab5867552ffc87108964f4d_False, google/flan-t5-base_float16_7bcac572ce56db69c1ea7c8af255c5d7c9672fc2_False,google/flan-t5-base,7bcac572ce56db69c1ea7c8af255c5d7c9672fc2,float16,pretrained,Original,T5ForConditionalGeneration,6.23940848953395,FALSE,IFEval,0.189070555016246,18.9070555016246,BBH,0.352598059930032,11.3376936773049,MATH Level 5,0,0,GPQA,0.238255033557047,0,MUSR,0.367114583333333,3.22265625,MMLU-PRO,0.135721409574468,3.96904550827423,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-14,0,google/flan-t5-base,apache-2.0,826,0.248,0.156621440424456 google/flan-t5-large_float16_0613663d0d48ea86ba8cb3d7a44f0f65dc596a2a_False,google/flan-t5-large,0613663d0d48ea86ba8cb3d7a44f0f65dc596a2a,float16,pretrained,Original,T5ForConditionalGeneration,9.41894870600608,FALSE,IFEval,0.220094903744287,22.0094903744287,BBH,0.415311503567943,17.5100182800673,MATH Level 5,0,0,GPQA,0.250838926174497,0.111856823266221,MUSR,0.408322916666667,9.00703125,MMLU-PRO,0.170877659574468,7.87529550827423,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-14,0,google/flan-t5-large,apache-2.0,648,0.783,0.233491371635308 google/flan-t5-small_float16_0fc9ddf78a1e988dac52e2dac162b0ede4fd74ab_False,google/flan-t5-small,0fc9ddf78a1e988dac52e2dac162b0ede4fd74ab,float16,pretrained,Original,T5ForConditionalGeneration,6.00378064236063,FALSE,IFEval,0.152425564169736,15.2425564169736,BBH,0.328290109764084,6.36311196167965,MATH Level 5,0,0,GPQA,0.260906040268456,1.45413870246085,MUSR,0.412291666666667,10.3697916666667,MMLU-PRO,0.123337765957447,2.59308510638298,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-06-27,0,google/flan-t5-small,apache-2.0,294,0.077,0.143130242275139 -google/flan-t5-xl_float16_7d6315df2c2fb742f0f5b556879d730926ca9001_False,google/flan-t5-xl,7d6315df2c2fb742f0f5b556879d730926ca9001,float16,pretrained,Original,T5ForConditionalGeneration,11.5917795285333,FALSE,IFEval,0.223741893730856,22.3741893730856,BBH,0.453106360621123,22.6950558112154,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.25251677852349,0.335570469798655,MUSR,0.41809375,11.3283854166667,MMLU-PRO,0.214677526595745,12.7419473995272,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-07,0,google/flan-t5-xl,apache-2.0,476,2.85,0.348929344293381 -google/flan-t5-xl_bfloat16_7d6315df2c2fb742f0f5b556879d730926ca9001_False,google/flan-t5-xl,7d6315df2c2fb742f0f5b556879d730926ca9001,bfloat16,pretrained,Original,T5ForConditionalGeneration,11.5871674375561,FALSE,IFEval,0.22069442412798,22.069442412798,BBH,0.45372172155694,22.8375876635233,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.245805369127517,0,MUSR,0.42203125,11.85390625,MMLU-PRO,0.214178856382979,12.6865395981087,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-07,0,google/flan-t5-xl,apache-2.0,476,2.85,0.285351730178784 +google/flan-t5-xl_float16_7d6315df2c2fb742f0f5b556879d730926ca9001_False,google/flan-t5-xl,7d6315df2c2fb742f0f5b556879d730926ca9001,float16,pretrained,Original,T5ForConditionalGeneration,11.5917795285333,FALSE,IFEval,0.223741893730856,22.3741893730856,BBH,0.453106360621123,22.6950558112154,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.25251677852349,0.335570469798655,MUSR,0.41809375,11.3283854166667,MMLU-PRO,0.214677526595745,12.7419473995272,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-07,0,google/flan-t5-xl,apache-2.0,477,2.85,0.348929344293381 +google/flan-t5-xl_bfloat16_7d6315df2c2fb742f0f5b556879d730926ca9001_False,google/flan-t5-xl,7d6315df2c2fb742f0f5b556879d730926ca9001,bfloat16,pretrained,Original,T5ForConditionalGeneration,11.5871674375561,FALSE,IFEval,0.22069442412798,22.069442412798,BBH,0.45372172155694,22.8375876635233,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.245805369127517,0,MUSR,0.42203125,11.85390625,MMLU-PRO,0.214178856382979,12.6865395981087,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-08-07,0,google/flan-t5-xl,apache-2.0,477,2.85,0.285351730178784 google/flan-t5-xxl_float16_ae7c9136adc7555eeccc78cdd960dfd60fb346ce_False,google/flan-t5-xxl,ae7c9136adc7555eeccc78cdd960dfd60fb346ce,float16,fine-tunedondomain-specificdatasets,Original,T5ForConditionalGeneration,13.4858434255225,FALSE,IFEval,0.220045036059877,22.0045036059877,BBH,0.506588801577692,30.1192556001059,MATH Level 5,0,0,GPQA,0.27013422818792,2.68456375838927,MUSR,0.42175,11.1854166666667,MMLU-PRO,0.234291888297872,14.9213209219858,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-21,2024-09-06,0,google/flan-t5-xxl,apache-2.0,1219,11.267,0.70647682731463 google/flan-ul2_bfloat16_452d74ce28ac4a7f211d6ba3ef0717027f7a8074_False,google/flan-ul2,452d74ce28ac4a7f211d6ba3ef0717027f7a8074,bfloat16,pretrained,Original,T5ForConditionalGeneration,13.5501175247888,FALSE,IFEval,0.239254068094877,23.9254068094877,BBH,0.505373804912565,30.0202901256771,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.287751677852349,5.03355704697987,MUSR,0.384354166666667,5.57760416666667,MMLU-PRO,0.249335106382979,16.5927895981087,TRUE,FALSE,FALSE,FALSE,TRUE,2023-03-03,2024-08-07,0,google/flan-ul2,apache-2.0,554,19.46,0.559966283448423 google/gemma-1.1-2b-it_bfloat16_bf4924f313df5166dee1467161e886e55f2eb4d4_True,google/gemma-1.1-2b-it,bf4924f313df5166dee1467161e886e55f2eb4d4,bfloat16,chatmodels,Original,GemmaForCausalLM,7.77643528435205,TRUE,IFEval,0.306748316688608,30.6748316688608,BBH,0.318463497481492,5.86282672277435,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.269295302013423,2.57270693512304,MUSR,0.339395833333333,2.02447916666667,MMLU-PRO,0.148354388297872,5.3727098108747,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-2b-it,gemma,152,2.506,0.32921478142276 google/gemma-1.1-7b-it_bfloat16_16128b0aeb50762ea96430c0c06a37941bf9f274_True,google/gemma-1.1-7b-it,16128b0aeb50762ea96430c0c06a37941bf9f274,bfloat16,chatmodels,Original,GemmaForCausalLM,17.4795862430713,TRUE,IFEval,0.503910734628563,50.3910734628563,BBH,0.393529796283325,15.9342093850132,MATH Level 5,0.0362537764350453,3.62537764350453,GPQA,0.293624161073826,5.8165548098434,MUSR,0.423020833333333,11.5109375,MMLU-PRO,0.258394281914894,17.5993646572104,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-7b-it,gemma,267,8.538,0.578299189963354 google/gemma-2-27b_bfloat16_938270f5272feb02779b55c2bb2fffdd0f53ff0c_False,google/gemma-2-27b,938270f5272feb02779b55c2bb2fffdd0f53ff0c,bfloat16,pretrained,Original,Gemma2ForCausalLM,23.8506386398765,FALSE,IFEval,0.247522130170171,24.7522130170171,BBH,0.564290831748206,37.3907374541865,MATH Level 5,0.161631419939577,16.1631419939577,GPQA,0.350671140939597,13.4228187919463,MUSR,0.439635416666667,13.92109375,MMLU-PRO,0.437084441489362,37.4538268321513,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-24,0,google/gemma-2-27b,gemma,192,27.227,5.61424927838634 -google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,473,27.227,4.82621118669274 +google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,474,27.227,4.82621118669274 google/gemma-2-2b_bfloat16_4d05c88d00441bf62bf87dcfd29e204c05089f36_True,google/gemma-2-2b,4d05c88d00441bf62bf87dcfd29e204c05089f36,bfloat16,pretrained,Original,InternLM2ForCausalLM,10.1294631550552,TRUE,IFEval,0.199312269223438,19.9312269223438,BBH,0.365596699642259,11.7558075322361,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.26258389261745,1.67785234899329,MUSR,0.423177083333333,11.43046875,MMLU-PRO,0.218001994680851,13.1113327423168,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,0,google/gemma-2-2b,gemma,466,2.614,1.51879572271398 google/gemma-2-2b_float16_0738188b3055bc98daf0fe7211f0091357e5b979_False,google/gemma-2-2b,0738188b3055bc98daf0fe7211f0091357e5b979,float16,fine-tunedondomain-specificdatasets,Original,Gemma2ForCausalLM,10.3344393348315,FALSE,IFEval,0.201760218442621,20.1760218442621,BBH,0.370867461247026,12.4973062285736,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.26258389261745,1.67785234899329,MUSR,0.421875,11.2677083333333,MMLU-PRO,0.221658909574468,13.5176566193853,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-04,0,google/gemma-2-2b,gemma,466,2.614,1.41825735113158 -google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,806,2.614,1.23474327420585 +google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,811,2.614,1.23474327420585 google/gemma-2-2b-jpn-it_float16_6b046bbc091084a1ec89fe03e58871fde10868eb_False,google/gemma-2-2b-jpn-it,6b046bbc091084a1ec89fe03e58871fde10868eb,float16,pretrained,Original,Gemma2ForCausalLM,17.1154057059385,FALSE,IFEval,0.507782683280363,50.7782683280363,BBH,0.422556989006581,18.5256264498327,MATH Level 5,0.0347432024169184,3.47432024169184,GPQA,0.285234899328859,4.6979865771812,MUSR,0.396385416666667,7.68151041666667,MMLU-PRO,0.2578125,17.5347222222222,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-25,2024-10-11,2,google/gemma-2-2b,gemma,147,2.614,1.01143721051409 google/gemma-2-2b-jpn-it_bfloat16_6b046bbc091084a1ec89fe03e58871fde10868eb_True,google/gemma-2-2b-jpn-it,6b046bbc091084a1ec89fe03e58871fde10868eb,bfloat16,chatmodels,Original,Gemma2ForCausalLM,15.8855787074056,TRUE,IFEval,0.528840144150853,52.8840144150853,BBH,0.417844022621712,17.848086390818,MATH Level 5,0,0,GPQA,0.275167785234899,3.35570469798658,MUSR,0.372760416666667,4.92838541666667,MMLU-PRO,0.246675531914894,16.2972813238771,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-25,2024-10-14,2,google/gemma-2-2b,gemma,147,2.614,0.854400249040011 google/gemma-2-9b_bfloat16_beb0c08e9eeb0548f3aca2ac870792825c357b7d_False,google/gemma-2-9b,beb0c08e9eeb0548f3aca2ac870792825c357b7d,bfloat16,pretrained,Original,Gemma2ForCausalLM,21.1549343088298,FALSE,IFEval,0.203983208996574,20.3983208996574,BBH,0.537737339762188,34.0968185358978,MATH Level 5,0.131419939577039,13.1419939577039,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446114583333333,14.29765625,MMLU-PRO,0.410322473404255,34.480274822695,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,0,google/gemma-2-9b,gemma,616,9,5.6631856917904 -google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,602,9,5.01449702077493 +google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,604,9,5.01449702077493 google/gemma-2b_bfloat16_2ac59a5d7bf4e1425010f0d457dde7d146658953_False,google/gemma-2b,2ac59a5d7bf4e1425010f0d457dde7d146658953,bfloat16,pretrained,Original,GemmaForCausalLM,7.35870138352179,FALSE,IFEval,0.203758250331343,20.3758250331343,BBH,0.338099397582924,8.46671286484037,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.25503355704698,0.671140939597318,MUSR,0.39778125,7.55598958333334,MMLU-PRO,0.136552526595745,4.06139184397163,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b,gemma,925,2.506,1.23625082450337 -google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,685,2.506,0.352950331047759 -google/gemma-7b_bfloat16_a0eac5b80dba224e6ed79d306df50b1e92c2125d_False,google/gemma-7b,a0eac5b80dba224e6ed79d306df50b1e92c2125d,bfloat16,pretrained,Original,GemmaForCausalLM,15.45540668709,FALSE,IFEval,0.265932171083835,26.5932171083835,BBH,0.436152852392864,21.1160993232917,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.286912751677852,4.92170022371365,MUSR,0.406239583333333,10.9799479166667,MMLU-PRO,0.294797207446809,21.6441341607565,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-08,0,google/gemma-7b,gemma,3078,8.538,1.25491405781993 +google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,686,2.506,0.352950331047759 +google/gemma-7b_bfloat16_a0eac5b80dba224e6ed79d306df50b1e92c2125d_False,google/gemma-7b,a0eac5b80dba224e6ed79d306df50b1e92c2125d,bfloat16,pretrained,Original,GemmaForCausalLM,15.45540668709,FALSE,IFEval,0.265932171083835,26.5932171083835,BBH,0.436152852392864,21.1160993232917,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.286912751677852,4.92170022371365,MUSR,0.406239583333333,10.9799479166667,MMLU-PRO,0.294797207446809,21.6441341607565,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-08,0,google/gemma-7b,gemma,3079,8.538,1.25491405781993 google/gemma-7b-it_bfloat16_18329f019fb74ca4b24f97371785268543d687d2_True,google/gemma-7b-it,18329f019fb74ca4b24f97371785268543d687d2,bfloat16,chatmodels,Original,GemmaForCausalLM,12.8681419014102,TRUE,IFEval,0.386832493339894,38.6832493339894,BBH,0.364558292227017,11.8800913445494,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.284395973154362,4.58612975391499,MUSR,0.427427083333333,12.5283854166667,MMLU-PRO,0.169464760638298,7.71830673758865,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-13,2024-06-12,1,google/gemma-7b,gemma,1143,8.538,1.0999544452693 -google/mt5-base_float16_2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f_False,google/mt5-base,2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,3.56528212264935,FALSE,IFEval,0.164515707212419,16.4515707212419,BBH,0.288316002284888,1.29855138817669,MATH Level 5,0,0,GPQA,0.239093959731544,0,MUSR,0.367208333333333,2.86770833333333,MMLU-PRO,0.106964760638298,0.773862293144208,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-base,apache-2.0,200,0.39,0.200039818164465 +google/mt5-base_float16_2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f_False,google/mt5-base,2eb15465c5dd7f72a8f7984306ad05ebc3dd1e1f,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,3.56528212264935,FALSE,IFEval,0.164515707212419,16.4515707212419,BBH,0.288316002284888,1.29855138817669,MATH Level 5,0,0,GPQA,0.239093959731544,0,MUSR,0.367208333333333,2.86770833333333,MMLU-PRO,0.106964760638298,0.773862293144208,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-base,apache-2.0,202,0.39,0.200039818164465 google/mt5-small_float16_73fb5dbe4756edadc8fbe8c769b0a109493acf7a_False,google/mt5-small,73fb5dbe4756edadc8fbe8c769b0a109493acf7a,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,4.25592817327735,FALSE,IFEval,0.171809687185557,17.1809687185557,BBH,0.276584202992908,1.07097147950089,MATH Level 5,0,0,GPQA,0.24244966442953,0,MUSR,0.38575,5.91875,MMLU-PRO,0.112283909574468,1.36487884160756,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-small,apache-2.0,116,0.17,0.180493674360773 google/mt5-xl_float16_63fc6450d80515b48e026b69ef2fbbd426433e84_False,google/mt5-xl,63fc6450d80515b48e026b69ef2fbbd426433e84,float16,fine-tunedondomain-specificdatasets,Original,MT5ForConditionalGeneration,5.19142015303163,FALSE,IFEval,0.195964485343333,19.5964485343333,BBH,0.304735837080435,3.2824619143354,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.379520833333333,5.04010416666667,MMLU-PRO,0.111951462765957,1.32794030732861,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-xl,apache-2.0,23,3.23,0.903767224577182 google/mt5-xxl_float16_e07c395916dfbc315d4e5e48b4a54a1e8821b5c0_False,google/mt5-xxl,e07c395916dfbc315d4e5e48b4a54a1e8821b5c0,float16,fine-tunedondomain-specificdatasets,Original,T5ForConditionalGeneration,5.10307678308611,FALSE,IFEval,0.23575668116154,23.575668116154,BBH,0.295934415911691,2.50471080044775,MATH Level 5,0,0,GPQA,0.241610738255034,0,MUSR,0.368947916666667,3.55182291666667,MMLU-PRO,0.108876329787234,0.986258865248226,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-09-06,0,google/mt5-xxl,apache-2.0,68,11.9,2.28193850262229 @@ -1469,8 +1484,8 @@ google/recurrentgemma-9b-it_bfloat16_43e62f98c3d496a5469ef4b18c1b11e417d68d1d_Tr google/switch-base-8_float16_92fe2d22b024d9937146fe097ba3d3a7ba146e1b_False,google/switch-base-8,92fe2d22b024d9937146fe097ba3d3a7ba146e1b,float16,fine-tunedondomain-specificdatasets,Original,SwitchTransformersForConditionalGeneration,3.29595026839661,FALSE,IFEval,0.158520503375488,15.8520503375488,BBH,0.287631327306693,1.70247810498213,MATH Level 5,0,0,GPQA,0.25,0,MUSR,0.351739583333333,1.13333333333333,MMLU-PRO,0.109790558510638,1.08783983451537,TRUE,FALSE,FALSE,FALSE,TRUE,2022-10-24,2024-09-06,0,google/switch-base-8,apache-2.0,16,0.62,0.146702933877402 google/umt5-base_float16_0de9394d54f8975e71838d309de1cb496c894ab9_False,google/umt5-base,0de9394d54f8975e71838d309de1cb496c894ab9,float16,fine-tunedondomain-specificdatasets,Original,UMT5ForConditionalGeneration,3.44104602550114,FALSE,IFEval,0.174632198123202,17.4632198123202,BBH,0.278772623289455,0.813553178847296,MATH Level 5,0,0,GPQA,0.254194630872483,0.559284116331097,MUSR,0.33821875,0.944010416666666,MMLU-PRO,0.107795877659574,0.866208628841606,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-02,2024-09-06,0,google/umt5-base,apache-2.0,13,-1,0.668046044558199 goulue5/merging_LLM_float16_587115b34d72ef957fee2d8348b3ade3ae06d4a8_False,goulue5/merging_LLM,587115b34d72ef957fee2d8348b3ade3ae06d4a8,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,16.4099852745745,FALSE,IFEval,0.323260061082373,32.3260061082373,BBH,0.42164986115901,18.282830291312,MATH Level 5,0.0785498489425982,7.85498489425982,GPQA,0.291107382550336,5.48098434004475,MUSR,0.43328125,12.76015625,MMLU-PRO,0.29579454787234,21.7549497635934,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-21,2024-11-22,0,goulue5/merging_LLM,"",0,1.544,0.551465090928402 -gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.39102973137443,FALSE,IFEval,0.193416800755329,19.3416800755329,BBH,0.303638540151673,2.71429784738774,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26006711409396,1.34228187919463,MUSR,0.432416666666667,12.9854166666667,MMLU-PRO,0.114943484042553,1.66038711583924,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2461,0.137,0.323928012416449 -gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,5.97773692810457,FALSE,IFEval,0.0833333333333333,8.33333333333333,BBH,0.308333333333333,9.19975490196079,MATH Level 5,0,0,GPQA,0.233333333333333,0,MUSR,0.433333333333333,18.3333333333333,MMLU-PRO,0.1,0,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2461,0.137,0.0392451730685468 +gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.39102973137443,FALSE,IFEval,0.193416800755329,19.3416800755329,BBH,0.303638540151673,2.71429784738774,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26006711409396,1.34228187919463,MUSR,0.432416666666667,12.9854166666667,MMLU-PRO,0.114943484042553,1.66038711583924,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2464,0.137,0.323928012416449 +gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,5.97773692810457,FALSE,IFEval,0.0833333333333333,8.33333333333333,BBH,0.308333333333333,9.19975490196079,MATH Level 5,0,0,GPQA,0.233333333333333,0,MUSR,0.433333333333333,18.3333333333333,MMLU-PRO,0.1,0,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-26,0,gpt2,mit,2464,0.137,0.0392451730685468 gradientai/Llama-3-8B-Instruct-Gradient-1048k_bfloat16_8697fb25cb77c852311e03b4464b8467471d56a4_True,gradientai/Llama-3-8B-Instruct-Gradient-1048k,8697fb25cb77c852311e03b4464b8467471d56a4,bfloat16,chatmodels,Original,LlamaForCausalLM,18.2455696265917,TRUE,IFEval,0.44555889484346,44.555889484346,BBH,0.434590310706957,21.0105289871587,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.277684563758389,3.69127516778523,MUSR,0.42975,13.51875,MMLU-PRO,0.29404920212766,21.5610224586288,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-29,2024-06-12,0,gradientai/Llama-3-8B-Instruct-Gradient-1048k,llama3,678,8.03,0.887164486766284 grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge_bfloat16_7a8d334dce0a2ce948f75612b8d3a61c53d094aa_False,grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge,7a8d334dce0a2ce948f75612b8d3a61c53d094aa,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,20.887036378959,FALSE,IFEval,0.427124474172972,42.7124474172972,BBH,0.496169453500683,28.2580149129877,MATH Level 5,0.102719033232628,10.2719033232628,GPQA,0.290268456375839,5.36912751677852,MUSR,0.404322916666667,9.54036458333333,MMLU-PRO,0.362533244680851,29.1703605200946,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-28,2024-06-29,1,grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge (Merge),llama3,2,8.03,0.54754835391993 grimjim/Llama-3-Instruct-8B-SimPO-SPPO-Iter3-merge_bfloat16_8f4d460ea20e24e48914156af7def305c0cd347f_True,grimjim/Llama-3-Instruct-8B-SimPO-SPPO-Iter3-merge,8f4d460ea20e24e48914156af7def305c0cd347f,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,23.6884747801112,TRUE,IFEval,0.680589724154133,68.0589724154133,BBH,0.502173409117659,29.0732859144765,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.26258389261745,1.67785234899329,MUSR,0.388510416666667,6.69713541666667,MMLU-PRO,0.368434175531915,29.8260195035461,TRUE,TRUE,FALSE,FALSE,FALSE,2024-06-28,2024-09-17,1,grimjim/Llama-3-Instruct-8B-SimPO-SPPO-Iter3-merge (Merge),llama3,2,8,0.616941673112788 @@ -1513,6 +1528,7 @@ huihui-ai/QwQ-32B-Coder-Fusion-9010_bfloat16_6d19e2749fabb24efe732a2614e7458d61d huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2_bfloat16_68f298d4017b8999dc963fbc560b02eaefa41de3_True,huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2,68f298d4017b8999dc963fbc560b02eaefa41de3,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,32.9112203859138,TRUE,IFEval,0.832763733560287,83.2763733560287,BBH,0.63238224470529,47.4061882492622,MATH Level 5,0,0,GPQA,0.333892617449664,11.1856823266219,MUSR,0.42196875,11.5794270833333,MMLU-PRO,0.496176861702128,44.0196513002364,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-09,2024-12-07,2,Qwen/Qwen2.5-14B,apache-2.0,9,14.77,1.62398272378957 huihui-ai/Qwen2.5-7B-Instruct-abliterated_bfloat16_c04c14c82962506e2b16f58f9f6b0a2e60a6afde_True,huihui-ai/Qwen2.5-7B-Instruct-abliterated,c04c14c82962506e2b16f58f9f6b0a2e60a6afde,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,26.6475056681965,TRUE,IFEval,0.75460334135649,75.460334135649,BBH,0.526158997282991,32.8866732143205,MATH Level 5,0,0,GPQA,0.315436241610738,8.7248322147651,MUSR,0.396666666666667,7.48333333333333,MMLU-PRO,0.41796875,35.3298611111111,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-19,2024-09-24,2,Qwen/Qwen2.5-7B,apache-2.0,2,7.616,2.16612430569387 huihui-ai/Qwen2.5-7B-Instruct-abliterated-v2_bfloat16_05d179c1108cc2dc1c1a16a8255ac6f57eac5d32_True,huihui-ai/Qwen2.5-7B-Instruct-abliterated-v2,05d179c1108cc2dc1c1a16a8255ac6f57eac5d32,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,26.999904985788,TRUE,IFEval,0.760648412877831,76.0648412877831,BBH,0.537668844279425,34.369626512494,MATH Level 5,0,0,GPQA,0.308724832214765,7.82997762863535,MUSR,0.3980625,8.09114583333333,MMLU-PRO,0.42079454787234,35.6438386524823,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-22,2024-09-24,2,Qwen/Qwen2.5-7B,apache-2.0,26,7.616,2.21974001546824 +iFaz/llama32_3B_en_emo_v2_float16_a2e03c1a0cd3cba34c197971eddd8c42f3c88479_False,iFaz/llama32_3B_en_emo_v2,a2e03c1a0cd3cba34c197971eddd8c42f3c88479,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.2402758158472,FALSE,IFEval,0.545401756229028,54.5401756229028,BBH,0.428351830558297,19.0291627810121,MATH Level 5,0.104984894259819,10.4984894259819,GPQA,0.26761744966443,2.3489932885906,MUSR,0.348229166666667,6.76197916666667,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-25,2024-12-26,2,meta-llama/Llama-3.2-3B-Instruct,apache-2.0,0,0.924,1.08879882905222 iRyanBell/ARC1_bfloat16_28176c0fb77fa43e1410766faf35d2a2681566e9_False,iRyanBell/ARC1,28176c0fb77fa43e1410766faf35d2a2681566e9,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.6239105916904,FALSE,IFEval,0.441112913735555,44.1112913735555,BBH,0.49029996581447,26.5644951326317,MATH Level 5,0.0664652567975831,6.64652567975831,GPQA,0.294463087248322,5.92841163310962,MUSR,0.399052083333333,8.14817708333334,MMLU-PRO,0.337101063829787,26.3445626477541,TRUE,FALSE,FALSE,FALSE,FALSE,2024-05-30,2024-06-26,0,iRyanBell/ARC1,llama3,1,8.03,0.924664498382478 iRyanBell/ARC1-II_bfloat16_c81076b9bdaac0722b33e411a49b07a296e8fae8_False,iRyanBell/ARC1-II,c81076b9bdaac0722b33e411a49b07a296e8fae8,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,9.32025640577659,FALSE,IFEval,0.170835605083401,17.0835605083401,BBH,0.338177810298844,7.24622941067945,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.271812080536913,2.9082774049217,MUSR,0.491291666666667,20.3114583333333,MMLU-PRO,0.168550531914894,7.61672576832151,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-12,2024-06-26,0,iRyanBell/ARC1-II,llama3,1,8.03,0.895276262218848 ibivibiv/colossus_120b_float16_b4c11f98bd874bfa454a0bb46153335cfb9b06a3_False,ibivibiv/colossus_120b,b4c11f98bd874bfa454a0bb46153335cfb9b06a3,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,25.3774389549443,FALSE,IFEval,0.427598771260256,42.7598771260256,BBH,0.606140858649419,44.0714975274784,MATH Level 5,0.054380664652568,5.4380664652568,GPQA,0.308724832214765,7.82997762863535,MUSR,0.4733125,19.2640625,MMLU-PRO,0.396110372340426,32.9011524822695,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-12,2024-06-27,0,ibivibiv/colossus_120b,apache-2.0,1,117.749,13.7524317330804 @@ -1523,17 +1539,17 @@ ibm-granite/granite-3.0-1b-a400m-instruct_bfloat16_acb9675a7d67b8657d9b8105d5cbd ibm-granite/granite-3.0-2b-base_bfloat16_532f55c03d71a31905c0b825eba4b24fe7f7936b_False,ibm-granite/granite-3.0-2b-base,532f55c03d71a31905c0b825eba4b24fe7f7936b,bfloat16,pretrained,Original,GraniteForCausalLM,14.1083729916145,FALSE,IFEval,0.387382146039176,38.7382146039176,BBH,0.404748055938062,17.5637497258283,MATH Level 5,0.0551359516616314,5.51359516616314,GPQA,0.280201342281879,4.0268456375839,MUSR,0.343427083333333,3.46171875,MMLU-PRO,0.238115026595745,15.3461140661939,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,"",0,ibm-granite/granite-3.0-2b-base,apache-2.0,19,2.634,1.04616689146427 ibm-granite/granite-3.0-2b-instruct_bfloat16_342f92f4a0b4d6d83c0b61dc6c122e253a4efebd_True,ibm-granite/granite-3.0-2b-instruct,342f92f4a0b4d6d83c0b61dc6c122e253a4efebd,bfloat16,chatmodels,Original,GraniteForCausalLM,18.3205664133779,TRUE,IFEval,0.513977357854936,51.3977357854936,BBH,0.441197720626303,21.7378914109024,MATH Level 5,0.0876132930513595,8.76132930513595,GPQA,0.299496644295302,6.59955257270694,MUSR,0.351489583333333,1.26953125,MMLU-PRO,0.281416223404255,20.1573581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,"",1,ibm-granite/granite-3.0-2b-instruct (Merge),apache-2.0,46,2.634,1.01894808156813 ibm-granite/granite-3.0-3b-a800m-base_bfloat16_0d1d12f91791b25289ef407e39d88f00d1256d10_False,ibm-granite/granite-3.0-3b-a800m-base,0d1d12f91791b25289ef407e39d88f00d1256d10,bfloat16,pretrained,Original,GraniteForCausalLM,9.42690086736977,FALSE,IFEval,0.273226151056973,27.3226151056973,BBH,0.366749749713086,11.3484424218006,MATH Level 5,0.0445619335347432,4.45619335347432,GPQA,0.251677852348993,0.223713646532442,MUSR,0.34196875,3.31276041666667,MMLU-PRO,0.189079122340426,9.89768026004728,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-03,"",0,ibm-granite/granite-3.0-3b-a800m-base,apache-2.0,4,3.374,3.53578382360079 -ibm-granite/granite-3.0-3b-a800m-instruct_bfloat16_ab0c732243cfd50a601fa393dd46a2c5993746f7_True,ibm-granite/granite-3.0-3b-a800m-instruct,ab0c732243cfd50a601fa393dd46a2c5993746f7,bfloat16,chatmodels,Original,GraniteForCausalLM,13.6603599755218,TRUE,IFEval,0.429821761814209,42.9821761814209,BBH,0.375278052917334,13.16300959501,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.281040268456376,4.13870246085012,MUSR,0.348666666666667,2.08333333333333,MMLU-PRO,0.215176196808511,12.7973552009456,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-03,2024-10-20,1,ibm-granite/granite-3.0-3b-a800m-instruct (Merge),apache-2.0,16,3.374,3.07668055312678 +ibm-granite/granite-3.0-3b-a800m-instruct_bfloat16_ab0c732243cfd50a601fa393dd46a2c5993746f7_True,ibm-granite/granite-3.0-3b-a800m-instruct,ab0c732243cfd50a601fa393dd46a2c5993746f7,bfloat16,chatmodels,Original,GraniteForCausalLM,13.6603599755218,TRUE,IFEval,0.429821761814209,42.9821761814209,BBH,0.375278052917334,13.16300959501,MATH Level 5,0.06797583081571,6.797583081571,GPQA,0.281040268456376,4.13870246085012,MUSR,0.348666666666667,2.08333333333333,MMLU-PRO,0.215176196808511,12.7973552009456,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-03,2024-10-20,1,ibm-granite/granite-3.0-3b-a800m-instruct (Merge),apache-2.0,17,3.374,3.07668055312678 ibm-granite/granite-3.0-8b-base_bfloat16_1edd1f646abfcd90ed5d6c0d9711fbb02c947884_False,ibm-granite/granite-3.0-8b-base,1edd1f646abfcd90ed5d6c0d9711fbb02c947884,bfloat16,pretrained,Original,GraniteForCausalLM,21.6531600483463,FALSE,IFEval,0.458348293638657,45.8348293638657,BBH,0.494376063736533,27.9743582989824,MATH Level 5,0.0989425981873112,9.89425981873112,GPQA,0.325503355704698,10.0671140939597,MUSR,0.408135416666667,10.4502604166667,MMLU-PRO,0.331283244680851,25.6981382978723,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,2024-10-20,0,ibm-granite/granite-3.0-8b-base,apache-2.0,22,8.171,1.88565587931952 ibm-granite/granite-3.0-8b-instruct_bfloat16_e0a466fb25b9e07e9c2dc93380a360189700d1f8_True,ibm-granite/granite-3.0-8b-instruct,e0a466fb25b9e07e9c2dc93380a360189700d1f8,bfloat16,chatmodels,Original,GraniteForCausalLM,23.8640332348529,TRUE,IFEval,0.530963399335984,53.0963399335984,BBH,0.519187463184023,31.5881590647151,MATH Level 5,0.132175226586103,13.2175226586103,GPQA,0.332214765100671,10.9619686800895,MUSR,0.3900625,7.02447916666667,MMLU-PRO,0.345661569148936,27.2957299054374,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,2024-10-20,1,ibm-granite/granite-3.0-8b-instruct (Merge),apache-2.0,196,8.171,1.7129925870079 ibm-granite/granite-3.1-1b-a400m-base_bfloat16_6bbcb9db44432d0a5d4cf13cdc082324b7ee9e7b_False,ibm-granite/granite-3.1-1b-a400m-base,6bbcb9db44432d0a5d4cf13cdc082324b7ee9e7b,bfloat16,pretrained,Original,GraniteMoeForCausalLM,6.22427469055773,FALSE,IFEval,0.251943731521253,25.1943731521253,BBH,0.329869954650672,6.42984500540235,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.251677852348993,0.223713646532442,MUSR,0.3500625,1.7578125,MMLU-PRO,0.113946143617021,1.54957151300236,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-1b-a400m-base,apache-2.0,2,1.335,1.12341183736504 ibm-granite/granite-3.1-1b-a400m-instruct_float16_c4f8e0dd19f0ce00bca6c9742751d1827e8fa03a_True,ibm-granite/granite-3.1-1b-a400m-instruct,c4f8e0dd19f0ce00bca6c9742751d1827e8fa03a,float16,chatmodels,Original,GraniteMoeForCausalLM,10.0517271754769,TRUE,IFEval,0.46863987553026,46.863987553026,BBH,0.327983438537518,6.17818321590479,MATH Level 5,0.040785498489426,4.0785498489426,GPQA,0.23993288590604,0,MUSR,0.33025,0.78125,MMLU-PRO,0.121675531914894,2.40839243498818,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-1b-a400m-instruct (Merge),apache-2.0,8,1.335,1.04808410688418 ibm-granite/granite-3.1-2b-base_bfloat16_31f1cf9bd26ca0c69bfaf86824ee6dc4268b8b73_False,ibm-granite/granite-3.1-2b-base,31f1cf9bd26ca0c69bfaf86824ee6dc4268b8b73,bfloat16,pretrained,Original,GraniteForCausalLM,13.1902381427805,FALSE,IFEval,0.352161154625283,35.2161154625283,BBH,0.404718802891887,16.8436898468885,MATH Level 5,0.0558912386706949,5.58912386706949,GPQA,0.277684563758389,3.69127516778523,MUSR,0.348572916666667,3.90494791666667,MMLU-PRO,0.225066489361702,13.8962765957447,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-2b-base,apache-2.0,4,2.534,0.494221356581282 -ibm-granite/granite-3.1-2b-instruct_float16_8f683a244be9034aeea43dd2a80b7b4fe01d376f_True,ibm-granite/granite-3.1-2b-instruct,8f683a244be9034aeea43dd2a80b7b4fe01d376f,float16,chatmodels,Original,GraniteForCausalLM,21.0576307475066,TRUE,IFEval,0.628557782240012,62.8557782240012,BBH,0.440898585580565,21.8229561407945,MATH Level 5,0.113293051359517,11.3293051359517,GPQA,0.289429530201342,5.2572706935123,MUSR,0.360541666666667,4.86770833333334,MMLU-PRO,0.281914893617021,20.2127659574468,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-2b-instruct (Merge),apache-2.0,15,2.534,0.505641903795969 +ibm-granite/granite-3.1-2b-instruct_float16_8f683a244be9034aeea43dd2a80b7b4fe01d376f_True,ibm-granite/granite-3.1-2b-instruct,8f683a244be9034aeea43dd2a80b7b4fe01d376f,float16,chatmodels,Original,GraniteForCausalLM,21.0576307475066,TRUE,IFEval,0.628557782240012,62.8557782240012,BBH,0.440898585580565,21.8229561407945,MATH Level 5,0.113293051359517,11.3293051359517,GPQA,0.289429530201342,5.2572706935123,MUSR,0.360541666666667,4.86770833333334,MMLU-PRO,0.281914893617021,20.2127659574468,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-2b-instruct (Merge),apache-2.0,17,2.534,0.505641903795969 ibm-granite/granite-3.1-3b-a800m-base_bfloat16_e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3_False,ibm-granite/granite-3.1-3b-a800m-base,e16343c6e3120c5f4e99ef53e48e9f882c9a8bd3,bfloat16,pretrained,Original,GraniteMoeForCausalLM,9.91293476951527,FALSE,IFEval,0.29962942769629,29.962942769629,BBH,0.362822992347764,11.9056051994898,MATH Level 5,0.0400302114803625,4.00302114803625,GPQA,0.277684563758389,3.69127516778523,MUSR,0.327520833333333,1.10677083333333,MMLU-PRO,0.179271941489362,8.80799349881797,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-3b-a800m-base,apache-2.0,2,3.299,1.62281050352824 -ibm-granite/granite-3.1-3b-a800m-instruct_float16_503b5f483d33443ba85a876d3c25f8b85779c9cc_True,ibm-granite/granite-3.1-3b-a800m-instruct,503b5f483d33443ba85a876d3c25f8b85779c9cc,float16,chatmodels,Original,GraniteMoeForCausalLM,17.1014424266068,TRUE,IFEval,0.551646298488012,55.1646298488012,BBH,0.400949452194719,16.6872363666604,MATH Level 5,0.103474320241692,10.3474320241692,GPQA,0.288590604026846,5.14541387024609,MUSR,0.348635416666667,2.51276041666667,MMLU-PRO,0.214760638297872,12.7511820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-3b-a800m-instruct (Merge),apache-2.0,13,3.299,1.63636360410558 -ibm-granite/granite-3.1-8b-base_float16_174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4_False,ibm-granite/granite-3.1-8b-base,174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4,float16,pretrained,Original,GraniteForCausalLM,20.0697880358223,FALSE,IFEval,0.422103352438197,42.2103352438197,BBH,0.477695667711164,26.0195886710118,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.321308724832215,9.50782997762864,MUSR,0.392229166666667,8.36197916666667,MMLU-PRO,0.323221409574468,24.8023788416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-8b-base,apache-2.0,8,8.171,0.598692557378878 -ibm-granite/granite-3.1-8b-instruct_float16_f6749f3946b2dc9983b870317a71ddf7a65c0806_True,ibm-granite/granite-3.1-8b-instruct,f6749f3946b2dc9983b870317a71ddf7a65c0806,float16,chatmodels,Original,GraniteForCausalLM,30.5526905408918,TRUE,IFEval,0.720756481690803,72.0756481690803,BBH,0.536446043381602,34.0896552994141,MATH Level 5,0.216767371601208,21.6767371601209,GPQA,0.312080536912752,8.27740492170022,MUSR,0.470708333333333,19.0052083333333,MMLU-PRO,0.353723404255319,28.1914893617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-8b-instruct (Merge),apache-2.0,74,8.171,0.61783334381855 +ibm-granite/granite-3.1-3b-a800m-instruct_float16_503b5f483d33443ba85a876d3c25f8b85779c9cc_True,ibm-granite/granite-3.1-3b-a800m-instruct,503b5f483d33443ba85a876d3c25f8b85779c9cc,float16,chatmodels,Original,GraniteMoeForCausalLM,17.1014424266068,TRUE,IFEval,0.551646298488012,55.1646298488012,BBH,0.400949452194719,16.6872363666604,MATH Level 5,0.103474320241692,10.3474320241692,GPQA,0.288590604026846,5.14541387024609,MUSR,0.348635416666667,2.51276041666667,MMLU-PRO,0.214760638297872,12.7511820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,1,ibm-granite/granite-3.1-3b-a800m-instruct (Merge),apache-2.0,14,3.299,1.63636360410558 +ibm-granite/granite-3.1-8b-base_float16_174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4_False,ibm-granite/granite-3.1-8b-base,174c7f4d7e9a016bdb85ecdf3319fe1f2d8991c4,float16,pretrained,Original,GraniteForCausalLM,20.0697880358223,FALSE,IFEval,0.422103352438197,42.2103352438197,BBH,0.477695667711164,26.0195886710118,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.321308724832215,9.50782997762864,MUSR,0.392229166666667,8.36197916666667,MMLU-PRO,0.323221409574468,24.8023788416076,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-16,0,ibm-granite/granite-3.1-8b-base,apache-2.0,12,8.171,0.598692557378878 +ibm-granite/granite-3.1-8b-instruct_float16_f6749f3946b2dc9983b870317a71ddf7a65c0806_False,ibm-granite/granite-3.1-8b-instruct,f6749f3946b2dc9983b870317a71ddf7a65c0806,float16,fine-tunedondomain-specificdatasets,Original,GraniteForCausalLM,27.3201282953417,FALSE,IFEval,0.625235486287495,62.5235486287495,BBH,0.527274553976235,32.8985826399362,MATH Level 5,0.166163141993958,16.6163141993958,GPQA,0.317114093959732,8.94854586129754,MUSR,0.444010416666667,14.8346354166667,MMLU-PRO,0.352892287234043,28.0991430260047,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-06,2024-12-25,1,ibm-granite/granite-3.1-8b-instruct (Merge),apache-2.0,80,4.085,1.22321775404798 ibm-granite/granite-7b-base_bfloat16_23fcb4cb5b69f8a122fb944491e9f1ad664ba37b_False,ibm-granite/granite-7b-base,23fcb4cb5b69f8a122fb944491e9f1ad664ba37b,bfloat16,pretrained,Original,LlamaForCausalLM,7.75764452802273,FALSE,IFEval,0.241427190964419,24.1427190964419,BBH,0.348043727161062,9.0508000028991,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.245805369127517,0,MUSR,0.355489583333333,3.40286458333333,MMLU-PRO,0.183427526595745,9.26972517730496,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-19,2024-06-12,0,ibm-granite/granite-7b-base,apache-2.0,27,6.738,0.652623838561169 ibm-granite/granite-7b-instruct_bfloat16_c6d1adfa5cdba2c8344e055bb7de87b7935250a8_True,ibm-granite/granite-7b-instruct,c6d1adfa5cdba2c8344e055bb7de87b7935250a8,bfloat16,chatmodels,Original,LlamaForCausalLM,11.8083734516443,TRUE,IFEval,0.297231346161518,29.7231346161518,BBH,0.372295296032695,12.6393287024653,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.285234899328859,4.6979865771812,MUSR,0.402,8.81666666666667,MMLU-PRO,0.228640292553192,14.2933658392435,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-19,2024-10-02,1,ibm/granite-7b-base,apache-2.0,5,6.738,0.711451918965055 icefog72/Ice0.15-02.10-RP_bfloat16_ab67a8b63836ec7c8e6729d79d9dfd2708b20eb3_False,icefog72/Ice0.15-02.10-RP,ab67a8b63836ec7c8e6729d79d9dfd2708b20eb3,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,21.4913274610034,FALSE,IFEval,0.534335562972912,53.4335562972912,BBH,0.49763847361884,30.1301040710686,MATH Level 5,0.0574018126888218,5.74018126888218,GPQA,0.277684563758389,3.69127516778523,MUSR,0.431979166666667,12.9973958333333,MMLU-PRO,0.306599069148936,22.9554521276596,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-02,2024-10-02,0,icefog72/Ice0.15-02.10-RP,cc-by-nc-4.0,7,7.242,0.592822160421274 @@ -1572,7 +1588,7 @@ informatiker/Qwen2-7B-Instruct-abliterated_bfloat16_7577d60acfe4544d5ab303f0a4d6 instruction-pretrain/InstructLM-500M_float16_e9d33823c76303dfaff6a8397a8b70d0118ea350_False,instruction-pretrain/InstructLM-500M,e9d33823c76303dfaff6a8397a8b70d0118ea350,float16,pretrained,Original,MistralForCausalLM,2.85435031976667,FALSE,IFEval,0.1027662158628,10.27662158628,BBH,0.294087178725297,2.31705371604848,MATH Level 5,0,0,GPQA,0.256711409395973,0.894854586129753,MUSR,0.352822916666667,2.06953125,MMLU-PRO,0.114112367021277,1.56804078014184,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-18,2024-06-27,0,instruction-pretrain/InstructLM-500M,apache-2.0,34,0.5,0.245792145066826 internlm/internlm2-1_8b_bfloat16_c24f301c7374ad9f9b58d1ea80f68b5f57cbca13_False,internlm/internlm2-1_8b,c24f301c7374ad9f9b58d1ea80f68b5f57cbca13,bfloat16,pretrained,Original,InternLM2ForCausalLM,8.59707245146007,FALSE,IFEval,0.219770209710236,21.9770209710236,BBH,0.38797328000281,13.6338579659067,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.248322147651007,0,MUSR,0.38128125,8.22682291666667,MMLU-PRO,0.158826462765957,6.53627364066194,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,internlm/internlm2-1_8b,other,28,8,0.663645516912293 internlm/internlm2-chat-1_8b_bfloat16_4e226eeb354499f4d34ef4c27f6939f377475cc1_True,internlm/internlm2-chat-1_8b,4e226eeb354499f4d34ef4c27f6939f377475cc1,bfloat16,chatmodels,Original,InternLM2ForCausalLM,10.553683634515,TRUE,IFEval,0.238654547711184,23.8654547711184,BBH,0.445227166411921,20.6723574325619,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.265939597315436,2.12527964205817,MUSR,0.363052083333333,4.61484375,MMLU-PRO,0.183926196808511,9.3251329787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,internlm/internlm2-chat-1_8b,other,30,1.889,0.596422562282053 -internlm/internlm2_5-1_8b-chat_bfloat16_4426f00b854561fa60d555d2b628064b56bcb758_True,internlm/internlm2_5-1_8b-chat,4426f00b854561fa60d555d2b628064b56bcb758,bfloat16,chatmodels,Original,InternLM2ForCausalLM,12.1063376112746,TRUE,IFEval,0.384908708892405,38.4908708892406,BBH,0.448892678699644,21.0309269365696,MATH Level 5,0,0,GPQA,0.290268456375839,5.36912751677852,MUSR,0.359395833333333,4.42447916666667,MMLU-PRO,0.129903590425532,3.32262115839244,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-30,2024-08-07,0,internlm/internlm2_5-1_8b-chat,other,24,1.89,0.771665647358543 +internlm/internlm2_5-1_8b-chat_bfloat16_4426f00b854561fa60d555d2b628064b56bcb758_True,internlm/internlm2_5-1_8b-chat,4426f00b854561fa60d555d2b628064b56bcb758,bfloat16,chatmodels,Original,InternLM2ForCausalLM,12.1063376112746,TRUE,IFEval,0.384908708892405,38.4908708892406,BBH,0.448892678699644,21.0309269365696,MATH Level 5,0,0,GPQA,0.290268456375839,5.36912751677852,MUSR,0.359395833333333,4.42447916666667,MMLU-PRO,0.129903590425532,3.32262115839244,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-30,2024-08-07,0,internlm/internlm2_5-1_8b-chat,other,25,1.89,0.771665647358543 internlm/internlm2_5-20b-chat_bfloat16_ef17bde929761255fee76d95e2c25969ccd93b0d_True,internlm/internlm2_5-20b-chat,ef17bde929761255fee76d95e2c25969ccd93b0d,bfloat16,chatmodels,Original,InternLM2ForCausalLM,32.0820127392498,TRUE,IFEval,0.70099779695652,70.099779695652,BBH,0.747358053367289,62.8324591528799,MATH Level 5,0,0,GPQA,0.321308724832215,9.50782997762864,MUSR,0.455822916666667,16.74453125,MMLU-PRO,0.399767287234043,33.3074763593381,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-30,2024-08-12,0,internlm/internlm2_5-20b-chat,other,87,19.86,3.73270787133241 internlm/internlm2_5-7b-chat_float16_bebb00121ee105b823647c3ba2b1e152652edc33_True,internlm/internlm2_5-7b-chat,bebb00121ee105b823647c3ba2b1e152652edc33,float16,chatmodels,Original,InternLM2ForCausalLM,30.5768555628262,TRUE,IFEval,0.614019689978147,61.4019689978147,BBH,0.710773697280275,57.6736480423206,MATH Level 5,0.0898791540785499,8.98791540785499,GPQA,0.329697986577181,10.6263982102908,MUSR,0.4415,14.3541666666667,MMLU-PRO,0.373753324468085,30.4170360520095,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-27,2024-07-03,0,internlm/internlm2_5-7b-chat,other,185,7.738,1.45338151351539 intervitens/mini-magnum-12b-v1.1_bfloat16_3b19e12711d3f4d9b81fdeb73860e9019ebe2404_True,intervitens/mini-magnum-12b-v1.1,3b19e12711d3f4d9b81fdeb73860e9019ebe2404,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,20.6385035434935,TRUE,IFEval,0.515550960340785,51.5550960340785,BBH,0.506180035650624,29.7311868686869,MATH Level 5,0.0385196374622356,3.85196374622356,GPQA,0.288590604026846,5.14541387024609,MUSR,0.400447916666667,8.08932291666667,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-24,2024-07-25,0,intervitens/mini-magnum-12b-v1.1,apache-2.0,73,12.248,2.23094834843233 @@ -1710,7 +1726,7 @@ macadeliccc/Samantha-Qwen-2-7B_float16_59058972fa9b56d132d04589eb17cbba277c2826_ macadeliccc/magistrate-3.2-3b-base_bfloat16_2a40ac9ca1904fca2c1e69573e27f0ff8039b738_False,macadeliccc/magistrate-3.2-3b-base,2a40ac9ca1904fca2c1e69573e27f0ff8039b738,bfloat16,continuouslypretrained,Original,LlamaForCausalLM,5.97056866221897,FALSE,IFEval,0.115930176376459,11.5930176376459,BBH,0.334270105604753,6.91028093911619,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.260906040268456,1.45413870246085,MUSR,0.39759375,7.53255208333333,MMLU-PRO,0.168882978723404,7.65366430260047,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-28,2024-10-01,1,meta-llama/Llama-3.2-3B,llama3.2,1,3.213,0.730342962887556 macadeliccc/magistrate-3.2-3b-it_bfloat16_122961278c97195dd59d67b244907359013e4de5_True,macadeliccc/magistrate-3.2-3b-it,122961278c97195dd59d67b244907359013e4de5,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,7.03772378640789,TRUE,IFEval,0.229187444868504,22.9187444868504,BBH,0.32565067903272,5.32315541981334,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.24748322147651,0,MUSR,0.376322916666667,5.74036458333333,MMLU-PRO,0.159242021276596,6.58244680851064,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-01,2024-10-01,2,meta-llama/Llama-3.2-3B,llama3.2,0,3.213,0.702951029303344 maldv/Awqward2.5-32B-Instruct_bfloat16_fd8f6751645a1923d588f80ec1d8292cb69691a1_True,maldv/Awqward2.5-32B-Instruct,fd8f6751645a1923d588f80ec1d8292cb69691a1,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.3638263088866,TRUE,IFEval,0.825469753587149,82.5469753587149,BBH,0.697446550677304,57.2073386817348,MATH Level 5,0,0,GPQA,0.340604026845638,12.0805369127517,MUSR,0.427489583333333,13.86953125,MMLU-PRO,0.572307180851064,52.4785756501182,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-18,2024-12-18,1,maldv/Awqward2.5-32B-Instruct (Merge),apache-2.0,1,16.382,3.72254727211103 -maldv/Qwentile2.5-32B-Instruct_bfloat16_1cb04716c8aba33838b7f5dad99b23b7f0c6c152_True,maldv/Qwentile2.5-32B-Instruct,1cb04716c8aba33838b7f5dad99b23b7f0c6c152,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,43.5462855183237,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.696283745109837,57.2058776368836,MATH Level 5,0.380664652567976,38.0664652567976,GPQA,0.384228187919463,17.8970917225951,MUSR,0.468229166666667,19.9619791666667,MMLU-PRO,0.587932180851064,54.2146867612293,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,maldv/Qwentile2.5-32B-Instruct (Merge),apache-2.0,7,16.382,3.53254173559104 +maldv/Qwentile2.5-32B-Instruct_bfloat16_1cb04716c8aba33838b7f5dad99b23b7f0c6c152_True,maldv/Qwentile2.5-32B-Instruct,1cb04716c8aba33838b7f5dad99b23b7f0c6c152,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,43.5462855183237,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.696283745109837,57.2058776368836,MATH Level 5,0.380664652567976,38.0664652567976,GPQA,0.384228187919463,17.8970917225951,MUSR,0.468229166666667,19.9619791666667,MMLU-PRO,0.587932180851064,54.2146867612293,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,maldv/Qwentile2.5-32B-Instruct (Merge),apache-2.0,8,16.382,3.53254173559104 maldv/badger-kappa-llama-3-8b_bfloat16_aa6863eb816ca6ad29453b8aaf846962c4328998_True,maldv/badger-kappa-llama-3-8b,aa6863eb816ca6ad29453b8aaf846962c4328998,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,21.1666884980011,TRUE,IFEval,0.469464354579183,46.9464354579183,BBH,0.508492799775682,30.1532386043738,MATH Level 5,0.0861027190332326,8.61027190332326,GPQA,0.302852348993289,7.04697986577182,MUSR,0.376510416666667,4.29713541666667,MMLU-PRO,0.369514627659575,29.9460697399527,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-02,2024-06-27,0,maldv/badger-kappa-llama-3-8b,llama3,2,8.03,0.959125322864996 maldv/badger-lambda-llama-3-8b_bfloat16_8ef157d0d3c12212ca5e70d354869aed90e03f22_True,maldv/badger-lambda-llama-3-8b,8ef157d0d3c12212ca5e70d354869aed90e03f22,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,20.8934977809886,TRUE,IFEval,0.486075834341769,48.6075834341769,BBH,0.496348665104448,28.1030500143537,MATH Level 5,0.0913897280966767,9.13897280966767,GPQA,0.281879194630873,4.25055928411633,MUSR,0.375364583333333,4.52057291666667,MMLU-PRO,0.376662234042553,30.7402482269504,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-10,2024-06-26,0,maldv/badger-lambda-llama-3-8b,cc-by-nc-4.0,10,8.03,1.11102221764741 maldv/badger-mu-llama-3-8b_bfloat16_952a269bb1e6c18ee772c6d088e74d305df4425d_True,maldv/badger-mu-llama-3-8b,952a269bb1e6c18ee772c6d088e74d305df4425d,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,19.7934696192965,TRUE,IFEval,0.49194581488229,49.194581488229,BBH,0.514287576852281,30.5139651421457,MATH Level 5,0.0241691842900302,2.41691842900302,GPQA,0.259228187919463,1.23042505592841,MUSR,0.355458333333333,5.69895833333333,MMLU-PRO,0.367353723404255,29.7059692671395,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-27,2024-06-27,0,maldv/badger-mu-llama-3-8b,cc-by-nc-4.0,3,8.03,0.904635313226999 @@ -1720,7 +1736,7 @@ matouLeLoup/ECE-PRYMMAL-0.5B-FT-MUSR-ENSEMBLE-V2Mathis_bfloat16_3fd229bcc3b4d250 matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-ENSEMBLE-Mathis_bfloat16_455945ed4318bbeae008a253f877f56a68291b8b_False,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-ENSEMBLE-Mathis,455945ed4318bbeae008a253f877f56a68291b8b,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,7.28706205765386,FALSE,IFEval,0.187321861549577,18.7321861549577,BBH,0.323911742482544,7.91851204090326,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.260906040268456,1.45413870246085,MUSR,0.375208333333333,4.60104166666667,MMLU-PRO,0.171958111702128,7.99534574468085,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-31,2024-10-31,0,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-ENSEMBLE-Mathis,"",1,0.494,0.860741591289416 matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-Mathis_float16_dd86c3d7f77748a0ba18d911ceb93358a69ce160_False,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-Mathis,dd86c3d7f77748a0ba18d911ceb93358a69ce160,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,7.25734499719376,FALSE,IFEval,0.188246075967322,18.8246075967322,BBH,0.323278873809028,8.07957710329185,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.263422818791946,1.78970917225951,MUSR,0.368479166666667,4.1265625,MMLU-PRO,0.172041223404255,8.00458037825059,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-25,2024-10-31,0,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-Mathis,"",1,0.494,0.903717875191878 matouLeLoup/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis_bfloat16_7a9d848188a674302d64a865786d4508be19571a_True,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis,7a9d848188a674302d64a865786d4508be19571a,bfloat16,fine-tunedondomain-specificdatasets,Adapter,?,5.8127460045848,TRUE,IFEval,0.165214962964933,16.5214962964933,BBH,0.302372951646132,3.08335187762666,MATH Level 5,0.00906344410876133,0.906344410876133,GPQA,0.256711409395973,0.894854586129753,MUSR,0.427302083333333,12.1794270833333,MMLU-PRO,0.111619015957447,1.29100177304964,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-12,2024-11-12,0,matouLeLoup/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis,"",0,0.63,1.09895097845108 -mattshumer/Reflection-Llama-3.1-70B_float16_458962ed801fac4eadd01a91a2029a3a82f4cd84_True,mattshumer/Reflection-Llama-3.1-70B,458962ed801fac4eadd01a91a2029a3a82f4cd84,float16,chatmodels,Original,LlamaForCausalLM,26.5614615353162,TRUE,IFEval,0.656259835015537,65.6259835015537,BBH,0.599883995822013,42.3894448802231,MATH Level 5,0,0,GPQA,0.260906040268456,1.45413870246085,MUSR,0.412666666666667,10.0166666666667,MMLU-PRO,0.458942819148936,39.8825354609929,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-05,2024-09-09,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1709,70.554,28.6508458545704 +mattshumer/Reflection-Llama-3.1-70B_float16_458962ed801fac4eadd01a91a2029a3a82f4cd84_False,mattshumer/Reflection-Llama-3.1-70B,458962ed801fac4eadd01a91a2029a3a82f4cd84,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,26.5614615353162,FALSE,IFEval,0.656259835015537,65.6259835015537,BBH,0.599883995822013,42.3894448802231,MATH Level 5,0,0,GPQA,0.260906040268456,1.45413870246085,MUSR,0.412666666666667,10.0166666666667,MMLU-PRO,0.458942819148936,39.8825354609929,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-05,2024-12-25,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1709,35.277,28.6508458545704 mattshumer/ref_70_e3_float16_5d2d9dbb9e0bf61879255f63f1b787296fe524cc_True,mattshumer/ref_70_e3,5d2d9dbb9e0bf61879255f63f1b787296fe524cc,float16,chatmodels,Original,LlamaForCausalLM,30.7379964362804,TRUE,IFEval,0.629432128973346,62.9432128973346,BBH,0.650083948110427,49.2744666000302,MATH Level 5,0,0,GPQA,0.335570469798658,11.4093959731544,MUSR,0.432760416666667,12.9950520833333,MMLU-PRO,0.530252659574468,47.8058510638298,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-08,2024-09-08,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,57,70.554,39.9053086437939 maywell/Qwen2-7B-Multilingual-RP_bfloat16_487e8f0498419e4d1188f661dbb63bd629be4638_True,maywell/Qwen2-7B-Multilingual-RP,487e8f0498419e4d1188f661dbb63bd629be4638,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,23.4634668102093,TRUE,IFEval,0.434717660252574,43.4717660252574,BBH,0.506205868086107,30.5435614764747,MATH Level 5,0.225075528700906,22.5075528700906,GPQA,0.296979865771812,6.26398210290828,MUSR,0.3695625,6.22864583333333,MMLU-PRO,0.385887632978723,31.7652925531915,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-24,2024-09-05,0,maywell/Qwen2-7B-Multilingual-RP,apache-2.0,44,7.616,0.959412835757315 meditsolutions/Llama-3.1-MedIT-SUN-8B_bfloat16_0c11abbaa40e76b538b8c0f9c50e965078999087_True,meditsolutions/Llama-3.1-MedIT-SUN-8B,0c11abbaa40e76b538b8c0f9c50e965078999087,bfloat16,chatmodels,Original,LlamaForCausalLM,30.0431023159445,TRUE,IFEval,0.783729393564631,78.3729393564631,BBH,0.518692490459741,32.0016505675502,MATH Level 5,0.200151057401813,20.0151057401813,GPQA,0.308724832214765,7.82997762863535,MUSR,0.405625,9.63645833333333,MMLU-PRO,0.391622340425532,32.4024822695035,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-06,2024-11-06,1,meditsolutions/Llama-3.1-MedIT-SUN-8B (Merge),llama3.1,1,8.03,0.713050034565408 @@ -1735,44 +1751,45 @@ meditsolutions/MSH-Lite-7B-v1-Bielik-v2.3-Instruct-Llama-Prune_bfloat16_a0ffd0cd meditsolutions/MSH-v1-Bielik-v2.3-Instruct-MedIT-merge_bfloat16_2db5e8871fb3be7e658e3bc6e2885d26b891b8b8_True,meditsolutions/MSH-v1-Bielik-v2.3-Instruct-MedIT-merge,2db5e8871fb3be7e658e3bc6e2885d26b891b8b8,bfloat16,chatmodels,Original,MistralForCausalLM,27.3800110711418,TRUE,IFEval,0.581421738764257,58.1421738764257,BBH,0.56717222908585,38.0234352820579,MATH Level 5,0.137462235649547,13.7462235649547,GPQA,0.345637583892617,12.751677852349,MUSR,0.438458333333333,13.840625,MMLU-PRO,0.349983377659575,27.7759308510638,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-29,2024-11-06,1,meditsolutions/MSH-v1-Bielik-v2.3-Instruct-MedIT-merge (Merge),apache-2.0,1,11.169,0.842740828768023 meditsolutions/MedIT-Mesh-3B-Instruct_bfloat16_469d1a58f7747c3d456b3308b5a7042df4ab49e3_True,meditsolutions/MedIT-Mesh-3B-Instruct,469d1a58f7747c3d456b3308b5a7042df4ab49e3,bfloat16,chatmodels,Original,Phi3ForCausalLM,27.5629407033966,TRUE,IFEval,0.581421738764257,58.1421738764257,BBH,0.557552335686538,37.5470541937436,MATH Level 5,0.15785498489426,15.785498489426,GPQA,0.323825503355705,9.84340044742729,MUSR,0.404760416666667,10.5950520833333,MMLU-PRO,0.401180186170213,33.4644651300237,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-01,2024-11-01,1,meditsolutions/MedIT-Mesh-3B-Instruct (Merge),mit,0,3.821,0.530486348795166 meditsolutions/SmolLM2-MedIT-Upscale-2B_bfloat16_5696c9ea7cbdee0f8ad1845f5a2dc7309f376143_True,meditsolutions/SmolLM2-MedIT-Upscale-2B,5696c9ea7cbdee0f8ad1845f5a2dc7309f376143,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,15.1672472718847,TRUE,IFEval,0.642920783521058,64.2920783521058,BBH,0.355112244592801,10.5143261382457,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.264261744966443,1.90156599552573,MUSR,0.331364583333333,2.45390625,MMLU-PRO,0.197057845744681,10.7842050827423,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-02,2024-12-02,1,meditsolutions/SmolLM2-MedIT-Upscale-2B (Merge),apache-2.0,4,2.114,0.336141616257199 -meetkai/functionary-small-v3.1_bfloat16_8e43bc1d2e259b91799e704c410a95b8ca458121_True,meetkai/functionary-small-v3.1,8e43bc1d2e259b91799e704c410a95b8ca458121,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,21.6412408596034,TRUE,IFEval,0.627458476841447,62.7458476841447,BBH,0.498178104277938,28.6163146658361,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.288590604026846,5.14541387024609,MUSR,0.383364583333333,6.18723958333333,MMLU-PRO,0.33485704787234,26.0952275413712,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-11-10,0,meetkai/functionary-small-v3.1,mit,16,8.03,0.704369699282996 +meetkai/functionary-small-v3.1_bfloat16_8e43bc1d2e259b91799e704c410a95b8ca458121_True,meetkai/functionary-small-v3.1,8e43bc1d2e259b91799e704c410a95b8ca458121,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,21.6412408596034,TRUE,IFEval,0.627458476841447,62.7458476841447,BBH,0.498178104277938,28.6163146658361,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.288590604026846,5.14541387024609,MUSR,0.383364583333333,6.18723958333333,MMLU-PRO,0.33485704787234,26.0952275413712,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-26,2024-11-10,0,meetkai/functionary-small-v3.1,mit,17,8.03,0.704369699282996 meraGPT/mera-mix-4x7B_bfloat16_09d965c5ef9b66ce419986027e03a915cb869e43_True,meraGPT/mera-mix-4x7B,09d965c5ef9b66ce419986027e03a915cb869e43,bfloat16,basemergesandmoerges,Original,MixtralForCausalLM,17.8549587329397,TRUE,IFEval,0.483177967792125,48.3177967792125,BBH,0.401898991636617,17.486438954655,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.304530201342282,7.27069351230425,MUSR,0.40565625,9.27369791666667,MMLU-PRO,0.274767287234043,19.4185874704492,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-13,2024-06-27,0,meraGPT/mera-mix-4x7B,apache-2.0,18,24.154,1.66440066308799 mergekit-community/VirtuosoSmall-InstructModelStock_bfloat16_4ac90913a36d0f1b7bcf6ed31561137d1f7b0aa6_False,mergekit-community/VirtuosoSmall-InstructModelStock,4ac90913a36d0f1b7bcf6ed31561137d1f7b0aa6,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.6911865437051,FALSE,IFEval,0.523794642659255,52.3794642659255,BBH,0.651789919356719,49.941772258845,MATH Level 5,0.317220543806647,31.7220543806647,GPQA,0.38255033557047,17.6733780760626,MUSR,0.475572916666667,19.31328125,MMLU-PRO,0.542054521276596,49.1171690307329,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,mergekit-community/VirtuosoSmall-InstructModelStock (Merge),"",2,7.383,1.98692770052692 mergekit-community/mergekit-della-zgowfmf_bfloat16_8d99e6b381db8b64944b3dcfb05daa444206782d_False,mergekit-community/mergekit-della-zgowfmf,8d99e6b381db8b64944b3dcfb05daa444206782d,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.7750478092914,FALSE,IFEval,0.482753538389252,48.2753538389252,BBH,0.659079052802925,50.9953734877346,MATH Level 5,0.331570996978852,33.1570996978852,GPQA,0.39010067114094,18.6800894854586,MUSR,0.483385416666667,20.48984375,MMLU-PRO,0.541472739361702,49.0525265957447,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-19,2024-12-19,1,mergekit-community/mergekit-della-zgowfmf (Merge),"",0,7.383,1.9355344859159 mergekit-community/mergekit-model_stock-azgztvm_bfloat16_7f63ea96f89147daf909251cd3c1f1a20e005559_False,mergekit-community/mergekit-model_stock-azgztvm,7f63ea96f89147daf909251cd3c1f1a20e005559,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,35.8314586321922,FALSE,IFEval,0.506159213110103,50.6159213110103,BBH,0.654277554675585,50.2943766945105,MATH Level 5,0.284743202416918,28.4743202416918,GPQA,0.381711409395973,17.5615212527964,MUSR,0.473,19.0916666666667,MMLU-PRO,0.540558510638298,48.9509456264775,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-20,1,mergekit-community/mergekit-model_stock-azgztvm (Merge),"",0,7.383,2.03389890189032 +mergekit-community/mergekit-ties-ykqemwr_float16_81ba78a711ee017c3174f0b3cbf2135ec5b45d3d_False,mergekit-community/mergekit-ties-ykqemwr,81ba78a711ee017c3174f0b3cbf2135ec5b45d3d,float16,basemergesandmoerges,Original,MistralForCausalLM,22.3784099659013,FALSE,IFEval,0.359954919613293,35.9954919613293,BBH,0.545549667788534,34.7098858064906,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.322147651006711,9.61968680089485,MUSR,0.419791666666667,11.7072916666667,MMLU-PRO,0.373420877659575,30.3800975177305,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,1,mergekit-community/mergekit-ties-ykqemwr (Merge),"",0,6.124,1.03392601384004 meta-llama/Llama-2-13b-chat-hf_float16_a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8_True,meta-llama/Llama-2-13b-chat-hf,a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8,float16,chatmodels,Original,LlamaForCausalLM,11.0163422752105,TRUE,IFEval,0.398472719052115,39.8472719052115,BBH,0.334273670667142,7.15537996862699,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.231543624161074,0,MUSR,0.400729166666667,8.1578125,MMLU-PRO,0.192320478723404,10.2578309692671,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-13b-chat-hf,llama2,1037,13.016,0.874569508215166 -meta-llama/Llama-2-13b-hf_float16_5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1_False,meta-llama/Llama-2-13b-hf,5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1,float16,pretrained,Original,LlamaForCausalLM,11.0148335140031,FALSE,IFEval,0.248246873850273,24.8246873850273,BBH,0.412562422338351,17.2225598250581,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.281040268456376,4.13870246085012,MUSR,0.35375,3.38541666666667,MMLU-PRO,0.237782579787234,15.3091755319149,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-13b-hf,llama2,577,13.016,1.11238015630798 -meta-llama/Llama-2-70b-chat-hf_float16_e9149a12809580e8602995856f8098ce973d1080_True,meta-llama/Llama-2-70b-chat-hf,e9149a12809580e8602995856f8098ce973d1080,float16,chatmodels,Original,LlamaForCausalLM,12.7464047385667,TRUE,IFEval,0.495792275606502,49.5792275606502,BBH,0.304247414616427,4.61376708259061,MATH Level 5,0.00981873111782478,0.981873111782478,GPQA,0.264261744966443,1.90156599552573,MUSR,0.368666666666667,3.48333333333334,MMLU-PRO,0.24326795212766,15.9186613475177,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-14,2024-06-12,0,meta-llama/Llama-2-70b-chat-hf,llama2,2169,68.977,22.8984550552606 +meta-llama/Llama-2-13b-hf_float16_5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1_False,meta-llama/Llama-2-13b-hf,5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1,float16,pretrained,Original,LlamaForCausalLM,11.0148335140031,FALSE,IFEval,0.248246873850273,24.8246873850273,BBH,0.412562422338351,17.2225598250581,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.281040268456376,4.13870246085012,MUSR,0.35375,3.38541666666667,MMLU-PRO,0.237782579787234,15.3091755319149,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-13b-hf,llama2,578,13.016,1.11238015630798 +meta-llama/Llama-2-70b-chat-hf_float16_e9149a12809580e8602995856f8098ce973d1080_True,meta-llama/Llama-2-70b-chat-hf,e9149a12809580e8602995856f8098ce973d1080,float16,chatmodels,Original,LlamaForCausalLM,12.7464047385667,TRUE,IFEval,0.495792275606502,49.5792275606502,BBH,0.304247414616427,4.61376708259061,MATH Level 5,0.00981873111782478,0.981873111782478,GPQA,0.264261744966443,1.90156599552573,MUSR,0.368666666666667,3.48333333333334,MMLU-PRO,0.24326795212766,15.9186613475177,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-14,2024-06-12,0,meta-llama/Llama-2-70b-chat-hf,llama2,2170,68.977,22.8984550552606 meta-llama/Llama-2-70b-hf_float16_3aba440b59558f995867ba6e1f58f21d0336b5bb_False,meta-llama/Llama-2-70b-hf,3aba440b59558f995867ba6e1f58f21d0336b5bb,float16,pretrained,Original,LlamaForCausalLM,18.3096580216144,FALSE,IFEval,0.240678067527494,24.0678067527494,BBH,0.547259119044934,35.9000618637217,MATH Level 5,0.0287009063444109,2.87009063444109,GPQA,0.302852348993289,7.04697986577182,MUSR,0.412354166666667,9.77760416666667,MMLU-PRO,0.371758643617021,30.1954048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-11,2024-06-12,0,meta-llama/Llama-2-70b-hf,llama2,841,68.977,29.6212466171519 -meta-llama/Llama-2-7b-chat-hf_float16_f5db02db724555f92da89c216ac04704f23d4590_True,meta-llama/Llama-2-7b-chat-hf,f5db02db724555f92da89c216ac04704f23d4590,float16,pretrained,Original,LlamaForCausalLM,9.39548527825095,TRUE,IFEval,0.398647810032935,39.8647810032935,BBH,0.311354635500219,4.45917164595948,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.253355704697987,0.447427293064876,MUSR,0.367552083333333,3.27734375,MMLU-PRO,0.168799867021277,7.64442966903073,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-08-30,0,meta-llama/Llama-2-7b-chat-hf,llama2,4099,6.738,1.15687903615516 -meta-llama/Llama-2-7b-hf_float16_01c7f73d771dfac7d292323805ebc428287df4f9_False,meta-llama/Llama-2-7b-hf,01c7f73d771dfac7d292323805ebc428287df4f9,float16,pretrained,Original,LlamaForCausalLM,8.73082889563367,FALSE,IFEval,0.251893863836842,25.1893863836842,BBH,0.349619581998218,10.351416657849,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.3700625,3.7578125,MMLU-PRO,0.18608710106383,9.56523345153664,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-7b-hf,llama2,1859,6.738,0.563094562772064 -meta-llama/Llama-3.1-8B_float16_d04e592bb4f6aa9cfee91e2e20afa771667e1d4b_False,meta-llama/Llama-3.1-8B,d04e592bb4f6aa9cfee91e2e20afa771667e1d4b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2194553235834,FALSE,IFEval,0.124598288097803,12.4598288097803,BBH,0.465959054460073,25.3044706347549,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.310402684563758,8.05369127516779,MUSR,0.3811875,8.71510416666667,MMLU-PRO,0.328789893617021,25.4210992907801,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-12-07,0,meta-llama/Llama-3.1-8B,llama3.1,1223,8.03,0.713243580943846 -meta-llama/Llama-3.2-1B_bfloat16_a7c18587d7f473bfea02aa5639aa349403307b54_False,meta-llama/Llama-3.2-1B,a7c18587d7f473bfea02aa5639aa349403307b54,bfloat16,pretrained,Original,LlamaForCausalLM,4.03149449541509,FALSE,IFEval,0.147779004153424,14.7779004153424,BBH,0.311495409646081,4.36602965655676,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.228187919463087,0,MUSR,0.344729166666667,2.5578125,MMLU-PRO,0.120345744680851,2.26063829787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B,llama3.2,1320,1.24,0.41912851784102 -meta-llama/Llama-3.2-1B-Instruct_bfloat16_d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0_True,meta-llama/Llama-3.2-1B-Instruct,d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0,bfloat16,chatmodels,Original,LlamaForCausalLM,13.8137204928249,TRUE,IFEval,0.569831380736446,56.9831380736446,BBH,0.349684980617683,8.74252131230305,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.275167785234899,3.35570469798658,MUSR,0.332854166666667,2.9734375,MMLU-PRO,0.168218085106383,7.57978723404255,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B-Instruct,llama3.2,661,1.24,0.404904524907622 -meta-llama/Llama-3.2-3B_bfloat16_95c102307f55fbd6d18ddf28bfbcb537ffdc2806_False,meta-llama/Llama-3.2-3B,95c102307f55fbd6d18ddf28bfbcb537ffdc2806,bfloat16,pretrained,Original,LlamaForCausalLM,8.5845296652033,FALSE,IFEval,0.133740696906431,13.374069690643,BBH,0.390511711699106,14.2326648843641,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.26761744966443,2.3489932885906,MUSR,0.35771875,3.81484375,MMLU-PRO,0.248753324468085,16.5281471631206,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B,llama3.2,419,3.213,1.33181264899492 -meta-llama/Llama-3.2-3B-Instruct_bfloat16_276b29ce8303c9b88966a9b32fc75692dce4d8e1_True,meta-llama/Llama-3.2-3B-Instruct,276b29ce8303c9b88966a9b32fc75692dce4d8e1,bfloat16,chatmodels,Original,LlamaForCausalLM,24.1165339900694,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.461007023946607,24.0591864468855,MATH Level 5,0.171450151057402,17.1450151057402,GPQA,0.278523489932886,3.80313199105145,MUSR,0.352854166666667,1.3734375,MMLU-PRO,0.319481382978723,24.3868203309693,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B-Instruct,llama3.2,819,3.213,1.27120351986613 -meta-llama/Llama-3.3-70B-Instruct_bfloat16__False,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,36.8288410384085,FALSE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-09,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1284,70.554,38.2795370537265 +meta-llama/Llama-2-7b-chat-hf_float16_f5db02db724555f92da89c216ac04704f23d4590_True,meta-llama/Llama-2-7b-chat-hf,f5db02db724555f92da89c216ac04704f23d4590,float16,pretrained,Original,LlamaForCausalLM,9.39548527825095,TRUE,IFEval,0.398647810032935,39.8647810032935,BBH,0.311354635500219,4.45917164595948,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.253355704697987,0.447427293064876,MUSR,0.367552083333333,3.27734375,MMLU-PRO,0.168799867021277,7.64442966903073,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-08-30,0,meta-llama/Llama-2-7b-chat-hf,llama2,4100,6.738,1.15687903615516 +meta-llama/Llama-2-7b-hf_float16_01c7f73d771dfac7d292323805ebc428287df4f9_False,meta-llama/Llama-2-7b-hf,01c7f73d771dfac7d292323805ebc428287df4f9,float16,pretrained,Original,LlamaForCausalLM,8.73082889563367,FALSE,IFEval,0.251893863836842,25.1893863836842,BBH,0.349619581998218,10.351416657849,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.3700625,3.7578125,MMLU-PRO,0.18608710106383,9.56523345153664,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-13,2024-06-12,0,meta-llama/Llama-2-7b-hf,llama2,1862,6.738,0.563094562772064 +meta-llama/Llama-3.1-8B_float16_d04e592bb4f6aa9cfee91e2e20afa771667e1d4b_False,meta-llama/Llama-3.1-8B,d04e592bb4f6aa9cfee91e2e20afa771667e1d4b,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2194553235834,FALSE,IFEval,0.124598288097803,12.4598288097803,BBH,0.465959054460073,25.3044706347549,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.310402684563758,8.05369127516779,MUSR,0.3811875,8.71510416666667,MMLU-PRO,0.328789893617021,25.4210992907801,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-12-07,0,meta-llama/Llama-3.1-8B,llama3.1,1224,8.03,0.713243580943846 +meta-llama/Llama-3.2-1B_bfloat16_a7c18587d7f473bfea02aa5639aa349403307b54_False,meta-llama/Llama-3.2-1B,a7c18587d7f473bfea02aa5639aa349403307b54,bfloat16,pretrained,Original,LlamaForCausalLM,4.03149449541509,FALSE,IFEval,0.147779004153424,14.7779004153424,BBH,0.311495409646081,4.36602965655676,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.228187919463087,0,MUSR,0.344729166666667,2.5578125,MMLU-PRO,0.120345744680851,2.26063829787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B,llama3.2,1328,1.24,0.41912851784102 +meta-llama/Llama-3.2-1B-Instruct_bfloat16_d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0_True,meta-llama/Llama-3.2-1B-Instruct,d0a2081ed47e20ce524e8bc5d132f3fad2f69ff0,bfloat16,chatmodels,Original,LlamaForCausalLM,13.8137204928249,TRUE,IFEval,0.569831380736446,56.9831380736446,BBH,0.349684980617683,8.74252131230305,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.275167785234899,3.35570469798658,MUSR,0.332854166666667,2.9734375,MMLU-PRO,0.168218085106383,7.57978723404255,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-23,0,meta-llama/Llama-3.2-1B-Instruct,llama3.2,662,1.24,0.404904524907622 +meta-llama/Llama-3.2-3B_bfloat16_95c102307f55fbd6d18ddf28bfbcb537ffdc2806_False,meta-llama/Llama-3.2-3B,95c102307f55fbd6d18ddf28bfbcb537ffdc2806,bfloat16,pretrained,Original,LlamaForCausalLM,8.5845296652033,FALSE,IFEval,0.133740696906431,13.374069690643,BBH,0.390511711699106,14.2326648843641,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.26761744966443,2.3489932885906,MUSR,0.35771875,3.81484375,MMLU-PRO,0.248753324468085,16.5281471631206,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B,llama3.2,420,3.213,1.33181264899492 +meta-llama/Llama-3.2-3B-Instruct_bfloat16_276b29ce8303c9b88966a9b32fc75692dce4d8e1_True,meta-llama/Llama-3.2-3B-Instruct,276b29ce8303c9b88966a9b32fc75692dce4d8e1,bfloat16,chatmodels,Original,LlamaForCausalLM,24.1165339900694,TRUE,IFEval,0.739316125657699,73.9316125657699,BBH,0.461007023946607,24.0591864468855,MATH Level 5,0.171450151057402,17.1450151057402,GPQA,0.278523489932886,3.80313199105145,MUSR,0.352854166666667,1.3734375,MMLU-PRO,0.319481382978723,24.3868203309693,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-18,2024-09-27,0,meta-llama/Llama-3.2-3B-Instruct,llama3.2,822,3.213,1.27120351986613 +meta-llama/Llama-3.3-70B-Instruct_bfloat16__False,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,36.8288410384085,FALSE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-09,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1298,70.554,38.2795370537265 meta-llama/Meta-Llama-3-70B_bfloat16_b4d08b7db49d488da3ac49adf25a6b9ac01ae338_False,meta-llama/Meta-Llama-3-70B,b4d08b7db49d488da3ac49adf25a6b9ac01ae338,bfloat16,pretrained,Original,LlamaForCausalLM,26.6675858211602,FALSE,IFEval,0.160319064526567,16.0319064526567,BBH,0.646107459990447,48.7098126475059,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.397651006711409,19.6868008948546,MUSR,0.451822916666667,16.0111979166667,MMLU-PRO,0.470910904255319,41.2123226950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-70B,llama3,840,70.554,23.4071857793614 meta-llama/Meta-Llama-3-70B-Instruct_bfloat16_7129260dd854a80eb10ace5f61c20324b472b31c_True,meta-llama/Meta-Llama-3-70B-Instruct,7129260dd854a80eb10ace5f61c20324b472b31c,bfloat16,chatmodels,Original,LlamaForCausalLM,36.5106934142651,TRUE,IFEval,0.809907711538717,80.9907711538717,BBH,0.654669943237205,50.1851331844035,MATH Level 5,0.253021148036254,25.3021148036254,GPQA,0.286912751677852,4.92170022371365,MUSR,0.415364583333333,10.9205729166667,MMLU-PRO,0.520694813829787,46.7438682033097,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,1,meta-llama/Meta-Llama-3-70B,llama3,1446,70.554,18.2391501177391 -meta-llama/Meta-Llama-3-8B_bfloat16_62bd457b6fe961a42a631306577e622c83876cb6_False,meta-llama/Meta-Llama-3-8B,62bd457b6fe961a42a631306577e622c83876cb6,bfloat16,pretrained,Original,LlamaForCausalLM,13.4632115530557,FALSE,IFEval,0.145506145915061,14.5506145915061,BBH,0.459790519524026,24.500763796768,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.305369127516779,7.38255033557047,MUSR,0.36140625,6.24244791666667,MMLU-PRO,0.320977393617021,24.5530437352246,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B,llama3,5927,8.03,0.87256849761081 -meta-llama/Meta-Llama-3-8B-Instruct_bfloat16_e1945c40cd546c78e41f1151f4db032b271faeaa_True,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,bfloat16,chatmodels,Original,LlamaForCausalLM,23.9087356939368,TRUE,IFEval,0.740839860459137,74.0839860459137,BBH,0.498871111361695,28.2449495763436,MATH Level 5,0.0868580060422961,8.68580060422961,GPQA,0.259228187919463,1.23042505592841,MUSR,0.356822916666667,1.60286458333334,MMLU-PRO,0.366439494680851,29.6043882978723,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3713,8.03,0.797499677890947 -meta-llama/Meta-Llama-3-8B-Instruct_float16_e1945c40cd546c78e41f1151f4db032b271faeaa_False,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,float16,chatmodels,Original,LlamaForCausalLM,20.5965713292081,FALSE,IFEval,0.478232201669349,47.8232201669349,BBH,0.491026417512868,26.7952835025737,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.292785234899329,5.70469798657718,MUSR,0.380541666666667,5.40104166666667,MMLU-PRO,0.359125664893617,28.7917405437352,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-07-08,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3713,8.03,0.949473257188463 +meta-llama/Meta-Llama-3-8B_bfloat16_62bd457b6fe961a42a631306577e622c83876cb6_False,meta-llama/Meta-Llama-3-8B,62bd457b6fe961a42a631306577e622c83876cb6,bfloat16,pretrained,Original,LlamaForCausalLM,13.4632115530557,FALSE,IFEval,0.145506145915061,14.5506145915061,BBH,0.459790519524026,24.500763796768,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.305369127516779,7.38255033557047,MUSR,0.36140625,6.24244791666667,MMLU-PRO,0.320977393617021,24.5530437352246,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B,llama3,5928,8.03,0.87256849761081 +meta-llama/Meta-Llama-3-8B-Instruct_bfloat16_e1945c40cd546c78e41f1151f4db032b271faeaa_True,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,bfloat16,chatmodels,Original,LlamaForCausalLM,23.9087356939368,TRUE,IFEval,0.740839860459137,74.0839860459137,BBH,0.498871111361695,28.2449495763436,MATH Level 5,0.0868580060422961,8.68580060422961,GPQA,0.259228187919463,1.23042505592841,MUSR,0.356822916666667,1.60286458333334,MMLU-PRO,0.366439494680851,29.6043882978723,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-06-12,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3715,8.03,0.797499677890947 +meta-llama/Meta-Llama-3-8B-Instruct_float16_e1945c40cd546c78e41f1151f4db032b271faeaa_False,meta-llama/Meta-Llama-3-8B-Instruct,e1945c40cd546c78e41f1151f4db032b271faeaa,float16,chatmodels,Original,LlamaForCausalLM,20.5965713292081,FALSE,IFEval,0.478232201669349,47.8232201669349,BBH,0.491026417512868,26.7952835025737,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.292785234899329,5.70469798657718,MUSR,0.380541666666667,5.40104166666667,MMLU-PRO,0.359125664893617,28.7917405437352,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-17,2024-07-08,0,meta-llama/Meta-Llama-3-8B-Instruct,llama3,3715,8.03,0.949473257188463 meta-llama/Meta-Llama-3.1-70B_bfloat16_f7d3cc45ed4ff669a354baf2e0f05e65799a0bee_True,meta-llama/Meta-Llama-3.1-70B,f7d3cc45ed4ff669a354baf2e0f05e65799a0bee,bfloat16,pretrained,Original,LlamaForCausalLM,26.2002158433759,TRUE,IFEval,0.168437523548629,16.8437523548629,BBH,0.626006918317161,46.3994129558189,MATH Level 5,0.18429003021148,18.429003021148,GPQA,0.38758389261745,18.34451901566,MUSR,0.4571875,16.5817708333333,MMLU-PRO,0.465425531914894,40.6028368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-70B,llama3.1,327,70.554,13.6018520327186 -meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,754,70.554,26.8020157168701 -meta-llama/Meta-Llama-3.1-8B_bfloat16_e5c39e551424c763dbc3e58e32ef2999d33a6d8d_True,meta-llama/Meta-Llama-3.1-8B,e5c39e551424c763dbc3e58e32ef2999d33a6d8d,bfloat16,pretrained,Original,LlamaForCausalLM,13.8690662612791,TRUE,IFEval,0.126996369632575,12.6996369632575,BBH,0.4666136555004,25.2947798510872,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.296140939597315,6.15212527964205,MUSR,0.382520833333333,8.98177083333333,MMLU-PRO,0.324551196808511,24.9501329787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-8B,llama3.1,1223,8.03,3.5985230038683 -meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3318,8.03,2.48701186834409 +meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,755,70.554,26.8020157168701 +meta-llama/Meta-Llama-3.1-8B_bfloat16_e5c39e551424c763dbc3e58e32ef2999d33a6d8d_True,meta-llama/Meta-Llama-3.1-8B,e5c39e551424c763dbc3e58e32ef2999d33a6d8d,bfloat16,pretrained,Original,LlamaForCausalLM,13.8690662612791,TRUE,IFEval,0.126996369632575,12.6996369632575,BBH,0.4666136555004,25.2947798510872,MATH Level 5,0.0513595166163142,5.13595166163142,GPQA,0.296140939597315,6.15212527964205,MUSR,0.382520833333333,8.98177083333333,MMLU-PRO,0.324551196808511,24.9501329787234,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-14,2024-07-23,0,meta-llama/Meta-Llama-3.1-8B,llama3.1,1224,8.03,3.5985230038683 +meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3325,8.03,2.48701186834409 microsoft/DialoGPT-medium_bfloat16_7b40bb0f92c45fefa957d088000d8648e5c7fa33_True,microsoft/DialoGPT-medium,7b40bb0f92c45fefa957d088000d8648e5c7fa33,bfloat16,chatmodels,Original,GPT2LMHeadModel,5.25143360679031,TRUE,IFEval,0.147904227449833,14.7904227449833,BBH,0.301415638014199,2.55685577233522,MATH Level 5,0,0,GPQA,0.254194630872483,0.559284116331097,MUSR,0.428666666666667,12.2833333333333,MMLU-PRO,0.11186835106383,1.31870567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-13,0,microsoft/DialoGPT-medium,mit,336,0.345,0.129464485100266 microsoft/Orca-2-13b_bfloat16_2539ff53e6baa4cc603774ad5a2d646f4041ea4e_False,microsoft/Orca-2-13b,2539ff53e6baa4cc603774ad5a2d646f4041ea4e,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,18.1494038209109,FALSE,IFEval,0.31279338820995,31.279338820995,BBH,0.488448972883961,27.3080194999426,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.280201342281879,4.0268456375839,MUSR,0.51296875,25.7877604166667,MMLU-PRO,0.274933510638298,19.4370567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-14,2024-06-12,0,microsoft/Orca-2-13b,other,665,13,1.00858169959549 microsoft/Orca-2-7b_bfloat16_60e31e6bdcf582ad103b807cb74b73ee1d2c4b17_False,microsoft/Orca-2-7b,60e31e6bdcf582ad103b807cb74b73ee1d2c4b17,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,14.2160083291346,FALSE,IFEval,0.218346210277619,21.8346210277619,BBH,0.445213226754594,22.4294684028185,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.260906040268456,1.45413870246085,MUSR,0.502614583333333,24.0934895833333,MMLU-PRO,0.23188164893617,14.6535165484634,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-14,2024-06-12,0,microsoft/Orca-2-7b,other,216,7,1.20931193274994 microsoft/Phi-3-medium-128k-instruct_bfloat16_fa7d2aa4f5ea69b2e36b20d050cdae79c9bfbb3f_True,microsoft/Phi-3-medium-128k-instruct,fa7d2aa4f5ea69b2e36b20d050cdae79c9bfbb3f,bfloat16,chatmodels,Original,Phi3ForCausalLM,31.7116532556656,TRUE,IFEval,0.604002934436185,60.4002934436185,BBH,0.638232253087055,48.4604512739902,MATH Level 5,0.172960725075529,17.2960725075529,GPQA,0.336409395973154,11.5212527964206,MUSR,0.412947916666667,11.3518229166667,MMLU-PRO,0.471160239361702,41.2400265957447,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-08-21,0,microsoft/Phi-3-medium-128k-instruct,mit,374,13.96,1.94755874452617 microsoft/Phi-3-medium-4k-instruct_bfloat16_d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc_True,microsoft/Phi-3-medium-4k-instruct,d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc,bfloat16,chatmodels,Original,Phi3ForCausalLM,32.8962495702928,TRUE,IFEval,0.642271395452954,64.2271395452954,BBH,0.641246489055555,49.3806100742202,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.336409395973154,11.5212527964206,MUSR,0.42575,13.0520833333333,MMLU-PRO,0.467586436170213,40.8429373522459,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-12,0,microsoft/Phi-3-medium-4k-instruct,mit,211,13.96,1.45526252332937 -microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1617,3.821,24.2222515926888 -microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1092,3.821,0.804074829912372 -microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1092,3.821,0.786699265454341 +microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1618,3.821,24.2222515926888 +microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1093,3.821,0.804074829912372 +microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1093,3.821,0.786699265454341 microsoft/Phi-3-small-128k-instruct_bfloat16_f80aaa30bfc64c2b8ab214b541d9050e97163bc4_True,microsoft/Phi-3-small-128k-instruct,f80aaa30bfc64c2b8ab214b541d9050e97163bc4,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,28.5909915695228,TRUE,IFEval,0.636825844315306,63.6825844315306,BBH,0.620217677869698,45.6340696414479,MATH Level 5,0,0,GPQA,0.317114093959732,8.94854586129754,MUSR,0.43784375,14.4971354166667,MMLU-PRO,0.449052526595745,38.7836140661939,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-128k-instruct,mit,173,7.392,2.50846790619425 microsoft/Phi-3-small-8k-instruct_bfloat16_1535ae26fb4faada95c6950e8bc6e867cdad6b00_True,microsoft/Phi-3-small-8k-instruct,1535ae26fb4faada95c6950e8bc6e867cdad6b00,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,29.6709218521057,TRUE,IFEval,0.649665110794913,64.9665110794913,BBH,0.620836488087056,46.2055703663891,MATH Level 5,0.0284301430770108,2.84301430770108,GPQA,0.312080536912752,8.27740492170022,MUSR,0.455791666666667,16.7739583333333,MMLU-PRO,0.45063164893617,38.9590721040189,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-8k-instruct,mit,159,7.392,1.0254536035218 microsoft/Phi-3.5-MoE-instruct_bfloat16_482a9ba0eb0e1fa1671e3560e009d7cec2e5147c_True,microsoft/Phi-3.5-MoE-instruct,482a9ba0eb0e1fa1671e3560e009d7cec2e5147c,bfloat16,chatmodels,Original,Phi3ForCausalLM,35.4565075216065,TRUE,IFEval,0.692454908531585,69.2454908531585,BBH,0.640762564622586,48.7746463593219,MATH Level 5,0.226586102719033,22.6586102719033,GPQA,0.355704697986577,14.0939597315436,MUSR,0.456479166666667,17.3265625,MMLU-PRO,0.465757978723404,40.6397754137116,TRUE,FALSE,TRUE,FALSE,TRUE,2024-08-17,2024-08-21,0,microsoft/Phi-3.5-MoE-instruct,mit,540,42,4.63227861394431 -microsoft/Phi-3.5-mini-instruct_bfloat16_64963004ad95869fa73a30279371c8778509ac84_True,microsoft/Phi-3.5-mini-instruct,64963004ad95869fa73a30279371c8778509ac84,bfloat16,chatmodels,Original,Phi3ForCausalLM,27.5675734687961,TRUE,IFEval,0.577450054743636,57.7450054743636,BBH,0.551778512611196,36.7458539085166,MATH Level 5,0.159365558912387,15.9365558912387,GPQA,0.339765100671141,11.9686800894855,MUSR,0.402125,10.0989583333333,MMLU-PRO,0.396193484042553,32.9103871158392,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-16,2024-08-21,0,microsoft/Phi-3.5-mini-instruct,mit,713,3.821,3.69600430233737 +microsoft/Phi-3.5-mini-instruct_bfloat16_64963004ad95869fa73a30279371c8778509ac84_True,microsoft/Phi-3.5-mini-instruct,64963004ad95869fa73a30279371c8778509ac84,bfloat16,chatmodels,Original,Phi3ForCausalLM,27.5675734687961,TRUE,IFEval,0.577450054743636,57.7450054743636,BBH,0.551778512611196,36.7458539085166,MATH Level 5,0.159365558912387,15.9365558912387,GPQA,0.339765100671141,11.9686800894855,MUSR,0.402125,10.0989583333333,MMLU-PRO,0.396193484042553,32.9103871158392,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-16,2024-08-21,0,microsoft/Phi-3.5-mini-instruct,mit,719,3.821,3.69600430233737 microsoft/phi-1_bfloat16_b9ac0e6d78d43970ecf88e9e0154b3a7da20ed89_False,microsoft/phi-1,b9ac0e6d78d43970ecf88e9e0154b3a7da20ed89,bfloat16,pretrained,Original,PhiForCausalLM,5.52396572810627,FALSE,IFEval,0.206805719934219,20.6805719934219,BBH,0.313947558958378,4.27399921221468,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.26510067114094,2.01342281879195,MUSR,0.352510416666667,3.69713541666667,MMLU-PRO,0.116190159574468,1.79890661938534,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-10,2024-06-13,0,microsoft/phi-1,mit,207,1.418,0.28622924752808 microsoft/phi-1_5_float16_675aa382d814580b22651a30acb1a585d7c25963_False,microsoft/phi-1_5,675aa382d814580b22651a30acb1a585d7c25963,float16,pretrained,Original,PhiForCausalLM,7.05767379443971,FALSE,IFEval,0.203283953244059,20.3283953244059,BBH,0.335975832119967,7.46893877007024,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.26761744966443,2.3489932885906,MUSR,0.340416666666667,3.38541666666667,MMLU-PRO,0.169132313829787,7.68136820330969,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-10,2024-06-09,0,microsoft/phi-1_5,mit,1319,1.418,0.340862069057633 microsoft/phi-2_float16_ef382358ec9e382308935a992d908de099b64c23_False,microsoft/phi-2,ef382358ec9e382308935a992d908de099b64c23,float16,pretrained,Original,PhiForCausalLM,15.4713509741263,FALSE,IFEval,0.273875539125077,27.3875539125077,BBH,0.48812087712497,28.0385192934393,MATH Level 5,0.0256797583081571,2.56797583081571,GPQA,0.271812080536913,2.9082774049217,MUSR,0.409895833333333,13.8369791666667,MMLU-PRO,0.26279920212766,18.0888002364066,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-13,2024-06-09,0,microsoft/phi-2,mit,3258,2.78,0.423520982590239 @@ -1789,23 +1806,23 @@ minghaowu/Qwen1.5-1.8B-OpenHermes-2.5_bfloat16_40700de82968350c192318877fe522630 ministral/Ministral-3b-instruct_bfloat16_2c95908929198d6e69af8638f0dbbd9bc6b93f9e_False,ministral/Ministral-3b-instruct,2c95908929198d6e69af8638f0dbbd9bc6b93f9e,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,3.38161348841134,FALSE,IFEval,0.13576421672274,13.576421672274,BBH,0.319185984783324,4.67586357856467,MATH Level 5,0,0,GPQA,0.251677852348993,0.223713646532442,MUSR,0.33825,0.78125,MMLU-PRO,0.109291888297872,1.03243203309693,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-14,2024-10-25,0,ministral/Ministral-3b-instruct,apache-2.0,37,3.316,0.264486930516462 mistral-community/Mistral-7B-v0.2_bfloat16_2c3e624962b1a3f3fbf52e15969565caa7bc064a_False,mistral-community/Mistral-7B-v0.2,2c3e624962b1a3f3fbf52e15969565caa7bc064a,bfloat16,pretrained,Original,MistralForCausalLM,14.2153624426921,FALSE,IFEval,0.2266397602805,22.66397602805,BBH,0.451018796279758,23.9508653830296,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.291946308724832,5.59284116331097,MUSR,0.403177083333333,8.36380208333333,MMLU-PRO,0.295295877659575,21.6995419621749,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-23,2024-06-12,0,mistral-community/Mistral-7B-v0.2,apache-2.0,232,7.242,0.553213277920435 mistral-community/mixtral-8x22B-v0.3_bfloat16_211b177b79ab5ef245ee334d106c27623e786882_False,mistral-community/mixtral-8x22B-v0.3,211b177b79ab5ef245ee334d106c27623e786882,bfloat16,pretrained,Original,MixtralForCausalLM,25.789406608528,FALSE,IFEval,0.258263629392235,25.8263629392235,BBH,0.625000217843585,45.7310408976333,MATH Level 5,0.182779456193354,18.2779456193354,GPQA,0.37751677852349,17.0022371364653,MUSR,0.403697916666667,7.46223958333334,MMLU-PRO,0.463929521276596,40.4366134751773,TRUE,FALSE,TRUE,FALSE,TRUE,2024-05-25,2024-06-13,0,mistral-community/mixtral-8x22B-v0.3,apache-2.0,3,140.63,52.4944851685548 -mistralai/Codestral-22B-v0.1_bfloat16_8f5fe23af91885222a1563283c87416745a5e212_True,mistralai/Codestral-22B-v0.1,8f5fe23af91885222a1563283c87416745a5e212,bfloat16,pretrained,Original,MistralForCausalLM,23.2799174068646,TRUE,IFEval,0.577175228393995,57.7175228393995,BBH,0.513913692100317,30.7376344119456,MATH Level 5,0.100453172205438,10.0453172205438,GPQA,0.298657718120805,6.48769574944072,MUSR,0.418708333333333,10.7385416666667,MMLU-PRO,0.315575132978723,23.9527925531915,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-29,2024-09-28,0,mistralai/Codestral-22B-v0.1,other,1167,22.247,1.3066695609381 -mistralai/Ministral-8B-Instruct-2410_bfloat16_199e57c1d66379760f6413f79d27008d1d1dbd6e_True,mistralai/Ministral-8B-Instruct-2410,199e57c1d66379760f6413f79d27008d1d1dbd6e,bfloat16,chatmodels,Original,MistralForCausalLM,22.0078589303086,TRUE,IFEval,0.589639933155139,58.963993315514,BBH,0.476164020168914,25.8247744094178,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.284395973154362,4.58612975391499,MUSR,0.41375,10.71875,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-15,2024-12-01,0,mistralai/Ministral-8B-Instruct-2410,other,369,8.02,0.797086392156932 +mistralai/Codestral-22B-v0.1_bfloat16_8f5fe23af91885222a1563283c87416745a5e212_True,mistralai/Codestral-22B-v0.1,8f5fe23af91885222a1563283c87416745a5e212,bfloat16,pretrained,Original,MistralForCausalLM,23.2799174068646,TRUE,IFEval,0.577175228393995,57.7175228393995,BBH,0.513913692100317,30.7376344119456,MATH Level 5,0.100453172205438,10.0453172205438,GPQA,0.298657718120805,6.48769574944072,MUSR,0.418708333333333,10.7385416666667,MMLU-PRO,0.315575132978723,23.9527925531915,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-29,2024-09-28,0,mistralai/Codestral-22B-v0.1,other,1169,22.247,1.3066695609381 +mistralai/Ministral-8B-Instruct-2410_bfloat16_199e57c1d66379760f6413f79d27008d1d1dbd6e_True,mistralai/Ministral-8B-Instruct-2410,199e57c1d66379760f6413f79d27008d1d1dbd6e,bfloat16,chatmodels,Original,MistralForCausalLM,22.0078589303086,TRUE,IFEval,0.589639933155139,58.963993315514,BBH,0.476164020168914,25.8247744094178,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.284395973154362,4.58612975391499,MUSR,0.41375,10.71875,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-15,2024-12-01,0,mistralai/Ministral-8B-Instruct-2410,other,372,8.02,0.797086392156932 mistralai/Mistral-7B-Instruct-v0.1_bfloat16_73068f3702d050a2fd5aa2ca1e612e5036429398_True,mistralai/Mistral-7B-Instruct-v0.1,73068f3702d050a2fd5aa2ca1e612e5036429398,bfloat16,chatmodels,Original,MistralForCausalLM,12.6957006941243,TRUE,IFEval,0.448706099815157,44.8706099815157,BBH,0.33548084759811,7.64702053582754,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.25,0,MUSR,0.384760416666667,6.12838541666667,MMLU-PRO,0.241439494680851,15.7154994089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-27,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,1538,7.242,1.21604471748007 -mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2600,7.242,0.534406629050985 -mistralai/Mistral-7B-Instruct-v0.3_bfloat16_83e9aa141f2e28c82232fea5325f54edf17c43de_True,mistralai/Mistral-7B-Instruct-v0.3,83e9aa141f2e28c82232fea5325f54edf17c43de,bfloat16,chatmodels,Original,MistralForCausalLM,19.174746309635,TRUE,IFEval,0.546525441384416,54.6525441384416,BBH,0.472196317126484,25.569114948859,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.279362416107383,3.91498881431767,MUSR,0.37390625,4.30494791666667,MMLU-PRO,0.30751329787234,23.0570330969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,1,mistralai/Mistral-7B-v0.3,apache-2.0,1200,7.248,0.5377834643891 +mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2601,7.242,0.534406629050985 +mistralai/Mistral-7B-Instruct-v0.3_bfloat16_83e9aa141f2e28c82232fea5325f54edf17c43de_True,mistralai/Mistral-7B-Instruct-v0.3,83e9aa141f2e28c82232fea5325f54edf17c43de,bfloat16,chatmodels,Original,MistralForCausalLM,19.174746309635,TRUE,IFEval,0.546525441384416,54.6525441384416,BBH,0.472196317126484,25.569114948859,MATH Level 5,0.0354984894259819,3.54984894259819,GPQA,0.279362416107383,3.91498881431767,MUSR,0.37390625,4.30494791666667,MMLU-PRO,0.30751329787234,23.0570330969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,1,mistralai/Mistral-7B-v0.3,apache-2.0,1201,7.248,0.5377834643891 mistralai/Mistral-7B-v0.1_bfloat16_26bca36bde8333b5d7f72e9ed20ccda6a618af24_False,mistralai/Mistral-7B-v0.1,26bca36bde8333b5d7f72e9ed20ccda6a618af24,bfloat16,pretrained,Original,MistralForCausalLM,14.5626190834339,FALSE,IFEval,0.238554812342363,23.8554812342363,BBH,0.443106781218371,22.1684024578981,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.291946308724832,5.59284116331097,MUSR,0.4139375,10.6755208333333,MMLU-PRO,0.301279920212766,22.3644355791962,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-20,2024-06-12,0,mistralai/Mistral-7B-v0.1,apache-2.0,3507,7.242,0.675534465568117 mistralai/Mistral-7B-v0.3_bfloat16_b67d6a03ca097c5122fa65904fce0413500bf8c8_False,mistralai/Mistral-7B-v0.3,b67d6a03ca097c5122fa65904fce0413500bf8c8,bfloat16,pretrained,Original,MistralForCausalLM,14.2153624426921,FALSE,IFEval,0.2266397602805,22.66397602805,BBH,0.451018796279758,23.9508653830296,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.291946308724832,5.59284116331097,MUSR,0.403177083333333,8.36380208333333,MMLU-PRO,0.295295877659575,21.6995419621749,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-22,2024-06-12,0,mistralai/Mistral-7B-v0.3,apache-2.0,409,7.248,0.660475600081291 mistralai/Mistral-Large-Instruct-2411_float16_3a5cb136f6106edf5c1210369068eb5a4f787cab_True,mistralai/Mistral-Large-Instruct-2411,3a5cb136f6106edf5c1210369068eb5a4f787cab,float16,chatmodels,Original,MistralForCausalLM,38.4552314758039,TRUE,IFEval,0.840057713533425,84.0057713533425,BBH,0.674664773567507,52.7448919952634,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.437080536912752,24.9440715883669,MUSR,0.454,17.2166666666667,MMLU-PRO,0.556183510638298,50.6870567375887,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-14,2024-11-19,0,mistralai/Mistral-Large-Instruct-2411,other,176,122.61,26.272305228873 -mistralai/Mistral-Nemo-Base-2407_bfloat16_d2efb15544d5401f761235bef327babb850887d0_False,mistralai/Mistral-Nemo-Base-2407,d2efb15544d5401f761235bef327babb850887d0,bfloat16,pretrained,Original,MistralForCausalLM,15.1386511082141,FALSE,IFEval,0.162991972410981,16.2991972410981,BBH,0.503506200036929,29.3747364409669,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.293624161073826,5.8165548098434,MUSR,0.392135416666667,6.51692708333334,MMLU-PRO,0.347157579787234,27.4619533096927,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-07-19,0,mistralai/Mistral-Nemo-Base-2407,apache-2.0,266,11.58,1.70299545491031 -mistralai/Mistral-Nemo-Instruct-2407_bfloat16_4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5_True,mistralai/Mistral-Nemo-Instruct-2407,4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5,bfloat16,chatmodels,Original,MistralForCausalLM,23.6333743622513,TRUE,IFEval,0.638024885082692,63.8024885082692,BBH,0.503652395031081,29.6799703811528,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.290268456375839,5.36912751677852,MUSR,0.39,8.48333333333333,MMLU-PRO,0.351728723404255,27.9698581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-17,2024-08-29,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,1315,12.248,2.99760056248369 -mistralai/Mistral-Small-Instruct-2409_bfloat16_63e53df6575e7085d62113f4383835ff979b3795_True,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,bfloat16,chatmodels,Original,MistralForCausalLM,26.2627489764183,TRUE,IFEval,0.666975846310013,66.6975846310013,BBH,0.521307509814622,30.7920960925092,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.323825503355705,9.84340044742729,MUSR,0.363208333333333,3.00104166666667,MMLU-PRO,0.396027260638298,32.8919178486998,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,0,mistralai/Mistral-Small-Instruct-2409,other,361,22.05,1.37933750885174 -mistralai/Mistral-Small-Instruct-2409_float16_63e53df6575e7085d62113f4383835ff979b3795_False,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,29.8182425699334,FALSE,IFEval,0.628282955890371,62.8282955890371,BBH,0.583028384689821,40.5597130348992,MATH Level 5,0.197885196374622,19.7885196374622,GPQA,0.333053691275168,11.0738255033557,MUSR,0.406333333333333,10.225,MMLU-PRO,0.409906914893617,34.4341016548463,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-25,0,mistralai/Mistral-Small-Instruct-2409,other,361,22.247,1.61000748804136 +mistralai/Mistral-Nemo-Base-2407_bfloat16_d2efb15544d5401f761235bef327babb850887d0_False,mistralai/Mistral-Nemo-Base-2407,d2efb15544d5401f761235bef327babb850887d0,bfloat16,pretrained,Original,MistralForCausalLM,15.1386511082141,FALSE,IFEval,0.162991972410981,16.2991972410981,BBH,0.503506200036929,29.3747364409669,MATH Level 5,0.0536253776435045,5.36253776435045,GPQA,0.293624161073826,5.8165548098434,MUSR,0.392135416666667,6.51692708333334,MMLU-PRO,0.347157579787234,27.4619533096927,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-07-19,0,mistralai/Mistral-Nemo-Base-2407,apache-2.0,267,11.58,1.70299545491031 +mistralai/Mistral-Nemo-Instruct-2407_bfloat16_4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5_True,mistralai/Mistral-Nemo-Instruct-2407,4d14c1db68fe20dbf80b8eca85d39b909c5fe1d5,bfloat16,chatmodels,Original,MistralForCausalLM,23.6333743622513,TRUE,IFEval,0.638024885082692,63.8024885082692,BBH,0.503652395031081,29.6799703811528,MATH Level 5,0.0649546827794562,6.49546827794562,GPQA,0.290268456375839,5.36912751677852,MUSR,0.39,8.48333333333333,MMLU-PRO,0.351728723404255,27.9698581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-17,2024-08-29,1,mistralai/Mistral-Nemo-Base-2407,apache-2.0,1319,12.248,2.99760056248369 +mistralai/Mistral-Small-Instruct-2409_bfloat16_63e53df6575e7085d62113f4383835ff979b3795_True,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,bfloat16,chatmodels,Original,MistralForCausalLM,26.2627489764183,TRUE,IFEval,0.666975846310013,66.6975846310013,BBH,0.521307509814622,30.7920960925092,MATH Level 5,0.143504531722054,14.3504531722054,GPQA,0.323825503355705,9.84340044742729,MUSR,0.363208333333333,3.00104166666667,MMLU-PRO,0.396027260638298,32.8919178486998,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-19,0,mistralai/Mistral-Small-Instruct-2409,other,362,22.05,1.37933750885174 +mistralai/Mistral-Small-Instruct-2409_float16_63e53df6575e7085d62113f4383835ff979b3795_False,mistralai/Mistral-Small-Instruct-2409,63e53df6575e7085d62113f4383835ff979b3795,float16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,29.8182425699334,FALSE,IFEval,0.628282955890371,62.8282955890371,BBH,0.583028384689821,40.5597130348992,MATH Level 5,0.197885196374622,19.7885196374622,GPQA,0.333053691275168,11.0738255033557,MUSR,0.406333333333333,10.225,MMLU-PRO,0.409906914893617,34.4341016548463,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-17,2024-09-25,0,mistralai/Mistral-Small-Instruct-2409,other,362,22.247,1.61000748804136 mistralai/Mixtral-8x22B-Instruct-v0.1_bfloat16_b0c3516041d014f640267b14feb4e9a84c8e8c71_True,mistralai/Mixtral-8x22B-Instruct-v0.1,b0c3516041d014f640267b14feb4e9a84c8e8c71,bfloat16,chatmodels,Original,MixtralForCausalLM,33.885680288082,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.612492492627202,44.1143455872484,MATH Level 5,0.187311178247734,18.7311178247734,GPQA,0.373322147651007,16.4429530201342,MUSR,0.431114583333333,13.4893229166667,MMLU-PRO,0.448304521276596,38.7005023640662,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,1,mistralai/Mixtral-8x22B-v0.1,apache-2.0,696,140.621,47.147578592378 mistralai/Mixtral-8x22B-v0.1_bfloat16_b03e260818710044a2f088d88fab12bb220884fb_False,mistralai/Mixtral-8x22B-v0.1,b03e260818710044a2f088d88fab12bb220884fb,bfloat16,pretrained,Original,MixtralForCausalLM,25.7283481584049,FALSE,IFEval,0.258263629392235,25.8263629392235,BBH,0.623980747318727,45.5884038434272,MATH Level 5,0.182779456193354,18.2779456193354,GPQA,0.375838926174497,16.7785234899329,MUSR,0.403697916666667,7.46223958333334,MMLU-PRO,0.463929521276596,40.4366134751773,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,0,mistralai/Mixtral-8x22B-v0.1,apache-2.0,202,140.621,104.697316275112 -mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4235,46.703,13.7649393661468 -mistralai/Mixtral-8x7B-v0.1_bfloat16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,bfloat16,pretrained,Original,MixtralForCausalLM,19.4519879614403,FALSE,IFEval,0.24152692633324,24.152692633324,BBH,0.508666743762444,30.2941949189615,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.313758389261745,8.50111856823266,MUSR,0.432135416666667,12.58359375,MMLU-PRO,0.384973404255319,31.6637115839244,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-08-20,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1655,46.703,18.3878645797549 -mistralai/Mixtral-8x7B-v0.1_float16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,float16,fine-tunedondomain-specificdatasets,Original,MixtralForCausalLM,19.6651089183161,FALSE,IFEval,0.232609476189843,23.2609476189843,BBH,0.509771137755339,30.4002992674255,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.320469798657718,9.39597315436242,MUSR,0.4413125,13.6640625,MMLU-PRO,0.387134308510638,31.9038120567376,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-06-27,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1655,46.703,5.13509985481396 +mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4241,46.703,13.7649393661468 +mistralai/Mixtral-8x7B-v0.1_bfloat16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,bfloat16,pretrained,Original,MixtralForCausalLM,19.4519879614403,FALSE,IFEval,0.24152692633324,24.152692633324,BBH,0.508666743762444,30.2941949189615,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.313758389261745,8.50111856823266,MUSR,0.432135416666667,12.58359375,MMLU-PRO,0.384973404255319,31.6637115839244,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-08-20,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1657,46.703,18.3878645797549 +mistralai/Mixtral-8x7B-v0.1_float16_985aa055896a8f943d4a9f2572e6ea1341823841_False,mistralai/Mixtral-8x7B-v0.1,985aa055896a8f943d4a9f2572e6ea1341823841,float16,fine-tunedondomain-specificdatasets,Original,MixtralForCausalLM,19.6651089183161,FALSE,IFEval,0.232609476189843,23.2609476189843,BBH,0.509771137755339,30.4002992674255,MATH Level 5,0.0936555891238671,9.36555891238671,GPQA,0.320469798657718,9.39597315436242,MUSR,0.4413125,13.6640625,MMLU-PRO,0.387134308510638,31.9038120567376,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-01,2024-06-27,0,mistralai/Mixtral-8x7B-v0.1,apache-2.0,1657,46.703,5.13509985481396 mixtao/MixTAO-7Bx2-MoE-v8.1_bfloat16_339130b87b6ef2484fea9fbfacba8a714ac03347_False,mixtao/MixTAO-7Bx2-MoE-v8.1,339130b87b6ef2484fea9fbfacba8a714ac03347,bfloat16,fine-tunedondomain-specificdatasets,Original,MixtralForCausalLM,21.0779269837969,FALSE,IFEval,0.416233371897676,41.6233371897676,BBH,0.518905939173352,32.3103423396992,MATH Level 5,0.0906344410876133,9.06344410876133,GPQA,0.284395973154362,4.58612975391499,MUSR,0.446333333333333,15.2916666666667,MMLU-PRO,0.312333776595745,23.5926418439716,TRUE,FALSE,TRUE,FALSE,FALSE,2024-02-26,2024-10-04,0,mixtao/MixTAO-7Bx2-MoE-v8.1,apache-2.0,55,12.879,0.924035071773507 mkxu/llama-3-8b-po1_float16_1b16e10de696c43cd2b49fac9f6195dc551438ee_False,mkxu/llama-3-8b-po1,1b16e10de696c43cd2b49fac9f6195dc551438ee,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.7670021917018,FALSE,IFEval,0.408114912875615,40.8114912875615,BBH,0.497608548522464,29.1817588733231,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.296979865771812,6.26398210290828,MUSR,0.380416666666667,6.85208333333334,MMLU-PRO,0.356216755319149,28.4685283687943,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-29,2024-11-29,0,mkxu/llama-3-8b-po1,"",0,8.03,0.512188140666852 mlabonne/AlphaMonarch-7B_float16_3de065d84411d74e5b3590f67f52b0b71faf6161_True,mlabonne/AlphaMonarch-7B,3de065d84411d74e5b3590f67f52b0b71faf6161,float16,chatmodels,Original,MistralForCausalLM,17.6557974256451,TRUE,IFEval,0.493943846771012,49.3943846771012,BBH,0.462552203718321,23.9473780254263,MATH Level 5,0.0422960725075529,4.22960725075529,GPQA,0.27013422818792,2.68456375838927,MUSR,0.412135416666667,9.31692708333333,MMLU-PRO,0.247257313829787,16.3619237588653,TRUE,TRUE,FALSE,FALSE,TRUE,2024-02-14,2024-06-12,1,mlabonne/AlphaMonarch-7B (Merge),cc-by-nc-4.0,148,7.242,0.572571709880913 @@ -1918,7 +1935,7 @@ nhyha/merge_Qwen2.5-7B-Instruct_20241023_0314_bfloat16_4d93f65c1f870556f05c77a1e nidum/Nidum-Limitless-Gemma-2B_float16_e209e3513d2b34c0e6c433ede26e17604c25cb1a_True,nidum/Nidum-Limitless-Gemma-2B,e209e3513d2b34c0e6c433ede26e17604c25cb1a,float16,fine-tunedondomain-specificdatasets,Original,GemmaForCausalLM,5.93942184856343,TRUE,IFEval,0.242351405382164,24.2351405382164,BBH,0.307880152007632,3.45106015161011,MATH Level 5,0,0,GPQA,0.264261744966443,1.90156599552573,MUSR,0.37403125,4.12057291666667,MMLU-PRO,0.117353723404255,1.9281914893617,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-02,2024-08-07,0,nidum/Nidum-Limitless-Gemma-2B,apache-2.0,4,2.506,0.396813696091378 nisten/franqwenstein-35b_float16_7180aa73e82945a1d2ae0eb304508e21d57e4c27_False,nisten/franqwenstein-35b,7180aa73e82945a1d2ae0eb304508e21d57e4c27,float16,basemergesandmoerges,Original,Qwen2ForCausalLM,35.9419257874126,FALSE,IFEval,0.379863207400808,37.9863207400808,BBH,0.664657917804927,52.2274680776535,MATH Level 5,0.302870090634441,30.2870090634441,GPQA,0.403523489932886,20.4697986577181,MUSR,0.494020833333333,22.1192708333333,MMLU-PRO,0.573055186170213,52.5616873522459,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-03,2024-10-03,1,nisten/franqwenstein-35b (Merge),mit,7,34.714,5.01776970227729 nisten/franqwenstein-35b_bfloat16_901351a987d664a1cd7f483115a167d3ae5694ec_True,nisten/franqwenstein-35b,901351a987d664a1cd7f483115a167d3ae5694ec,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,34.4511168312242,TRUE,IFEval,0.391353830059797,39.1353830059797,BBH,0.659113259870112,51.6802768732971,MATH Level 5,0.304380664652568,30.4380664652568,GPQA,0.359060402684564,14.5413870246085,MUSR,0.468104166666667,19.6796875,MMLU-PRO,0.56108710106383,51.2319001182033,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-03,2024-10-03,1,nisten/franqwenstein-35b (Merge),mit,7,34.714,6.32860413016356 -nisten/tqwendo-36b_bfloat16_c50f38e8421785af4b8596f81e0098a6585b4f05_False,nisten/tqwendo-36b,c50f38e8421785af4b8596f81e0098a6585b4f05,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,36.67666504459,FALSE,IFEval,0.677767213216488,67.7767213216488,BBH,0.643183083265909,49.4149364818743,MATH Level 5,0.393504531722054,39.3504531722054,GPQA,0.331375838926175,10.8501118568233,MUSR,0.442958333333333,15.103125,MMLU-PRO,0.438081781914894,37.5646424349882,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,nisten/tqwendo-36b (Merge),mit,2,17.845,9.15039126082312 +nisten/tqwendo-36b_bfloat16_c50f38e8421785af4b8596f81e0098a6585b4f05_False,nisten/tqwendo-36b,c50f38e8421785af4b8596f81e0098a6585b4f05,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,36.67666504459,FALSE,IFEval,0.677767213216488,67.7767213216488,BBH,0.643183083265909,49.4149364818743,MATH Level 5,0.393504531722054,39.3504531722054,GPQA,0.331375838926175,10.8501118568233,MUSR,0.442958333333333,15.103125,MMLU-PRO,0.438081781914894,37.5646424349882,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,nisten/tqwendo-36b (Merge),mit,3,17.845,9.15039126082312 nlpguy/Mistral-NeMo-Minitron-Upscale-v1_bfloat16_9e6d747cbb81e1f25915a0f42802cbeb85b61c3e_False,nlpguy/Mistral-NeMo-Minitron-Upscale-v1,9e6d747cbb81e1f25915a0f42802cbeb85b61c3e,bfloat16,pretrained,Original,MistralForCausalLM,10.8769297446175,FALSE,IFEval,0.16484040124647,16.484040124647,BBH,0.446799840979671,22.0689096857721,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.280201342281879,4.0268456375839,MUSR,0.380354166666667,4.84427083333334,MMLU-PRO,0.253740026595745,17.082225177305,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-29,2024-09-29,1,nlpguy/Mistral-NeMo-Minitron-Upscale-v1 (Merge),other,0,12.451,2.93430579968674 nlpguy/Mistral-NeMo-Minitron-Upscale-v2_bfloat16_4ac077e496705687fdcbe51f3b915be42e91bf79_False,nlpguy/Mistral-NeMo-Minitron-Upscale-v2,4ac077e496705687fdcbe51f3b915be42e91bf79,bfloat16,pretrained,Original,MistralForCausalLM,8.23215104600528,FALSE,IFEval,0.157271594923691,15.7271594923691,BBH,0.394966815480722,14.3826732880782,MATH Level 5,0.00604229607250755,0.604229607250755,GPQA,0.273489932885906,3.13199105145414,MUSR,0.379083333333333,5.25208333333333,MMLU-PRO,0.192652925531915,10.2947695035461,TRUE,TRUE,FALSE,FALSE,FALSE,2024-09-29,2024-09-29,1,nlpguy/Mistral-NeMo-Minitron-Upscale-v2 (Merge),other,0,12.451,2.92461867067532 nlpguy/Mistral-NeMo-Minitron-Upscale-v3_bfloat16_6703b09d3d78cc020448ee93c53dc727312bcbaf_False,nlpguy/Mistral-NeMo-Minitron-Upscale-v3,6703b09d3d78cc020448ee93c53dc727312bcbaf,bfloat16,pretrained,Original,MistralForCausalLM,5.01343743805603,FALSE,IFEval,0.141209767860388,14.1209767860388,BBH,0.305245226029181,3.39826644771649,MATH Level 5,0,0,GPQA,0.259228187919463,1.23042505592841,MUSR,0.40984375,9.43046875,MMLU-PRO,0.117104388297872,1.90048758865248,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-04,2024-10-04,1,nlpguy/Mistral-NeMo-Minitron-Upscale-v3 (Merge),other,1,12.451,6.04466857955523 @@ -1930,12 +1947,12 @@ nothingiisreal/MN-12B-Starcannon-v3_bfloat16_169480b62121c4f070e93a05158545c6797 nvidia/Hymba-1.5B-Base_bfloat16_85e5b833d75f26170c7684ba83140f1bf9fedf37_False,nvidia/Hymba-1.5B-Base,85e5b833d75f26170c7684ba83140f1bf9fedf37,bfloat16,pretrained,Original,HymbaForCausalLM,7.92198908307419,FALSE,IFEval,0.229512138902556,22.9512138902556,BBH,0.325647852141822,7.68994111813814,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.255872483221477,0.782997762863532,MUSR,0.356635416666667,5.17942708333334,MMLU-PRO,0.192237367021277,10.2485963356974,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-09,2024-12-06,0,nvidia/Hymba-1.5B-Base,other,128,1.523,9.10791437880169 nvidia/Hymba-1.5B-Instruct_bfloat16_ffc758eefef247c0ee4d7ce41636562759027ce6_True,nvidia/Hymba-1.5B-Instruct,ffc758eefef247c0ee4d7ce41636562759027ce6,bfloat16,chatmodels,Original,HymbaForCausalLM,13.7392113616459,TRUE,IFEval,0.600905597148898,60.0905597148898,BBH,0.306713390823188,4.59146361547248,MATH Level 5,0,0,GPQA,0.288590604026846,5.14541387024609,MUSR,0.331583333333333,1.04791666666667,MMLU-PRO,0.204039228723404,11.5599143026005,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-31,2024-12-06,1,nvidia/Hymba-1.5B-Instruct (Merge),other,213,1.523,6.71266576424283 nvidia/Llama-3.1-Minitron-4B-Depth-Base_bfloat16_40d82bc951b4f39e9c9e11176334250c30975098_False,nvidia/Llama-3.1-Minitron-4B-Depth-Base,40d82bc951b4f39e9c9e11176334250c30975098,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.5321699752737,FALSE,IFEval,0.16069362624503,16.069362624503,BBH,0.417070419310489,19.4441095555079,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.263422818791946,1.78970917225951,MUSR,0.4010625,10.6994791666667,MMLU-PRO,0.27983710106383,19.9819001182033,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-13,2024-09-25,0,nvidia/Llama-3.1-Minitron-4B-Depth-Base,other,20,4.02,0.467690635805229 -nvidia/Llama-3.1-Nemotron-70B-Instruct-HF_bfloat16_250db5cf2323e04a6d2025a2ca2b94a95c439e88_True,nvidia/Llama-3.1-Nemotron-70B-Instruct-HF,250db5cf2323e04a6d2025a2ca2b94a95c439e88,bfloat16,chatmodels,Original,LlamaForCausalLM,34.5783715382223,TRUE,IFEval,0.738067217205903,73.8067217205903,BBH,0.631600066889504,47.1095304937273,MATH Level 5,0.287009063444109,28.7009063444109,GPQA,0.258389261744966,1.11856823266219,MUSR,0.432760416666667,13.1950520833333,MMLU-PRO,0.491855053191489,43.5394503546099,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-12,2024-10-16,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1932,70.554,13.6287476336013 +nvidia/Llama-3.1-Nemotron-70B-Instruct-HF_bfloat16_250db5cf2323e04a6d2025a2ca2b94a95c439e88_True,nvidia/Llama-3.1-Nemotron-70B-Instruct-HF,250db5cf2323e04a6d2025a2ca2b94a95c439e88,bfloat16,chatmodels,Original,LlamaForCausalLM,34.5783715382223,TRUE,IFEval,0.738067217205903,73.8067217205903,BBH,0.631600066889504,47.1095304937273,MATH Level 5,0.287009063444109,28.7009063444109,GPQA,0.258389261744966,1.11856823266219,MUSR,0.432760416666667,13.1950520833333,MMLU-PRO,0.491855053191489,43.5394503546099,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-12,2024-10-16,2,meta-llama/Meta-Llama-3.1-70B,llama3.1,1937,70.554,13.6287476336013 nvidia/Minitron-4B-Base_bfloat16_d6321f64412982046a32d761701167e752fedc02_False,nvidia/Minitron-4B-Base,d6321f64412982046a32d761701167e752fedc02,bfloat16,pretrained,Original,NemotronForCausalLM,11.9399727051767,FALSE,IFEval,0.221793729526545,22.1793729526545,BBH,0.40838762439925,17.2156006550611,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.269295302013423,2.57270693512304,MUSR,0.413375,9.93854166666667,MMLU-PRO,0.261968085106383,17.9964539007092,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-19,2024-09-25,0,nvidia/Minitron-4B-Base,other,127,4,1.18926681315643 nvidia/Minitron-8B-Base_bfloat16_70fa5997afc42807f41eebd5d481f040556fdf97_False,nvidia/Minitron-8B-Base,70fa5997afc42807f41eebd5d481f040556fdf97,bfloat16,pretrained,Original,NemotronForCausalLM,14.1787264154315,FALSE,IFEval,0.242426760994162,24.2426760994162,BBH,0.43950631883576,22.0407929700052,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.273489932885906,3.13199105145414,MUSR,0.402552083333333,9.08567708333334,MMLU-PRO,0.318068484042553,24.2298315602837,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-19,2024-09-25,0,nvidia/Minitron-8B-Base,other,63,7.22,1.41252072016633 nvidia/Mistral-NeMo-Minitron-8B-Base_bfloat16_cc94637b669b62c4829b1e0c3b9074fecd883b74_False,nvidia/Mistral-NeMo-Minitron-8B-Base,cc94637b669b62c4829b1e0c3b9074fecd883b74,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,17.6601615070764,FALSE,IFEval,0.194565973838305,19.4565973838305,BBH,0.521909809052142,31.8220151574902,MATH Level 5,0.0460725075528701,4.60725075528701,GPQA,0.325503355704698,10.0671140939597,MUSR,0.40915625,8.94453125,MMLU-PRO,0.379571143617021,31.0634604018913,TRUE,FALSE,FALSE,FALSE,TRUE,2024-08-19,2024-08-22,0,nvidia/Mistral-NeMo-Minitron-8B-Base,other,166,7.88,3.40402832024504 nvidia/Mistral-NeMo-Minitron-8B-Instruct_bfloat16_27964e305f862f9947f577332a943d7013abc30f_True,nvidia/Mistral-NeMo-Minitron-8B-Instruct,27964e305f862f9947f577332a943d7013abc30f,bfloat16,chatmodels,Original,MistralForCausalLM,21.722143311104,TRUE,IFEval,0.500388967938403,50.0388967938403,BBH,0.532091960584029,34.1264912453462,MATH Level 5,0.00528700906344411,0.528700906344411,GPQA,0.287751677852349,5.03355704697987,MUSR,0.388572916666667,7.37161458333333,MMLU-PRO,0.399102393617021,33.2335992907801,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,2024-10-04,1,nvidia/Mistral-NeMo-Minitron-8B-Instruct (Merge),other,70,8.414,1.99389796292529 -nvidia/Nemotron-Mini-4B-Instruct_bfloat16_6a417790c444fd65a3da6a5c8821de6afc9654a6_True,nvidia/Nemotron-Mini-4B-Instruct,6a417790c444fd65a3da6a5c8821de6afc9654a6,bfloat16,chatmodels,Original,NemotronForCausalLM,17.9355153410832,TRUE,IFEval,0.666876110941192,66.6876110941192,BBH,0.386484079859154,14.2038251788621,MATH Level 5,0,0,GPQA,0.280201342281879,4.0268456375839,MUSR,0.376729166666667,4.62447916666667,MMLU-PRO,0.262632978723404,18.0703309692671,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-10,2024-09-25,1,nvidia/Minitron-4B-Base,other,135,4,1.1173137879977 +nvidia/Nemotron-Mini-4B-Instruct_bfloat16_6a417790c444fd65a3da6a5c8821de6afc9654a6_True,nvidia/Nemotron-Mini-4B-Instruct,6a417790c444fd65a3da6a5c8821de6afc9654a6,bfloat16,chatmodels,Original,NemotronForCausalLM,17.9355153410832,TRUE,IFEval,0.666876110941192,66.6876110941192,BBH,0.386484079859154,14.2038251788621,MATH Level 5,0,0,GPQA,0.280201342281879,4.0268456375839,MUSR,0.376729166666667,4.62447916666667,MMLU-PRO,0.262632978723404,18.0703309692671,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-10,2024-09-25,1,nvidia/Minitron-4B-Base,other,137,4,1.1173137879977 nvidia/OpenMath2-Llama3.1-8B_float16_4187cd28e77e76367261992b3274c77ffcbfd3d5_False,nvidia/OpenMath2-Llama3.1-8B,4187cd28e77e76367261992b3274c77ffcbfd3d5,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.98781780182601,FALSE,IFEval,0.233059393520304,23.3059393520304,BBH,0.409552414016945,16.2943699762186,MATH Level 5,0.0415407854984894,4.15407854984894,GPQA,0.26510067114094,2.01342281879195,MUSR,0.343552083333333,2.01067708333333,MMLU-PRO,0.155335771276596,6.14841903073286,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-30,2024-12-07,1,nvidia/OpenMath2-Llama3.1-8B (Merge),llama3.1,25,8.03,1.62670493051135 nxmwxm/Beast-Soul-new_float16_dd2ae8a96b7d088eb94a1cfa6ff84c3489e8c010_False,nxmwxm/Beast-Soul-new,dd2ae8a96b7d088eb94a1cfa6ff84c3489e8c010,float16,basemergesandmoerges,Original,MistralForCausalLM,21.830261529422,FALSE,IFEval,0.486874825463105,48.6874825463105,BBH,0.522714362888452,33.0727591685521,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.281879194630873,4.25055928411633,MUSR,0.445927083333333,14.1408854166667,MMLU-PRO,0.310172872340426,23.3525413711584,FALSE,FALSE,FALSE,FALSE,FALSE,2024-08-07,2024-08-07,1,nxmwxm/Beast-Soul-new (Merge),"",0,7.242,0.657023046365319 occiglot/occiglot-7b-es-en-instruct_float16_5858f6ee118eef70896f1870fd61052348ff571e_True,occiglot/occiglot-7b-es-en-instruct,5858f6ee118eef70896f1870fd61052348ff571e,float16,chatmodels,Original,MistralForCausalLM,12.3949633909971,TRUE,IFEval,0.348514164638714,34.8514164638714,BBH,0.411097022978108,17.2354103556121,MATH Level 5,0.020392749244713,2.0392749244713,GPQA,0.259228187919463,1.23042505592841,MUSR,0.37375,4.45208333333333,MMLU-PRO,0.231050531914894,14.561170212766,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-05,2024-09-02,0,occiglot/occiglot-7b-es-en-instruct,apache-2.0,2,7.242,0.688738120742571 @@ -1948,8 +1965,8 @@ oopere/pruned40-llama-1b_float16_3de470d9c61cb57cea821e93b43fb250aa14b975_False, oopere/pruned40-llama-3.2-3b_float16_ceb2073cda2f21afa10efcbae74583fc9b319d54_False,oopere/pruned40-llama-3.2-3b,ceb2073cda2f21afa10efcbae74583fc9b319d54,float16,pretrained,Original,LlamaForCausalLM,5.18246289956441,FALSE,IFEval,0.218296342593208,21.8296342593208,BBH,0.316711702809771,4.74010154594563,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.229865771812081,0,MUSR,0.3539375,2.40885416666667,MMLU-PRO,0.117686170212766,1.96513002364066,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2024-12-12,1,oopere/pruned40-llama-3.2-3b (Merge),llama3.2,0,3,0.597667318719724 oopere/pruned60-llama-1b_float16_86b157256928b50ee07cc3cf5b3884b70062f2fe_False,oopere/pruned60-llama-1b,86b157256928b50ee07cc3cf5b3884b70062f2fe,float16,pretrained,Original,LlamaForCausalLM,5.42980237577008,FALSE,IFEval,0.182850392514085,18.2850392514085,BBH,0.30161934741854,2.94252648075335,MATH Level 5,0,0,GPQA,0.249161073825503,0,MUSR,0.408791666666667,9.43229166666667,MMLU-PRO,0.117270611702128,1.91895685579196,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-16,2024-11-25,1,oopere/pruned60-llama-1b (Merge),llama3.2,0,0.753,0.382487881515074 oopere/pruned60-llama-3.2-3b_float16_c8c061d55288274a59205fa740b51a951ca93335_False,oopere/pruned60-llama-3.2-3b,c8c061d55288274a59205fa740b51a951ca93335,float16,pretrained,Original,LlamaForCausalLM,5.065740099545,FALSE,IFEval,0.182475830795622,18.2475830795622,BBH,0.31662597093352,3.98840191534689,MATH Level 5,0,0,GPQA,0.27013422818792,2.68456375838927,MUSR,0.363333333333333,4.01666666666667,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-12,2024-12-13,1,oopere/pruned60-llama-3.2-3b (Merge),llama3.2,0,3,0.620884220907376 -openai-community/gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.51080708776172,FALSE,IFEval,0.179253270211927,17.9253270211927,BBH,0.303571124421336,2.67498136798699,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.258389261744966,1.11856823266219,MUSR,0.447052083333333,15.3481770833333,MMLU-PRO,0.115940824468085,1.77120271867612,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2,mit,2461,0.137,0.0859412568146148 -openai-community/gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,6.29647106783872,FALSE,IFEval,0.177954494075719,17.7954494075719,BBH,0.301658010676531,2.81591130950851,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.439020833333333,13.9109375,MMLU-PRO,0.116522606382979,1.8358451536643,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-12,0,openai-community/gpt2,mit,2461,0.137,0.117386895248811 +openai-community/gpt2_bfloat16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,bfloat16,pretrained,Original,GPT2LMHeadModel,6.51080708776172,FALSE,IFEval,0.179253270211927,17.9253270211927,BBH,0.303571124421336,2.67498136798699,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.258389261744966,1.11856823266219,MUSR,0.447052083333333,15.3481770833333,MMLU-PRO,0.115940824468085,1.77120271867612,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2,mit,2464,0.137,0.0859412568146148 +openai-community/gpt2_float16_607a30d783dfa663caf39e06633721c8d4cfcd7e_False,openai-community/gpt2,607a30d783dfa663caf39e06633721c8d4cfcd7e,float16,pretrained,Original,GPT2LMHeadModel,6.29647106783872,FALSE,IFEval,0.177954494075719,17.7954494075719,BBH,0.301658010676531,2.81591130950851,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.439020833333333,13.9109375,MMLU-PRO,0.116522606382979,1.8358451536643,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-08-12,0,openai-community/gpt2,mit,2464,0.137,0.117386895248811 openai-community/gpt2-large_bfloat16_32b71b12589c2f8d625668d2335a01cac3249519_False,openai-community/gpt2-large,32b71b12589c2f8d625668d2335a01cac3249519,bfloat16,pretrained,Original,GPT2LMHeadModel,5.47959037520557,FALSE,IFEval,0.204782200117909,20.4782200117909,BBH,0.306884187601188,3.25379054497874,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.259228187919463,1.23042505592841,MUSR,0.378864583333333,5.65807291666667,MMLU-PRO,0.114195478723404,1.57727541371158,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-large,mit,279,0.812,0.180462238431619 openai-community/gpt2-medium_bfloat16_6dcaa7a952f72f9298047fd5137cd6e4f05f41da_False,openai-community/gpt2-medium,6dcaa7a952f72f9298047fd5137cd6e4f05f41da,bfloat16,pretrained,Original,GPT2LMHeadModel,5.8268115862481,FALSE,IFEval,0.220844027181213,22.0844027181213,BBH,0.305028023217627,2.71997223835624,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.26258389261745,1.67785234899329,MUSR,0.388447916666667,6.15598958333333,MMLU-PRO,0.118184840425532,2.0205378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-medium,mit,160,0.38,0.121061915000596 openai-community/gpt2-xl_bfloat16_15ea56dee5df4983c59b2538573817e1667135e2_False,openai-community/gpt2-xl,15ea56dee5df4983c59b2538573817e1667135e2,bfloat16,pretrained,Original,GPT2LMHeadModel,4.98018762739917,FALSE,IFEval,0.203857985700164,20.3857985700164,BBH,0.300857611232608,2.58096064745272,MATH Level 5,0.00302114803625378,0.302114803625378,GPQA,0.258389261744966,1.11856823266219,MUSR,0.370958333333333,4.03645833333333,MMLU-PRO,0.113115026595745,1.45722517730496,TRUE,FALSE,FALSE,FALSE,TRUE,2022-03-02,2024-06-12,0,openai-community/gpt2-xl,mit,318,1.608,0.215313699838485 @@ -2053,8 +2070,10 @@ qingy2019/Qwen2.5-Math-14B-Instruct-Alpha_bfloat16_e24aaa0779b576301bfb62b93789d qingy2019/Qwen2.5-Math-14B-Instruct-Pro_bfloat16_295a9ce370c2bfeabe13f76d52c92f57ff6d0308_True,qingy2019/Qwen2.5-Math-14B-Instruct-Pro,295a9ce370c2bfeabe13f76d52c92f57ff6d0308,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,19.707760053964,TRUE,IFEval,0.192167892303532,19.2167892303532,BBH,0.531868975451991,33.0369041422381,MATH Level 5,0.251510574018127,25.1510574018127,GPQA,0.311241610738255,8.165548098434,MUSR,0.37403125,4.25390625,MMLU-PRO,0.355801196808511,28.4223552009456,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-03,2024-12-03,1,qingy2019/Qwen2.5-Math-14B-Instruct-Pro (Merge),"",0,14.766,1.65956939801447 qingy2019/Qwen2.5-Ultimate-14B-Instruct_bfloat16_3eeba743112bed957ae6dc6a3f880355c8bedb66_True,qingy2019/Qwen2.5-Ultimate-14B-Instruct,3eeba743112bed957ae6dc6a3f880355c8bedb66,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,29.2891239591124,TRUE,IFEval,0.39380177927898,39.380177927898,BBH,0.584156159280425,40.5806006446963,MATH Level 5,0.280211480362538,28.0211480362538,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4135,9.8875,MMLU-PRO,0.492935505319149,43.6595005910166,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-02,2024-12-02,1,qingy2019/Qwen2.5-Ultimate-14B-Instruct (Merge),"",1,14.766,1.95208939714237 qingy2024/Eyas-17B-Instruct_bfloat16_afa6aa65deaef3eeb733e80f0fbffcf6d70a863f_True,qingy2024/Eyas-17B-Instruct,afa6aa65deaef3eeb733e80f0fbffcf6d70a863f,bfloat16,chatmodels,Original,LlamaForCausalLM,32.2521020222894,TRUE,IFEval,0.657458875782923,65.7458875782923,BBH,0.60845500802921,43.8500655327826,MATH Level 5,0.22809667673716,22.809667673716,GPQA,0.314597315436242,8.61297539149888,MUSR,0.452166666666667,15.3541666666667,MMLU-PRO,0.434258643617021,37.1398492907801,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-23,2024-12-23,1,qingy2024/Eyas-17B-Instruct (Merge),"",0,8.715,2.28576089883945 +qingy2024/Falcon3-2x10B-MoE-Instruct_bfloat16_e226b1f0beb60ff1e3770a694af51572b6d95dc5_True,qingy2024/Falcon3-2x10B-MoE-Instruct,e226b1f0beb60ff1e3770a694af51572b6d95dc5,bfloat16,continuouslypretrained,Original,MixtralForCausalLM,35.1686285250607,TRUE,IFEval,0.784978302016428,78.4978302016428,BBH,0.618492572603782,45.0738526590559,MATH Level 5,0.257552870090634,25.7552870090635,GPQA,0.330536912751678,10.738255033557,MUSR,0.428354166666667,12.9109375,MMLU-PRO,0.442320478723404,38.0356087470449,TRUE,TRUE,TRUE,FALSE,FALSE,2024-12-25,2024-12-25,1,qingy2024/Falcon3-2x10B-MoE-Instruct (Merge),apache-2.0,0,9.4,2.19328677762664 qingy2024/Fusion-14B-Instruct_bfloat16_2e15219659b919e04ad5b56bef259489cc264f09_True,qingy2024/Fusion-14B-Instruct,2e15219659b919e04ad5b56bef259489cc264f09,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,37.6442503278293,TRUE,IFEval,0.72597707416322,72.597707416322,BBH,0.639593081216423,48.5798359138013,MATH Level 5,0.309667673716012,30.9667673716012,GPQA,0.354865771812081,13.9821029082774,MUSR,0.440041666666667,14.8052083333333,MMLU-PRO,0.504404920212766,44.9338800236407,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-05,1,qingy2024/Fusion-14B-Instruct (Merge),"",1,14,1.62368095971721 qingy2024/Fusion2-14B-Instruct_bfloat16_df00288ce3d37ef518189c19e7973e71b47ef214_True,qingy2024/Fusion2-14B-Instruct,df00288ce3d37ef518189c19e7973e71b47ef214,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,35.1822684337256,TRUE,IFEval,0.606401015970957,60.6401015970957,BBH,0.611852372286455,44.7670438308547,MATH Level 5,0.308157099697885,30.8157099697885,GPQA,0.344798657718121,12.6398210290828,MUSR,0.463385416666667,17.2231770833333,MMLU-PRO,0.505069813829787,45.0077570921986,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-05,2024-12-06,1,qingy2024/Fusion2-14B-Instruct (Merge),"",1,14.766,1.66866594603866 +qingy2024/Fusion4-14B-Instruct_float16_3f3c7178006857d7fdf942ab7e86bd2b0d7b624d_True,qingy2024/Fusion4-14B-Instruct,3f3c7178006857d7fdf942ab7e86bd2b0d7b624d,float16,chatmodels,Original,Qwen2ForCausalLM,38.733953059072,TRUE,IFEval,0.764894923248093,76.4894923248093,BBH,0.654252046947762,50.6958556395896,MATH Level 5,0.339123867069486,33.9123867069486,GPQA,0.330536912751678,10.738255033557,MUSR,0.432572916666667,13.9716145833333,MMLU-PRO,0.519365026595745,46.5961140661939,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,1,qingy2024/Fusion4-14B-Instruct (Merge),"",0,7.385,1.82283054036158 qingy2024/QwQ-14B-Math-v0.2_float16_308f732e0f2c1ac9e416e9c1e0523c0198ac658c_True,qingy2024/QwQ-14B-Math-v0.2,308f732e0f2c1ac9e416e9c1e0523c0198ac658c,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,24.0889902509765,TRUE,IFEval,0.339096929480445,33.9096929480445,BBH,0.573097955260854,39.0992137429518,MATH Level 5,0.190332326283988,19.0332326283988,GPQA,0.26258389261745,1.67785234899329,MUSR,0.40209375,8.59505208333333,MMLU-PRO,0.479970079787234,42.2188977541371,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-20,2024-12-23,2,Qwen/Qwen2.5-14B,apache-2.0,14,7.385,3.41117129475758 qingy2024/Qwen2.5-Math-14B-Instruct-Alpha_float16_c82727eb404d3d55450759301b80f838e4d3e1fc_True,qingy2024/Qwen2.5-Math-14B-Instruct-Alpha,c82727eb404d3d55450759301b80f838e4d3e1fc,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,32.2153945754645,TRUE,IFEval,0.770440209754562,77.0440209754562,BBH,0.646486159387426,50.1795027462589,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.348993288590604,13.1991051454139,MUSR,0.40209375,8.72838541666667,MMLU-PRO,0.496592420212766,44.0658244680851,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-03,2024-12-10,2,Qwen/Qwen2.5-14B,apache-2.0,1,14,1.56934662160497 qingy2024/Qwen2.5-Math-14B-Instruct-Preview_float16_7b9e9b94d69f0de9627f728e9328fb394f7fea14_True,qingy2024/Qwen2.5-Math-14B-Instruct-Preview,7b9e9b94d69f0de9627f728e9328fb394f7fea14,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,31.987593150848,TRUE,IFEval,0.782580220481655,78.2580220481655,BBH,0.629394224593443,47.0508075682843,MATH Level 5,0,0,GPQA,0.340604026845638,12.0805369127517,MUSR,0.411458333333333,10.165625,MMLU-PRO,0.499335106382979,44.3705673758865,TRUE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-10,3,Qwen/Qwen2.5-14B,apache-2.0,1,14,1.61898032712152 @@ -2075,7 +2094,7 @@ recoilme/recoilme-gemma-2-9B-v0.3_float16_772cab46d9d22cbcc3c574d193021803ce5c44 recoilme/recoilme-gemma-2-9B-v0.3_bfloat16_76c8fb761660e6eb237c91bb6e6761ee36266bba_False,recoilme/recoilme-gemma-2-9B-v0.3,76c8fb761660e6eb237c91bb6e6761ee36266bba,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,30.1116383212597,FALSE,IFEval,0.57607592299543,57.607592299543,BBH,0.601982710105885,43.3268682962836,MATH Level 5,0.172960725075529,17.2960725075529,GPQA,0.337248322147651,11.6331096196868,MUSR,0.463229166666667,17.0369791666667,MMLU-PRO,0.403922872340426,33.7692080378251,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-18,2024-09-27,0,recoilme/recoilme-gemma-2-9B-v0.3,cc-by-nc-4.0,3,10.159,2.55534970855255 recoilme/recoilme-gemma-2-9B-v0.4_bfloat16_2691f2cc8d80072f15d78cb7ae72831e1a12139e_False,recoilme/recoilme-gemma-2-9B-v0.4,2691f2cc8d80072f15d78cb7ae72831e1a12139e,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,24.1003632168539,FALSE,IFEval,0.25618913372075,25.618913372075,BBH,0.596728583355488,42.4424816754251,MATH Level 5,0.0823262839879154,8.23262839879154,GPQA,0.340604026845638,12.0805369127517,MUSR,0.4726875,18.3859375,MMLU-PRO,0.440575132978723,37.8416814420804,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-18,2024-09-19,0,recoilme/recoilme-gemma-2-9B-v0.4,cc-by-nc-4.0,2,10.159,2.91891024220838 recoilme/recoilme-gemma-2-9B-v0.5_float16_b4035d3a16486dae4f726eb953be959a4573ea67_True,recoilme/recoilme-gemma-2-9B-v0.5,b4035d3a16486dae4f726eb953be959a4573ea67,float16,chatmodels,Original,Gemma2ForCausalLM,30.0577620055673,TRUE,IFEval,0.766418658049531,76.6418658049531,BBH,0.5981472549925,42.3533554065342,MATH Level 5,0.0211480362537764,2.11480362537764,GPQA,0.336409395973154,11.5212527964206,MUSR,0.423177083333333,12.1638020833333,MMLU-PRO,0.419963430851064,35.5514923167849,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-26,2024-11-26,1,recoilme/recoilme-gemma-2-9B-v0.5 (Merge),"",0,10.159,3.86674425617504 -redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS_bfloat16_1523f26adec368380647e864dd2e9fa79f36fefe_True,redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS,1523f26adec368380647e864dd2e9fa79f36fefe,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.37371795391,TRUE,IFEval,0.535959033143171,53.5959033143171,BBH,0.512884099805285,29.9659323107153,MATH Level 5,0.0891238670694864,8.91238670694864,GPQA,0.315436241610738,8.7248322147651,MUSR,0.38178125,8.82265625,MMLU-PRO,0.317985372340426,24.220596926714,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-05,2024-12-12,1,redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS (Merge),apache-2.0,6,12,1.09584828785617 +redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS_bfloat16_1523f26adec368380647e864dd2e9fa79f36fefe_True,redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS,1523f26adec368380647e864dd2e9fa79f36fefe,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.37371795391,TRUE,IFEval,0.535959033143171,53.5959033143171,BBH,0.512884099805285,29.9659323107153,MATH Level 5,0.0891238670694864,8.91238670694864,GPQA,0.315436241610738,8.7248322147651,MUSR,0.38178125,8.82265625,MMLU-PRO,0.317985372340426,24.220596926714,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-05,2024-12-12,1,redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS (Merge),apache-2.0,7,12,1.09584828785617 redrix/patricide-12B-Unslop-Mell_bfloat16_2f1a849859a24da80bd1f938a2ac6ab627ef75e8_False,redrix/patricide-12B-Unslop-Mell,2f1a849859a24da80bd1f938a2ac6ab627ef75e8,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,22.9085375547461,FALSE,IFEval,0.407390169195512,40.7390169195512,BBH,0.539866686585362,33.9894476074595,MATH Level 5,0.124622356495468,12.4622356495468,GPQA,0.323825503355705,9.84340044742729,MUSR,0.402583333333333,11.85625,MMLU-PRO,0.357047872340426,28.5608747044917,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-01,2024-12-12,1,redrix/patricide-12B-Unslop-Mell (Merge),apache-2.0,5,12,1.02955491130521 refuelai/Llama-3-Refueled_bfloat16_ff6d1c3ba37b31d4af421951c2300f2256fb3691_True,refuelai/Llama-3-Refueled,ff6d1c3ba37b31d4af421951c2300f2256fb3691,bfloat16,chatmodels,Original,LlamaForCausalLM,22.8038048017426,TRUE,IFEval,0.461995283625226,46.1995283625226,BBH,0.587076620170505,41.721971003391,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.299496644295302,6.59955257270694,MUSR,0.44540625,14.6424479166667,MMLU-PRO,0.309507978723404,23.2786643026005,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-03,2024-06-12,0,refuelai/Llama-3-Refueled,cc-by-nc-4.0,189,8.03,0.875985833377866 rhplus0831/maid-yuzu-v7_bfloat16_a0bd8c707bb80024778da4a0d057917faa53d2f6_True,rhplus0831/maid-yuzu-v7,a0bd8c707bb80024778da4a0d057917faa53d2f6,bfloat16,chatmodels,Original,MixtralForCausalLM,24.4819301245243,TRUE,IFEval,0.646243079473575,64.6243079473575,BBH,0.480491692312673,26.8198371046094,MATH Level 5,0.0951661631419939,9.51661631419939,GPQA,0.309563758389262,7.94183445190157,MUSR,0.413625,9.76979166666667,MMLU-PRO,0.353972739361702,28.2191932624114,FALSE,FALSE,FALSE,FALSE,FALSE,2024-02-09,2024-09-08,1,rhplus0831/maid-yuzu-v7 (Merge),"",1,46.703,4.1042853231815 @@ -2088,13 +2107,13 @@ rombodawg/Rombos-LLM-V2.5-Qwen-0.5b_bfloat16_aae2e55548c8090ce357c64ca78e8b9ef6b rombodawg/Rombos-LLM-V2.5-Qwen-1.5b_bfloat16_1f634da015ed671efe7dc574bc2a1954f5b2cc93_False,rombodawg/Rombos-LLM-V2.5-Qwen-1.5b,1f634da015ed671efe7dc574bc2a1954f5b2cc93,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,16.1655641449128,FALSE,IFEval,0.340246102563421,34.0246102563421,BBH,0.425670314586439,18.7113437839723,MATH Level 5,0.0740181268882175,7.40181268882175,GPQA,0.288590604026846,5.14541387024609,MUSR,0.418552083333333,10.35234375,MMLU-PRO,0.292220744680851,21.3578605200946,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-09-29,1,rombodawg/Rombos-LLM-V2.5-Qwen-1.5b (Merge),apache-2.0,4,1.777,0.740357996195001 rombodawg/Rombos-LLM-V2.5-Qwen-14b_bfloat16_834ddb1712ae6d1b232b2d5b26be658d90d23e43_False,rombodawg/Rombos-LLM-V2.5-Qwen-14b,834ddb1712ae6d1b232b2d5b26be658d90d23e43,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,34.7300596437434,FALSE,IFEval,0.584044778964259,58.4044778964259,BBH,0.648108626166965,49.3869002714448,MATH Level 5,0.169184290030212,16.9184290030212,GPQA,0.371644295302013,16.2192393736018,MUSR,0.471729166666667,18.8328125,MMLU-PRO,0.537566489361702,48.6184988179669,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-09-29,1,rombodawg/Rombos-LLM-V2.5-Qwen-14b (Merge),apache-2.0,6,14.77,2.18269986161066 rombodawg/Rombos-LLM-V2.5-Qwen-32b_bfloat16_234abe4b494dbe83ba805b791f74feb33462a33d_False,rombodawg/Rombos-LLM-V2.5-Qwen-32b,234abe4b494dbe83ba805b791f74feb33462a33d,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,44.57420016657,FALSE,IFEval,0.682663111654854,68.2663111654854,BBH,0.70455370708598,58.2618940867874,MATH Level 5,0.419939577039275,41.9939577039275,GPQA,0.396812080536913,19.5749440715884,MUSR,0.503416666666667,24.7270833333333,MMLU-PRO,0.591589095744681,54.6210106382979,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-10-07,1,rombodawg/Rombos-LLM-V2.5-Qwen-32b (Merge),apache-2.0,43,32.764,17.9126897235194 -rombodawg/Rombos-LLM-V2.5-Qwen-3b_bfloat16_26601a8da5afce3b5959d91bdd0faaab6df8bf95_False,rombodawg/Rombos-LLM-V2.5-Qwen-3b,26601a8da5afce3b5959d91bdd0faaab6df8bf95,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1831113569493,FALSE,IFEval,0.534235827604091,53.4235827604091,BBH,0.480889624636847,27.2135969511257,MATH Level 5,0.0551359516616314,5.51359516616314,GPQA,0.307885906040268,7.71812080536913,MUSR,0.404166666666667,8.55416666666667,MMLU-PRO,0.37608045212766,30.6756057919622,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-09-29,1,rombodawg/Rombos-LLM-V2.5-Qwen-3b (Merge),other,3,3.397,1.005794477103 +rombodawg/Rombos-LLM-V2.5-Qwen-3b_bfloat16_26601a8da5afce3b5959d91bdd0faaab6df8bf95_False,rombodawg/Rombos-LLM-V2.5-Qwen-3b,26601a8da5afce3b5959d91bdd0faaab6df8bf95,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.1831113569493,FALSE,IFEval,0.534235827604091,53.4235827604091,BBH,0.480889624636847,27.2135969511257,MATH Level 5,0.0551359516616314,5.51359516616314,GPQA,0.307885906040268,7.71812080536913,MUSR,0.404166666666667,8.55416666666667,MMLU-PRO,0.37608045212766,30.6756057919622,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-09-29,1,rombodawg/Rombos-LLM-V2.5-Qwen-3b (Merge),other,4,3.397,1.005794477103 rombodawg/Rombos-LLM-V2.5-Qwen-72b_bfloat16_5260f182e7859e13d515c4cb3926ac85ad057504_True,rombodawg/Rombos-LLM-V2.5-Qwen-72b,5260f182e7859e13d515c4cb3926ac85ad057504,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,45.9092456451536,TRUE,IFEval,0.715535889218385,71.5535889218385,BBH,0.722958906578849,61.2671450457366,MATH Level 5,0.506797583081571,50.6797583081571,GPQA,0.398489932885906,19.7986577181208,MUSR,0.459916666666667,17.3229166666667,MMLU-PRO,0.593500664893617,54.8334072104019,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-30,2024-12-19,1,rombodawg/Rombos-LLM-V2.5-Qwen-72b (Merge),other,32,36.353,16.0339456258967 rombodawg/Rombos-LLM-V2.5-Qwen-7b_bfloat16_dbd819e8f765181f774cb5b79812d081669eb302_False,rombodawg/Rombos-LLM-V2.5-Qwen-7b,dbd819e8f765181f774cb5b79812d081669eb302,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,31.1123483495661,FALSE,IFEval,0.623711751486057,62.3711751486057,BBH,0.554388504690359,36.3723504143006,MATH Level 5,0.283232628398792,28.3232628398792,GPQA,0.317953020134228,9.06040268456376,MUSR,0.42909375,12.0033854166667,MMLU-PRO,0.446891622340426,38.5435135933806,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-09-29,1,rombodawg/Rombos-LLM-V2.5-Qwen-7b (Merge),apache-2.0,15,7.616,1.31708405545612 rombodawg/Rombos-LLM-V2.5.1-Qwen-3b_bfloat16_a3305ce148f4273ab334052ab47d3aebb51d104c_False,rombodawg/Rombos-LLM-V2.5.1-Qwen-3b,a3305ce148f4273ab334052ab47d3aebb51d104c,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,13.3571249720534,FALSE,IFEval,0.259512537844032,25.9512537844032,BBH,0.388404302465666,14.8814091844514,MATH Level 5,0.0913897280966768,9.13897280966768,GPQA,0.274328859060403,3.24384787472036,MUSR,0.399114583333333,7.82265625,MMLU-PRO,0.271941489361702,19.104609929078,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-08,2024-10-08,1,rombodawg/Rombos-LLM-V2.5.1-Qwen-3b (Merge),other,1,3.397,0.929243868572982 rombodawg/Rombos-LLM-V2.5.1-Qwen-3b_float16_b65848c13b31f5b9d5d953df95d504d195082a3b_False,rombodawg/Rombos-LLM-V2.5.1-Qwen-3b,b65848c13b31f5b9d5d953df95d504d195082a3b,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,13.130246819292,FALSE,IFEval,0.256640159221976,25.6640159221976,BBH,0.390008397403765,15.0577444820961,MATH Level 5,0.0921450151057402,9.21450151057402,GPQA,0.26258389261745,1.67785234899329,MUSR,0.399114583333333,7.82265625,MMLU-PRO,0.274102393617021,19.3447104018913,TRUE,TRUE,FALSE,FALSE,FALSE,2024-10-08,2024-11-14,1,rombodawg/Rombos-LLM-V2.5.1-Qwen-3b (Merge),other,1,3.397,1.95403065052004 rombodawg/Rombos-LLM-V2.6-Nemotron-70b_bfloat16_951c9cdf68d6e679c78625d1a1f396eb71cdf746_False,rombodawg/Rombos-LLM-V2.6-Nemotron-70b,951c9cdf68d6e679c78625d1a1f396eb71cdf746,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,41.933642375789,FALSE,IFEval,0.752655177152179,75.2655177152179,BBH,0.693769948258033,55.8055734251465,MATH Level 5,0.332326283987915,33.2326283987915,GPQA,0.406040268456376,20.8053691275168,MUSR,0.466864583333333,18.39140625,MMLU-PRO,0.532912234042553,48.1013593380615,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-17,2024-10-17,0,rombodawg/Rombos-LLM-V2.6-Nemotron-70b,llama3.1,3,70.554,11.9507744668539 -rombodawg/Rombos-LLM-V2.6-Qwen-14b_bfloat16_887910d75a1837b8b8c7c3e50a257517d286ec60_True,rombodawg/Rombos-LLM-V2.6-Qwen-14b,887910d75a1837b8b8c7c3e50a257517d286ec60,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,33.7023663437699,TRUE,IFEval,0.843155050820711,84.3155050820711,BBH,0.644209659634489,49.2785176403309,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.333892617449664,11.1856823266219,MUSR,0.4220625,12.2911458333333,MMLU-PRO,0.49609375,44.0104166666667,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-12,2024-12-07,1,rombodawg/Rombos-LLM-V2.6-Qwen-14b (Merge),apache-2.0,47,14.77,3.71574997699498 +rombodawg/Rombos-LLM-V2.6-Qwen-14b_bfloat16_887910d75a1837b8b8c7c3e50a257517d286ec60_True,rombodawg/Rombos-LLM-V2.6-Qwen-14b,887910d75a1837b8b8c7c3e50a257517d286ec60,bfloat16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,33.7023663437699,TRUE,IFEval,0.843155050820711,84.3155050820711,BBH,0.644209659634489,49.2785176403309,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.333892617449664,11.1856823266219,MUSR,0.4220625,12.2911458333333,MMLU-PRO,0.49609375,44.0104166666667,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-12,2024-12-07,1,rombodawg/Rombos-LLM-V2.6-Qwen-14b (Merge),apache-2.0,48,14.77,3.71574997699498 rombodawg/rombos_Replete-Coder-Instruct-8b-Merged_bfloat16_85ad1fb943d73866ba5c8dcfe4a4f2cbfba12d4d_True,rombodawg/rombos_Replete-Coder-Instruct-8b-Merged,85ad1fb943d73866ba5c8dcfe4a4f2cbfba12d4d,bfloat16,basemergesandmoerges,Original,LlamaForCausalLM,16.4338239876319,TRUE,IFEval,0.538757164323994,53.8757164323994,BBH,0.446169386007583,21.9377065782727,MATH Level 5,0.0777945619335348,7.77945619335348,GPQA,0.269295302013423,2.57270693512304,MUSR,0.36603125,3.45390625,MMLU-PRO,0.180851063829787,8.98345153664303,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-10-14,0,rombodawg/rombos_Replete-Coder-Instruct-8b-Merged,apache-2.0,1,8.03,0.964128193317057 rombodawg/rombos_Replete-Coder-Llama3-8B_bfloat16_938a45789cf94821ef6b12c98dc76622a0fa936a_True,rombodawg/rombos_Replete-Coder-Llama3-8B,938a45789cf94821ef6b12c98dc76622a0fa936a,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,11.8325635028728,TRUE,IFEval,0.471412518783495,47.1412518783495,BBH,0.327627710252668,7.08784511784512,MATH Level 5,0.0309667673716012,3.09667673716012,GPQA,0.266778523489933,2.23713646532438,MUSR,0.396635416666667,7.71276041666667,MMLU-PRO,0.133477393617021,3.71971040189125,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-06,2024-10-14,0,rombodawg/rombos_Replete-Coder-Llama3-8B,other,2,8.03,1.2056020933418 rwitz/go-bruins-v2_float16_6d9e57d3a36dbad364ec77ca642873d9fc7fd61c_True,rwitz/go-bruins-v2,6d9e57d3a36dbad364ec77ca642873d9fc7fd61c,float16,chatmodels,Original,MistralForCausalLM,15.4213790816555,TRUE,IFEval,0.409588779992642,40.9588779992642,BBH,0.379884468410897,12.6932601876857,MATH Level 5,0.0664652567975831,6.64652567975831,GPQA,0.26258389261745,1.67785234899329,MUSR,0.41375,10.9854166666667,MMLU-PRO,0.276097074468085,19.566341607565,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-06-26,0,Removed,"",0,7.242,0.637819720781267 @@ -2158,6 +2177,7 @@ sometimesanotion/Qwenvergence-14B-v3_bfloat16_40c489fd71724f2fa3f7154e4874c6d007 sometimesanotion/Qwenvergence-14B-v3-Prose_bfloat16_15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b_False,sometimesanotion/Qwenvergence-14B-v3-Prose,15e4222295ef31aee17c2e5b6e7a31ffd21e3c7b,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,37.3708094176769,FALSE,IFEval,0.49177072390147,49.177072390147,BBH,0.651291317094932,49.7983666809914,MATH Level 5,0.355740181268882,35.5740181268882,GPQA,0.39513422818792,19.3512304250559,MUSR,0.493895833333333,21.7703125,MMLU-PRO,0.536984707446809,48.5538563829787,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-21,2024-12-21,1,sometimesanotion/Qwenvergence-14B-v3-Prose (Merge),apache-2.0,2,7.383,1.71134135251856 sometimesanotion/Qwenvergence-14B-v3-Reason_float16_1e613b0e6bfdb08e7c21a3e6ba3b84e361cf8350_False,sometimesanotion/Qwenvergence-14B-v3-Reason,1e613b0e6bfdb08e7c21a3e6ba3b84e361cf8350,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,37.0468000181585,FALSE,IFEval,0.536683776823273,53.6683776823274,BBH,0.656128395746618,50.6944479886705,MATH Level 5,0.324018126888218,32.4018126888218,GPQA,0.386744966442953,18.2326621923937,MUSR,0.474020833333333,18.4526041666667,MMLU-PRO,0.539478058510638,48.8308953900709,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,7.383,1.89560397778342 sometimesanotion/Qwenvergence-14B-v3-Reason_bfloat16_6acf3cbc9c36b19d66ac683f073e32a9bf86d56e_False,sometimesanotion/Qwenvergence-14B-v3-Reason,6acf3cbc9c36b19d66ac683f073e32a9bf86d56e,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.7140481268604,FALSE,IFEval,0.527816194364287,52.7816194364287,BBH,0.655743756682434,50.6357761372748,MATH Level 5,0.311933534743202,31.1933534743202,GPQA,0.384228187919463,17.8970917225951,MUSR,0.475416666666667,18.9270833333333,MMLU-PRO,0.539644281914894,48.8493646572104,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-21,0,Removed,"",0,7.383,1.92617191333061 +sometimesanotion/Qwenvergence-14B-v6-Prose_bfloat16_bbb6b0900b630a3120d036d3434ca0fa508ed559_False,sometimesanotion/Qwenvergence-14B-v6-Prose,bbb6b0900b630a3120d036d3434ca0fa508ed559,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,38.8249662267441,FALSE,IFEval,0.599007300628998,59.9007300628998,BBH,0.65437502308072,50.1199760400256,MATH Level 5,0.348942598187311,34.8942598187311,GPQA,0.388422818791946,18.4563758389262,MUSR,0.48865625,21.0153645833333,MMLU-PRO,0.537067819148936,48.5630910165485,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-26,2024-12-26,1,sometimesanotion/Qwenvergence-14B-v6-Prose (Merge),apache-2.0,0,7.383,1.93526414003491 sometimesanotion/lamarck-14b-prose-model_stock_bfloat16_d71942f5b5471fca97914ea26a9f66bb5866693e_False,sometimesanotion/lamarck-14b-prose-model_stock,d71942f5b5471fca97914ea26a9f66bb5866693e,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,35.5898576058715,FALSE,IFEval,0.427648638944667,42.7648638944667,BBH,0.648762158566534,49.383875963762,MATH Level 5,0.336102719033233,33.6102719033233,GPQA,0.393456375838926,19.1275167785235,MUSR,0.48459375,20.27421875,MMLU-PRO,0.535405585106383,48.3783983451537,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-09,0,Removed,"",0,14.766,1.55751948598314 sometimesanotion/lamarck-14b-reason-model_stock_bfloat16_0f1d7f04b9219ffe3bc26aa3146380fba249d61a_False,sometimesanotion/lamarck-14b-reason-model_stock,0f1d7f04b9219ffe3bc26aa3146380fba249d61a,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,36.2563275132583,FALSE,IFEval,0.496467151602193,49.6467151602193,BBH,0.656889854140825,50.715404125685,MATH Level 5,0.31570996978852,31.570996978852,GPQA,0.384228187919463,17.8970917225951,MUSR,0.474083333333333,18.79375,MMLU-PRO,0.540226063829787,48.9140070921986,FALSE,FALSE,FALSE,FALSE,FALSE,"",2024-12-09,0,Removed,"",0,14.766,7.94839884559841 sonthenguyen/ft-unsloth-zephyr-sft-bnb-4bit-20241014-161415_float16_467eff1ac1c3395c130929bbe1f34a8194715e7c_True,sonthenguyen/ft-unsloth-zephyr-sft-bnb-4bit-20241014-161415,467eff1ac1c3395c130929bbe1f34a8194715e7c,float16,chatmodels,Adapter,?,8.8268740255258,TRUE,IFEval,0.289337845804687,28.9337845804687,BBH,0.380418168868286,12.7892123094856,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.246644295302013,0,MUSR,0.3860625,6.02447916666667,MMLU-PRO,0.140126329787234,4.45848108747045,TRUE,FALSE,FALSE,FALSE,FALSE,2024-10-15,2024-10-16,1,unsloth/zephyr-sft-bnb-4bit,apache-2.0,0,7.723,1.62771156469603 @@ -2181,13 +2201,14 @@ spow12/ChatWaifu_v2.0_22B_bfloat16_a6e7c206d9af77d3f85faf0ce4a711d62815b2ab_True ssmits/Qwen2.5-95B-Instruct_bfloat16_9c0e7df57a4fcf4d364efd916a0fc0abdd2d20a3_True,ssmits/Qwen2.5-95B-Instruct,9c0e7df57a4fcf4d364efd916a0fc0abdd2d20a3,bfloat16,chatmodels,Original,Qwen2ForCausalLM,37.4401249883746,TRUE,IFEval,0.843105183136301,84.3105183136301,BBH,0.703779969748824,58.5303513228511,MATH Level 5,0.061178247734139,6.1178247734139,GPQA,0.364093959731544,15.2125279642058,MUSR,0.428385416666667,13.61484375,MMLU-PRO,0.521692154255319,46.8546838061466,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-24,2024-09-26,1,ssmits/Qwen2.5-95B-Instruct (Merge),other,3,94.648,19.2334948028144 stabilityai/StableBeluga2_bfloat16_cb47d3db70ea3ddc2cabdeb358c303b328f65900_False,stabilityai/StableBeluga2,cb47d3db70ea3ddc2cabdeb358c303b328f65900,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.6828417931441,FALSE,IFEval,0.378714034317832,37.8714034317832,BBH,0.582412813455381,41.2632611272238,MATH Level 5,0.0362537764350453,3.62537764350453,GPQA,0.316275167785235,8.83668903803132,MUSR,0.47296875,18.6544270833333,MMLU-PRO,0.332613031914894,25.8458924349882,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-20,2024-06-13,0,stabilityai/StableBeluga2,"",884,68.977,6.25467365604401 stabilityai/stablelm-2-12b_bfloat16_fead13ddbf4492970666650c3cd6f85f485411ec_False,stabilityai/stablelm-2-12b,fead13ddbf4492970666650c3cd6f85f485411ec,bfloat16,pretrained,Original,StableLmForCausalLM,13.9357224770686,FALSE,IFEval,0.156921412962052,15.6921412962052,BBH,0.450865417111477,22.685797482044,MATH Level 5,0.0392749244712991,3.92749244712991,GPQA,0.278523489932886,3.80313199105145,MUSR,0.447885416666667,14.4856770833333,MMLU-PRO,0.30718085106383,23.0200945626478,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-21,2024-06-12,0,stabilityai/stablelm-2-12b,other,116,12.143,1.47327922426156 -stabilityai/stablelm-2-12b-chat_bfloat16_b6b62cd451b84e848514c00fafa66d9ead9297c5_True,stabilityai/stablelm-2-12b-chat,b6b62cd451b84e848514c00fafa66d9ead9297c5,bfloat16,chatmodels,Original,StableLmForCausalLM,16.2494771147373,TRUE,IFEval,0.408164780560025,40.8164780560025,BBH,0.467202473128281,25.2536970908126,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.266778523489933,2.23713646532438,MUSR,0.391427083333333,7.72838541666667,MMLU-PRO,0.2734375,19.2708333333333,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-04,2024-06-12,0,stabilityai/stablelm-2-12b-chat,other,86,12.143,1.08809668593683 +stabilityai/stablelm-2-12b-chat_bfloat16_b6b62cd451b84e848514c00fafa66d9ead9297c5_True,stabilityai/stablelm-2-12b-chat,b6b62cd451b84e848514c00fafa66d9ead9297c5,bfloat16,chatmodels,Original,StableLmForCausalLM,16.2494771147373,TRUE,IFEval,0.408164780560025,40.8164780560025,BBH,0.467202473128281,25.2536970908126,MATH Level 5,0.0219033232628399,2.19033232628399,GPQA,0.266778523489933,2.23713646532438,MUSR,0.391427083333333,7.72838541666667,MMLU-PRO,0.2734375,19.2708333333333,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-04,2024-06-12,0,stabilityai/stablelm-2-12b-chat,other,87,12.143,1.08809668593683 stabilityai/stablelm-2-1_6b_float16_8879812cccd176fbbe9ceb747b815bcc7d6499f8_False,stabilityai/stablelm-2-1_6b,8879812cccd176fbbe9ceb747b815bcc7d6499f8,float16,pretrained,Original,StableLmForCausalLM,5.21612653885089,FALSE,IFEval,0.115705217711228,11.5705217711228,BBH,0.338457720511071,8.63269520496884,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.248322147651007,0,MUSR,0.388197916666667,5.79140625,MMLU-PRO,0.146359707446809,5.15107860520095,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-18,2024-06-12,0,stabilityai/stablelm-2-1_6b,other,187,1.645,0.549871827675722 stabilityai/stablelm-2-1_6b-chat_bfloat16_f3fe67057c2789ae1bb1fe42b038da99840d4f13_True,stabilityai/stablelm-2-1_6b-chat,f3fe67057c2789ae1bb1fe42b038da99840d4f13,bfloat16,chatmodels,Original,StableLmForCausalLM,8.64077458938206,TRUE,IFEval,0.305999193251683,30.5999193251683,BBH,0.339017239548652,7.49337829741063,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.24748322147651,0,MUSR,0.35796875,5.71276041666667,MMLU-PRO,0.162150930851064,6.90565898345154,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-08,2024-06-12,0,stabilityai/stablelm-2-1_6b-chat,other,32,1.645,0.495426508518865 stabilityai/stablelm-2-zephyr-1_6b_float16_2f275b1127d59fc31e4f7c7426d528768ada9ea4_True,stabilityai/stablelm-2-zephyr-1_6b,2f275b1127d59fc31e4f7c7426d528768ada9ea4,float16,chatmodels,Original,StableLmForCausalLM,9.28193395617311,TRUE,IFEval,0.327931000855508,32.7931000855508,BBH,0.335160870628073,6.70871014793823,MATH Level 5,0.0226586102719033,2.26586102719033,GPQA,0.243288590604027,0,MUSR,0.351145833333333,5.99322916666667,MMLU-PRO,0.171376329787234,7.93070330969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-19,2024-06-12,0,stabilityai/stablelm-2-zephyr-1_6b,other,181,1.645,0.473088662740942 stabilityai/stablelm-3b-4e1t_bfloat16_fa4a6a92fca83c3b4223a3c9bf792887090ebfba_False,stabilityai/stablelm-3b-4e1t,fa4a6a92fca83c3b4223a3c9bf792887090ebfba,bfloat16,pretrained,Original,StableLmForCausalLM,7.26325070759698,FALSE,IFEval,0.220319862409518,22.0319862409518,BBH,0.350421141582691,9.01307034954628,MATH Level 5,0.006797583081571,0.6797583081571,GPQA,0.23741610738255,0,MUSR,0.37778125,4.42265625,MMLU-PRO,0.16688829787234,7.43203309692671,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-29,2024-08-10,0,stabilityai/stablelm-3b-4e1t,cc-by-sa-4.0,309,2.795,0.434265126393168 stabilityai/stablelm-zephyr-3b_bfloat16_a14f62d95754d96aea2be6e24c0f6966636797b9_True,stabilityai/stablelm-zephyr-3b,a14f62d95754d96aea2be6e24c0f6966636797b9,bfloat16,chatmodels,Original,StableLmForCausalLM,12.356618845486,TRUE,IFEval,0.368322717057408,36.8322717057408,BBH,0.386636144283787,14.7591192080273,MATH Level 5,0.0422960725075529,4.22960725075529,GPQA,0.239093959731544,0,MUSR,0.418302083333333,9.78776041666667,MMLU-PRO,0.176778590425532,8.53095449172577,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-21,2024-06-12,0,stabilityai/stablelm-zephyr-3b,other,249,2.795,0.38402363149593 sthenno-com/miscii-14b-1028_bfloat16_a60c866621ee35d04e84cf366e972f2466d617b1_True,sthenno-com/miscii-14b-1028,a60c866621ee35d04e84cf366e972f2466d617b1,bfloat16,chatmodels,Original,Qwen2ForCausalLM,35.0544159891224,TRUE,IFEval,0.82367119243607,82.367119243607,BBH,0.64483340535341,49.2626676555747,MATH Level 5,0.0634441087613293,6.34441087613293,GPQA,0.356543624161074,14.2058165548098,MUSR,0.41815625,12.0028645833333,MMLU-PRO,0.515292553191489,46.1436170212766,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-12,2024-11-17,1,sthenno-com/miscii-14b-1028 (Merge),apache-2.0,16,14.77,1.53372828900934 +sthenno-com/miscii-14b-1225_bfloat16_3d26f676424307cc2496c6b11710bbfa35275685_True,sthenno-com/miscii-14b-1225,3d26f676424307cc2496c6b11710bbfa35275685,bfloat16,chatmodels,Original,Qwen2ForCausalLM,40.0836508904516,TRUE,IFEval,0.787800812954073,78.7800812954073,BBH,0.657170898840738,50.9128057269024,MATH Level 5,0.31570996978852,31.570996978852,GPQA,0.37751677852349,17.0022371364653,MUSR,0.436572916666667,14.7716145833333,MMLU-PRO,0.527177526595745,47.4641696217494,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-24,2024-12-24,1,sthenno-com/miscii-14b-1225 (Merge),apache-2.0,5,7.383,1.44849724600296 suayptalha/HomerCreativeAnvita-Mix-Qw7B_bfloat16_5be9b48b59652687d3e5b88f9e935b51869756ad_True,suayptalha/HomerCreativeAnvita-Mix-Qw7B,5be9b48b59652687d3e5b88f9e935b51869756ad,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,34.6209777006466,TRUE,IFEval,0.780781659330576,78.0781659330576,BBH,0.556465318149032,36.9841675036238,MATH Level 5,0.310422960725076,31.0422960725076,GPQA,0.314597315436242,8.61297539149888,MUSR,0.44159375,14.7325520833333,MMLU-PRO,0.444481382978723,38.2757092198582,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-22,2024-11-24,1,suayptalha/HomerCreativeAnvita-Mix-Qw7B (Merge),apache-2.0,9,7.616,0.649880690265609 suayptalha/Komodo-Llama-3.2-3B-v2-fp16_float16_1ff4b55d952597429c249ca71dc08b823eba17c0_True,suayptalha/Komodo-Llama-3.2-3B-v2-fp16,1ff4b55d952597429c249ca71dc08b823eba17c0,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,19.5872620510565,TRUE,IFEval,0.634053201062071,63.4053201062071,BBH,0.43549964909075,20.2043289735504,MATH Level 5,0.0626888217522659,6.26888217522659,GPQA,0.277684563758389,3.69127516778523,MUSR,0.340572916666667,3.37161458333333,MMLU-PRO,0.285239361702128,20.5821513002364,TRUE,FALSE,FALSE,FALSE,FALSE,2024-11-19,2024-11-19,1,suayptalha/Komodo-Llama-3.2-3B-v2-fp16 (Merge),apache-2.0,5,3,0.598064763597242 suayptalha/Rombos-2.5-T.E-8.1_bfloat16_c0ee2950b07377e1d0e01fc013a0f200b0306ea2_True,suayptalha/Rombos-2.5-T.E-8.1,c0ee2950b07377e1d0e01fc013a0f200b0306ea2,bfloat16,basemergesandmoerges,Original,Qwen2ForCausalLM,27.3351789287742,TRUE,IFEval,0.692504776215996,69.2504776215996,BBH,0.551464124947837,36.4998612058804,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.311241610738255,8.165548098434,MUSR,0.416635416666667,10.9794270833333,MMLU-PRO,0.444564494680851,38.2849438534279,TRUE,TRUE,FALSE,FALSE,FALSE,2024-11-16,2024-11-16,1,suayptalha/Rombos-2.5-T.E-8.1 (Merge),cc-by-nc-sa-4.0,6,7.616,0.686015561357919 @@ -2232,16 +2253,17 @@ thomas-yanxin/XinYuan-Qwen2-1_5B_float16_a01b362887832bea08d686737861ac3d5b437a3 thomas-yanxin/XinYuan-Qwen2-7B_float16_c62d83eee2f4812ac17fc17d307f4aa1a77c5359_True,thomas-yanxin/XinYuan-Qwen2-7B,c62d83eee2f4812ac17fc17d307f4aa1a77c5359,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.2177136716821,TRUE,IFEval,0.443760333692381,44.3760333692381,BBH,0.49366291572389,28.4014885227586,MATH Level 5,0.132930513595166,13.2930513595166,GPQA,0.291107382550336,5.48098434004475,MUSR,0.4058125,9.25989583333334,MMLU-PRO,0.392453457446809,32.4948286052009,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-21,2024-09-03,0,thomas-yanxin/XinYuan-Qwen2-7B,other,1,7.616,3.27615443959276 thomas-yanxin/XinYuan-Qwen2-7B-0917_float16_6cee1b155fca9ae1f558f434953dfdadb9596af0_True,thomas-yanxin/XinYuan-Qwen2-7B-0917,6cee1b155fca9ae1f558f434953dfdadb9596af0,float16,fine-tunedondomain-specificdatasets,Original,Qwen2ForCausalLM,22.7216165321403,TRUE,IFEval,0.371919839359566,37.1919839359566,BBH,0.516921557378601,32.6199381358211,MATH Level 5,0.088368580060423,8.8368580060423,GPQA,0.309563758389262,7.94183445190157,MUSR,0.440104166666667,13.6796875,MMLU-PRO,0.424534574468085,36.0593971631206,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-17,2024-09-17,0,thomas-yanxin/XinYuan-Qwen2-7B-0917,other,4,7.616,1.48556449363563 thomas-yanxin/XinYuan-Qwen2.5-7B-0917_float16_bbbeafd1003c4d5e13f09b7223671957384b961a_True,thomas-yanxin/XinYuan-Qwen2.5-7B-0917,bbbeafd1003c4d5e13f09b7223671957384b961a,float16,chatmodels,Original,Qwen2ForCausalLM,18.1750369812353,TRUE,IFEval,0.357706441131753,35.7706441131753,BBH,0.518410611698749,33.439669270242,MATH Level 5,0,0,GPQA,0.281040268456376,4.13870246085012,MUSR,0.367552083333333,3.67734375,MMLU-PRO,0.388214760638298,32.0238622931442,TRUE,FALSE,FALSE,FALSE,FALSE,2024-09-17,2024-09-24,0,thomas-yanxin/XinYuan-Qwen2.5-7B-0917,other,4,7.616,0.971225233350759 -tiiuae/Falcon3-10B-Base_bfloat16_0b20cceec08ec598ed2de7a6dfbeb208f1eae656_False,tiiuae/Falcon3-10B-Base,0b20cceec08ec598ed2de7a6dfbeb208f1eae656,bfloat16,pretrained,Original,LlamaForCausalLM,27.5926746458582,FALSE,IFEval,0.36477546243966,36.477546243966,BBH,0.595004253437141,41.375462186518,MATH Level 5,0.24773413897281,24.773413897281,GPQA,0.345637583892617,12.751677852349,MUSR,0.439791666666667,14.1739583333333,MMLU-PRO,0.424035904255319,36.0039893617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-12,0,tiiuae/Falcon3-10B-Base,other,29,10.306,0.810389439981991 +tiiuae/Falcon3-10B-Base_bfloat16_0b20cceec08ec598ed2de7a6dfbeb208f1eae656_False,tiiuae/Falcon3-10B-Base,0b20cceec08ec598ed2de7a6dfbeb208f1eae656,bfloat16,pretrained,Original,LlamaForCausalLM,27.5926746458582,FALSE,IFEval,0.36477546243966,36.477546243966,BBH,0.595004253437141,41.375462186518,MATH Level 5,0.24773413897281,24.773413897281,GPQA,0.345637583892617,12.751677852349,MUSR,0.439791666666667,14.1739583333333,MMLU-PRO,0.424035904255319,36.0039893617021,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-03,2024-12-12,0,tiiuae/Falcon3-10B-Base,other,30,10.306,0.810389439981991 tiiuae/Falcon3-10B-Instruct_bfloat16_9be8471432d7c4f35f72505fa2ca4101f0a2ed6d_True,tiiuae/Falcon3-10B-Instruct,9be8471432d7c4f35f72505fa2ca4101f0a2ed6d,bfloat16,chatmodels,Original,LlamaForCausalLM,35.1858847768594,TRUE,IFEval,0.78165600606391,78.1656006063911,BBH,0.617046939805208,44.8215398248313,MATH Level 5,0.259063444108761,25.9063444108761,GPQA,0.328859060402685,10.5145413870246,MUSR,0.432322916666667,13.60703125,MMLU-PRO,0.442902260638298,38.1002511820331,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,1,tiiuae/Falcon3-10B-Base,other,64,10.306,0.840411143061328 +tiiuae/Falcon3-10B-Instruct_float16_2843dfec944639fa3e41aca25456a8a4b3c9d46c_False,tiiuae/Falcon3-10B-Instruct,2843dfec944639fa3e41aca25456a8a4b3c9d46c,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,30.6884786152003,FALSE,IFEval,0.618166464979588,61.8166464979587,BBH,0.609093730631744,43.3315462875091,MATH Level 5,0.217522658610272,21.7522658610272,GPQA,0.333892617449664,11.1856823266219,MUSR,0.400447916666667,8.48932291666667,MMLU-PRO,0.437998670212766,37.5554078014184,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-25,1,tiiuae/Falcon3-10B-Base,other,64,5.153,0.81113658949049 tiiuae/Falcon3-1B-Base_bfloat16_cc56a5a7c3923821312ad14f52c5a7c3fa835cbc_False,tiiuae/Falcon3-1B-Base,cc56a5a7c3923821312ad14f52c5a7c3fa835cbc,bfloat16,pretrained,Original,LlamaForCausalLM,9.8377436362263,FALSE,IFEval,0.242801322712625,24.2801322712625,BBH,0.357115391801564,11.3431732658549,MATH Level 5,0.0302114803625378,3.02114803625378,GPQA,0.279362416107383,3.91498881431767,MUSR,0.414739583333333,9.70911458333333,MMLU-PRO,0.160821143617021,6.7579048463357,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-16,0,tiiuae/Falcon3-1B-Base,other,11,1.669,0.401369486782322 tiiuae/Falcon3-1B-Instruct_bfloat16_27dd70ccb22fd3cc71c5adbc95eb670455afff3d_True,tiiuae/Falcon3-1B-Instruct,27dd70ccb22fd3cc71c5adbc95eb670455afff3d,bfloat16,chatmodels,Original,LlamaForCausalLM,15.3211934957275,TRUE,IFEval,0.555667850193043,55.5667850193043,BBH,0.374453569136667,12.9613740625082,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.266778523489933,2.23713646532438,MUSR,0.418895833333333,10.5619791666667,MMLU-PRO,0.183843085106383,9.31589834515366,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,1,tiiuae/Falcon3-1B-Base,other,25,1.669,0.397020363950145 tiiuae/Falcon3-3B-Base_bfloat16_3d49753006a0fa5384031a737c60fbcd0f60b7f2_False,tiiuae/Falcon3-3B-Base,3d49753006a0fa5384031a737c60fbcd0f60b7f2,bfloat16,pretrained,Original,LlamaForCausalLM,15.7513313104367,FALSE,IFEval,0.27649857932508,27.649857932508,BBH,0.442136782587439,21.5847842937733,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.296979865771812,6.26398210290828,MUSR,0.374989583333333,6.27369791666667,MMLU-PRO,0.287898936170213,20.8776595744681,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,0,tiiuae/Falcon3-3B-Base,other,11,3.228,0.481216475612645 tiiuae/Falcon3-3B-Instruct_bfloat16_552213004cecf9bb6ce332f46da0d4324c8347f1_True,tiiuae/Falcon3-3B-Instruct,552213004cecf9bb6ce332f46da0d4324c8347f1,bfloat16,chatmodels,Original,LlamaForCausalLM,26.5519924326426,TRUE,IFEval,0.697675501004003,69.7675501004003,BBH,0.475443033216757,26.2872294684327,MATH Level 5,0.246978851963746,24.6978851963746,GPQA,0.288590604026846,5.14541387024609,MUSR,0.41359375,11.1325520833333,MMLU-PRO,0.300531914893617,22.2813238770686,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-14,2024-12-16,0,tiiuae/Falcon3-3B-Instruct,other,20,3.228,0.480463645995229 tiiuae/Falcon3-7B-Base_bfloat16_a1cf49eb7a53210fc2ee82f3876bbc7efb2244fd_False,tiiuae/Falcon3-7B-Base,a1cf49eb7a53210fc2ee82f3876bbc7efb2244fd,bfloat16,pretrained,Original,LlamaForCausalLM,24.7205491267482,FALSE,IFEval,0.341594746384039,34.1594746384039,BBH,0.509888046642671,31.5599185475034,MATH Level 5,0.192598187311178,19.2598187311178,GPQA,0.346476510067114,12.8635346756152,MUSR,0.470208333333333,18.1427083333333,MMLU-PRO,0.391040558510638,32.3378398345154,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-21,2024-12-12,0,tiiuae/Falcon3-7B-Base,other,18,7.456,0.609372047303554 -tiiuae/Falcon3-7B-Instruct_bfloat16_7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06_True,tiiuae/Falcon3-7B-Instruct,7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06,bfloat16,chatmodels,Original,LlamaForCausalLM,34.9066990629732,TRUE,IFEval,0.761247933261524,76.1247933261524,BBH,0.563244278519333,37.9158124591715,MATH Level 5,0.318731117824773,31.8731117824773,GPQA,0.310402684563758,8.05369127516779,MUSR,0.482677083333333,21.16796875,MMLU-PRO,0.40874335106383,34.30481678487,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-29,2024-12-16,1,tiiuae/Falcon3-7B-Base,other,31,7.456,0.618760668612507 +tiiuae/Falcon3-7B-Instruct_bfloat16_7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06_True,tiiuae/Falcon3-7B-Instruct,7aae4f3953f3dbfaa81aeecbb404a6bbba0e0c06,bfloat16,chatmodels,Original,LlamaForCausalLM,34.9066990629732,TRUE,IFEval,0.761247933261524,76.1247933261524,BBH,0.563244278519333,37.9158124591715,MATH Level 5,0.318731117824773,31.8731117824773,GPQA,0.310402684563758,8.05369127516779,MUSR,0.482677083333333,21.16796875,MMLU-PRO,0.40874335106383,34.30481678487,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-29,2024-12-16,1,tiiuae/Falcon3-7B-Base,other,33,7.456,0.618760668612507 tiiuae/Falcon3-Mamba-7B-Base_bfloat16_f08d14145ce86c32dd04f18bacb3f12b247042e2_False,tiiuae/Falcon3-Mamba-7B-Base,f08d14145ce86c32dd04f18bacb3f12b247042e2,bfloat16,pretrained,Original,FalconMambaForCausalLM,18.1262038589633,FALSE,IFEval,0.289112887139457,28.9112887139457,BBH,0.469928018882704,25.5340488029532,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.309563758389262,7.94183445190157,MUSR,0.343145833333333,4.39322916666667,MMLU-PRO,0.303773271276596,22.6414745862884,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-11,2024-12-12,0,tiiuae/Falcon3-Mamba-7B-Base,other,15,7.273,0.83631814366917 -tiiuae/Falcon3-Mamba-7B-Instruct_bfloat16_382561849d1509b5f1a4d7a38bb286b3c4f46fbd_True,tiiuae/Falcon3-Mamba-7B-Instruct,382561849d1509b5f1a4d7a38bb286b3c4f46fbd,bfloat16,chatmodels,Original,FalconMambaForCausalLM,27.643894386327,TRUE,IFEval,0.716509971320541,71.6509971320541,BBH,0.467895768841069,25.2035051723981,MATH Level 5,0.272658610271903,27.2658610271903,GPQA,0.303691275167785,7.15883668903803,MUSR,0.386864583333333,8.25807291666667,MMLU-PRO,0.336934840425532,26.3260933806147,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,1,tiiuae/Falcon3-Mamba-7B-Instruct (Merge),other,18,7.273,0.828497506621677 +tiiuae/Falcon3-Mamba-7B-Instruct_bfloat16_382561849d1509b5f1a4d7a38bb286b3c4f46fbd_True,tiiuae/Falcon3-Mamba-7B-Instruct,382561849d1509b5f1a4d7a38bb286b3c4f46fbd,bfloat16,chatmodels,Original,FalconMambaForCausalLM,27.643894386327,TRUE,IFEval,0.716509971320541,71.6509971320541,BBH,0.467895768841069,25.2035051723981,MATH Level 5,0.272658610271903,27.2658610271903,GPQA,0.303691275167785,7.15883668903803,MUSR,0.386864583333333,8.25807291666667,MMLU-PRO,0.336934840425532,26.3260933806147,TRUE,FALSE,FALSE,FALSE,TRUE,2024-12-13,2024-12-13,1,tiiuae/Falcon3-Mamba-7B-Instruct (Merge),other,19,7.273,0.828497506621677 tiiuae/falcon-11B_bfloat16_066e3bf4e2d9aaeefa129af0a6d39727d27816b3_False,tiiuae/falcon-11B,066e3bf4e2d9aaeefa129af0a6d39727d27816b3,bfloat16,pretrained,Original,FalconForCausalLM,13.814138235727,FALSE,IFEval,0.326132439704429,32.6132439704429,BBH,0.439163703554938,21.9379994628903,MATH Level 5,0.0256797583081571,2.56797583081571,GPQA,0.270973154362416,2.79642058165548,MUSR,0.398645833333333,7.53072916666667,MMLU-PRO,0.238946143617021,15.4384604018913,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-09,2024-06-09,0,tiiuae/falcon-11B,unknown,213,11.103,1.08287099141766 tiiuae/falcon-40b_bfloat16_4a70170c215b36a3cce4b4253f6d0612bb7d4146_False,tiiuae/falcon-40b,4a70170c215b36a3cce4b4253f6d0612bb7d4146,bfloat16,pretrained,Original,FalconForCausalLM,11.3635401118469,FALSE,IFEval,0.249645385355302,24.9645385355302,BBH,0.40185324955958,16.5833047303122,MATH Level 5,0.0158610271903323,1.58610271903323,GPQA,0.273489932885906,3.13199105145414,MUSR,0.363145833333333,5.19322916666667,MMLU-PRO,0.250498670212766,16.7220744680851,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-24,2024-06-09,0,tiiuae/falcon-40b,apache-2.0,2424,40,21.7935839014342 tiiuae/falcon-40b-instruct_bfloat16_ecb78d97ac356d098e79f0db222c9ce7c5d9ee5f_False,tiiuae/falcon-40b-instruct,ecb78d97ac356d098e79f0db222c9ce7c5d9ee5f,bfloat16,chatmodels,Original,FalconForCausalLM,10.4341543148279,FALSE,IFEval,0.24544874266945,24.544874266945,BBH,0.40538675151592,17.2201142032645,MATH Level 5,0.0166163141993958,1.66163141993958,GPQA,0.25,0,MUSR,0.376229166666667,5.16197916666667,MMLU-PRO,0.226146941489362,14.0163268321513,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-25,2024-06-09,0,tiiuae/falcon-40b-instruct,apache-2.0,1174,40,19.7332454871768 @@ -2251,7 +2273,7 @@ tiiuae/falcon-mamba-7b_bfloat16_5337fd73f19847e111ba2291f3f0e1617b90c37d_False,t tklohj/WindyFloLLM_float16_21f4241ab3f091d1d309e9076a8d8e3f014908a8_False,tklohj/WindyFloLLM,21f4241ab3f091d1d309e9076a8d8e3f014908a8,float16,pretrained,Original,LlamaForCausalLM,14.2058910531351,FALSE,IFEval,0.26685638550158,26.685638550158,BBH,0.463661600705879,24.3987631978505,MATH Level 5,0.013595166163142,1.3595166163142,GPQA,0.275167785234899,3.35570469798658,MUSR,0.4253125,11.8640625,MMLU-PRO,0.258144946808511,17.5716607565012,FALSE,FALSE,FALSE,FALSE,FALSE,2024-06-30,2024-07-10,1,tklohj/WindyFloLLM (Merge),"",0,13.016,1.09851209304988 togethercomputer/GPT-JT-6B-v1_float16_f34aa35f906895602c1f86f5685e598afdea8051_False,togethercomputer/GPT-JT-6B-v1,f34aa35f906895602c1f86f5685e598afdea8051,float16,fine-tunedondomain-specificdatasets,Original,GPTJForCausalLM,6.82735436046721,FALSE,IFEval,0.206106464181705,20.6106464181705,BBH,0.330266091274267,7.31852396514161,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.260906040268456,1.45413870246085,MUSR,0.37365625,3.87369791666667,MMLU-PRO,0.162566489361702,6.95183215130023,TRUE,FALSE,FALSE,FALSE,TRUE,2022-11-24,2024-06-12,0,togethercomputer/GPT-JT-6B-v1,apache-2.0,301,6,37.9588106808561 togethercomputer/GPT-NeoXT-Chat-Base-20B_float16_d386708e84d862a65f7d2b4989f64750cb657227_False,togethercomputer/GPT-NeoXT-Chat-Base-20B,d386708e84d862a65f7d2b4989f64750cb657227,float16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,4.96406182126427,FALSE,IFEval,0.182975615810494,18.2975615810494,BBH,0.33209702572173,6.83079498313785,MATH Level 5,0.0128398791540786,1.28398791540786,GPQA,0.25,0,MUSR,0.3460625,1.7578125,MMLU-PRO,0.114527925531915,1.61421394799054,TRUE,FALSE,FALSE,FALSE,TRUE,2023-03-03,2024-06-12,0,togethercomputer/GPT-NeoXT-Chat-Base-20B,apache-2.0,695,20,2.98358798772187 -togethercomputer/LLaMA-2-7B-32K_float16_46c24bb5aef59722fa7aa6d75e832afd1d64b980_False,togethercomputer/LLaMA-2-7B-32K,46c24bb5aef59722fa7aa6d75e832afd1d64b980,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,6.73701093305286,FALSE,IFEval,0.186497382500654,18.6497382500654,BBH,0.339951752173017,8.08998422988955,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.25,0,MUSR,0.375364583333333,4.32057291666667,MMLU-PRO,0.176778590425532,8.53095449172577,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-26,2024-06-12,0,togethercomputer/LLaMA-2-7B-32K,llama2,534,7,0.584572773138673 +togethercomputer/LLaMA-2-7B-32K_float16_46c24bb5aef59722fa7aa6d75e832afd1d64b980_False,togethercomputer/LLaMA-2-7B-32K,46c24bb5aef59722fa7aa6d75e832afd1d64b980,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,6.73701093305286,FALSE,IFEval,0.186497382500654,18.6497382500654,BBH,0.339951752173017,8.08998422988955,MATH Level 5,0.00830815709969789,0.830815709969789,GPQA,0.25,0,MUSR,0.375364583333333,4.32057291666667,MMLU-PRO,0.176778590425532,8.53095449172577,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-26,2024-06-12,0,togethercomputer/LLaMA-2-7B-32K,llama2,535,7,0.584572773138673 togethercomputer/Llama-2-7B-32K-Instruct_float16_d27380af003252f5eb0d218e104938b4e673e3f3_False,togethercomputer/Llama-2-7B-32K-Instruct,d27380af003252f5eb0d218e104938b4e673e3f3,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,8.20818971851801,FALSE,IFEval,0.213000394508792,21.3000394508792,BBH,0.344347242399275,8.56346991944695,MATH Level 5,0.0128398791540785,1.28398791540785,GPQA,0.251677852348993,0.223713646532442,MUSR,0.40559375,9.19921875,MMLU-PRO,0.178108377659574,8.67870862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2023-08-08,2024-06-12,0,togethercomputer/Llama-2-7B-32K-Instruct,llama2,159,7,0.589909363259561 togethercomputer/RedPajama-INCITE-7B-Base_float16_78f7e482443971f4873ba3239f0ac810a367833b_False,togethercomputer/RedPajama-INCITE-7B-Base,78f7e482443971f4873ba3239f0ac810a367833b,float16,pretrained,Original,GPTNeoXForCausalLM,5.48628559312893,FALSE,IFEval,0.208229719366836,20.8229719366836,BBH,0.319488987650134,5.08724227291643,MATH Level 5,0.0113293051359517,1.13293051359517,GPQA,0.25503355704698,0.671140939597318,MUSR,0.362,3.01666666666667,MMLU-PRO,0.11968085106383,2.18676122931442,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-04,2024-06-12,0,togethercomputer/RedPajama-INCITE-7B-Base,apache-2.0,94,7,1.2206071633267 togethercomputer/RedPajama-INCITE-7B-Chat_float16_47b94a739e2f3164b438501c8684acc5d5acc146_False,togethercomputer/RedPajama-INCITE-7B-Chat,47b94a739e2f3164b438501c8684acc5d5acc146,float16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,3.96278377352117,FALSE,IFEval,0.155797727806664,15.5797727806664,BBH,0.317544932845737,4.5021736643812,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.25251677852349,0.335570469798655,MUSR,0.344760416666667,1.86171875,MMLU-PRO,0.112117686170213,1.34640957446808,TRUE,FALSE,FALSE,FALSE,TRUE,2023-05-04,2024-06-13,0,togethercomputer/RedPajama-INCITE-7B-Chat,apache-2.0,92,7,1.21933610668148 @@ -2262,7 +2284,7 @@ togethercomputer/RedPajama-INCITE-Instruct-3B-v1_float16_0c66778ee09a03688674170 tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1_bfloat16_1fae784584dd03680b72dd4de7eefbc5b7cabcd5_True,tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1,1fae784584dd03680b72dd4de7eefbc5b7cabcd5,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,22.3073854674577,TRUE,IFEval,0.550771951754678,55.0771951754678,BBH,0.5009389976232,29.2679661316177,MATH Level 5,0.0725075528700906,7.25075528700906,GPQA,0.289429530201342,5.2572706935123,MUSR,0.435697916666667,13.7955729166667,MMLU-PRO,0.308759973404255,23.1955526004728,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-26,2024-09-12,0,tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1,llama3,16,8.03,0.858110170753023 unsloth/Phi-3-mini-4k-instruct_float16_636c707430a5509c80b1aa51d05c127ed339a975_True,unsloth/Phi-3-mini-4k-instruct,636c707430a5509c80b1aa51d05c127ed339a975,float16,basemergesandmoerges,Original,MistralForCausalLM,27.1783743374799,TRUE,IFEval,0.544027624480822,54.4027624480822,BBH,0.550023946744103,36.732473265614,MATH Level 5,0.154078549848943,15.4078549848943,GPQA,0.322986577181208,9.73154362416107,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.403091755319149,33.6768617021277,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-11-25,0,unsloth/Phi-3-mini-4k-instruct,mit,41,3.821,0.469533108024419 upstage/SOLAR-10.7B-Instruct-v1.0_float16_c08c25ed66414a878fe0401a3596d536c083606c_True,upstage/SOLAR-10.7B-Instruct-v1.0,c08c25ed66414a878fe0401a3596d536c083606c,float16,chatmodels,Original,LlamaForCausalLM,19.6282553318946,TRUE,IFEval,0.473660997265035,47.3660997265035,BBH,0.516249494144699,31.8724018880021,MATH Level 5,0,0,GPQA,0.308724832214765,7.82997762863535,MUSR,0.3899375,6.9421875,MMLU-PRO,0.313829787234043,23.7588652482269,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,1,upstage/SOLAR-10.7B-Instruct-v1.0 (Merge),cc-by-nc-4.0,619,10.732,0.782775785638588 -upstage/SOLAR-10.7B-v1.0_float16_a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5_False,upstage/SOLAR-10.7B-v1.0,a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5,float16,pretrained,Original,LlamaForCausalLM,4.9164478862809,FALSE,IFEval,0.171584728520326,17.1584728520326,BBH,0.299835173754951,2.14716276381869,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.260906040268456,1.45413870246085,MUSR,0.368197916666667,4.52473958333333,MMLU-PRO,0.116855053191489,1.87278368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,0,upstage/SOLAR-10.7B-v1.0,apache-2.0,292,10.732,1.51919401838023 +upstage/SOLAR-10.7B-v1.0_float16_a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5_False,upstage/SOLAR-10.7B-v1.0,a45090b8e56bdc2b8e32e46b3cd782fc0bea1fa5,float16,pretrained,Original,LlamaForCausalLM,4.9164478862809,FALSE,IFEval,0.171584728520326,17.1584728520326,BBH,0.299835173754951,2.14716276381869,MATH Level 5,0.0234138972809668,2.34138972809668,GPQA,0.260906040268456,1.45413870246085,MUSR,0.368197916666667,4.52473958333333,MMLU-PRO,0.116855053191489,1.87278368794326,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,0,upstage/SOLAR-10.7B-v1.0,apache-2.0,293,10.732,1.51919401838023 upstage/solar-pro-preview-instruct_bfloat16_b4db141b5fb08b23f8bc323bc34e2cff3e9675f8_True,upstage/solar-pro-preview-instruct,b4db141b5fb08b23f8bc323bc34e2cff3e9675f8,bfloat16,chatmodels,Original,SolarForCausalLM,39.9008905140799,TRUE,IFEval,0.841581448334863,84.1581448334863,BBH,0.681684305137953,54.8223509998353,MATH Level 5,0.218277945619335,21.8277945619335,GPQA,0.370805369127517,16.1073825503356,MUSR,0.44165625,15.00703125,MMLU-PRO,0.52734375,47.4826388888889,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-09,2024-09-11,0,upstage/solar-pro-preview-instruct,mit,436,22.14,1.7417631529201 uukuguy/speechless-code-mistral-7b-v1.0_bfloat16_1862e0a712efc6002112e9c1235a197d58419b37_False,uukuguy/speechless-code-mistral-7b-v1.0,1862e0a712efc6002112e9c1235a197d58419b37,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,18.0918867557836,FALSE,IFEval,0.366524155906329,36.6524155906329,BBH,0.45717128870942,24.0914120678456,MATH Level 5,0.0460725075528701,4.60725075528701,GPQA,0.284395973154362,4.58612975391499,MUSR,0.450177083333333,14.7721354166667,MMLU-PRO,0.314577792553192,23.8419769503546,TRUE,FALSE,FALSE,FALSE,FALSE,2023-10-10,2024-06-26,0,uukuguy/speechless-code-mistral-7b-v1.0,apache-2.0,18,7,0.646398339303366 uukuguy/speechless-codellama-34b-v2.0_bfloat16_419bc42a254102d6a5486a1a854068e912c4047c_False,uukuguy/speechless-codellama-34b-v2.0,419bc42a254102d6a5486a1a854068e912c4047c,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,17.20935759677,FALSE,IFEval,0.460421681139377,46.0421681139377,BBH,0.481312669744462,25.9932932678406,MATH Level 5,0.0430513595166163,4.30513595166163,GPQA,0.269295302013423,2.57270693512305,MUSR,0.378708333333333,7.20520833333333,MMLU-PRO,0.254238696808511,17.1376329787234,TRUE,FALSE,FALSE,FALSE,FALSE,2023-10-04,2024-06-26,0,uukuguy/speechless-codellama-34b-v2.0,llama2,17,34,1.9912541922771 @@ -2287,7 +2309,7 @@ vicgalle/Configurable-Yi-1.5-9B-Chat_float16_992cb2232caae78eff6a836b2e0642f7cbf vicgalle/ConfigurableBeagle-11B_float16_bbc16dbf94b8e8a99bb3e2ada6755faf9c2990dd_True,vicgalle/ConfigurableBeagle-11B,bbc16dbf94b8e8a99bb3e2ada6755faf9c2990dd,float16,chatmodels,Original,MistralForCausalLM,22.635544120218,TRUE,IFEval,0.583445258580566,58.3445258580566,BBH,0.52865923186267,32.3920229028112,MATH Level 5,0.0438066465256798,4.38066465256798,GPQA,0.302013422818792,6.93512304250559,MUSR,0.395302083333333,7.37942708333333,MMLU-PRO,0.337433510638298,26.3815011820331,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-17,2024-06-26,0,vicgalle/ConfigurableBeagle-11B,apache-2.0,3,10.732,0.879856522706047 vicgalle/ConfigurableHermes-7B_float16_1333a88eaf6591836b2d9825d1eaec7260f336c9_True,vicgalle/ConfigurableHermes-7B,1333a88eaf6591836b2d9825d1eaec7260f336c9,float16,chatmodels,Original,MistralForCausalLM,19.5362954149074,TRUE,IFEval,0.541079890246768,54.1079890246768,BBH,0.457296962783042,23.1581643804065,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.276845637583893,3.57941834451902,MUSR,0.4056875,9.1109375,MMLU-PRO,0.302526595744681,22.5029550827423,TRUE,FALSE,FALSE,FALSE,FALSE,2024-02-17,2024-06-26,0,vicgalle/ConfigurableHermes-7B,apache-2.0,3,7.242,0.61728188136055 vicgalle/ConfigurableSOLAR-10.7B_float16_9d9baad88ea9dbaa61881f15e4f0d16e931033b4_True,vicgalle/ConfigurableSOLAR-10.7B,9d9baad88ea9dbaa61881f15e4f0d16e931033b4,float16,chatmodels,Original,LlamaForCausalLM,19.0456959218201,TRUE,IFEval,0.509955806149905,50.9955806149905,BBH,0.486681009773605,27.4509501416669,MATH Level 5,0,0,GPQA,0.298657718120805,6.48769574944072,MUSR,0.380479166666667,5.19322916666667,MMLU-PRO,0.317320478723404,24.146719858156,TRUE,FALSE,FALSE,FALSE,FALSE,2024-03-10,2024-06-26,0,vicgalle/ConfigurableSOLAR-10.7B,apache-2.0,2,10.732,0.677681314775582 -vicgalle/Humanish-RP-Llama-3.1-8B_float16_d27aa731db1d390a8d17b0a4565c9231ee5ae8b9_True,vicgalle/Humanish-RP-Llama-3.1-8B,d27aa731db1d390a8d17b0a4565c9231ee5ae8b9,float16,chatmodels,Original,LlamaForCausalLM,25.347670753782,TRUE,IFEval,0.666925978625602,66.6925978625602,BBH,0.510038547614325,29.9585603152367,MATH Level 5,0.147280966767372,14.7280966767372,GPQA,0.286912751677852,4.92170022371365,MUSR,0.395208333333333,8.26770833333333,MMLU-PRO,0.34765625,27.5173611111111,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-03,2024-08-03,0,vicgalle/Humanish-RP-Llama-3.1-8B,apache-2.0,8,8.03,0.753450538005498 +vicgalle/Humanish-RP-Llama-3.1-8B_float16_d27aa731db1d390a8d17b0a4565c9231ee5ae8b9_True,vicgalle/Humanish-RP-Llama-3.1-8B,d27aa731db1d390a8d17b0a4565c9231ee5ae8b9,float16,chatmodels,Original,LlamaForCausalLM,25.347670753782,TRUE,IFEval,0.666925978625602,66.6925978625602,BBH,0.510038547614325,29.9585603152367,MATH Level 5,0.147280966767372,14.7280966767372,GPQA,0.286912751677852,4.92170022371365,MUSR,0.395208333333333,8.26770833333333,MMLU-PRO,0.34765625,27.5173611111111,TRUE,FALSE,FALSE,FALSE,FALSE,2024-08-03,2024-08-03,0,vicgalle/Humanish-RP-Llama-3.1-8B,apache-2.0,9,8.03,0.753450538005498 vicgalle/Merge-Mistral-Prometheus-7B_bfloat16_a7083581b508ce83c74f9267f07024bd462e7161_True,vicgalle/Merge-Mistral-Prometheus-7B,a7083581b508ce83c74f9267f07024bd462e7161,bfloat16,basemergesandmoerges,Original,MistralForCausalLM,16.5740542307737,TRUE,IFEval,0.484801437962384,48.4801437962384,BBH,0.420139773821292,18.4104062669295,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.263422818791946,1.78970917225951,MUSR,0.41,9.95,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,TRUE,FALSE,FALSE,FALSE,2024-05-04,2024-06-26,1,vicgalle/Merge-Mistral-Prometheus-7B (Merge),apache-2.0,1,7.242,0.630355575128161 vicgalle/Merge-Mixtral-Prometheus-8x7B_bfloat16_ba53ee5b52a81e56b01e919c069a0d045cfd4e83_True,vicgalle/Merge-Mixtral-Prometheus-8x7B,ba53ee5b52a81e56b01e919c069a0d045cfd4e83,bfloat16,basemergesandmoerges,Original,MixtralForCausalLM,24.7941577597984,TRUE,IFEval,0.57440258514076,57.440258514076,BBH,0.535149807109657,34.6514212661431,MATH Level 5,0.0944108761329305,9.44108761329305,GPQA,0.308724832214765,7.82997762863535,MUSR,0.40975,9.58541666666667,MMLU-PRO,0.368351063829787,29.8167848699764,TRUE,TRUE,TRUE,FALSE,FALSE,2024-05-04,2024-06-26,1,vicgalle/Merge-Mixtral-Prometheus-8x7B (Merge),apache-2.0,2,46.703,3.67400914913757 vicgalle/Roleplay-Llama-3-8B_float16_57297eb57dcc2c116f061d9dda341094203da01b_True,vicgalle/Roleplay-Llama-3-8B,57297eb57dcc2c116f061d9dda341094203da01b,float16,chatmodels,Original,LlamaForCausalLM,24.0831235202376,TRUE,IFEval,0.732022145684561,73.2022145684561,BBH,0.501231820692232,28.5546039092406,MATH Level 5,0.095166163141994,9.5166163141994,GPQA,0.260906040268456,1.45413870246085,MUSR,0.352885416666667,1.67734375,MMLU-PRO,0.370844414893617,30.0938238770686,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-19,2024-06-26,0,vicgalle/Roleplay-Llama-3-8B,apache-2.0,36,8.03,1.12615851389189 @@ -2383,11 +2405,13 @@ zelk12/MT1-Gen1-gemma-2-9B_bfloat16_939ac6c12059a18fc1117cdb3861f46816eff2fb_Tru zelk12/MT1-Gen2-gemma-2-9B_bfloat16_aeaca7dc7d50a425a5d3c38d7c4a7daf1c772ad4_True,zelk12/MT1-Gen2-gemma-2-9B,aeaca7dc7d50a425a5d3c38d7c4a7daf1c772ad4,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,33.1423983132787,TRUE,IFEval,0.798367221195317,79.8367221195317,BBH,0.609598989469156,43.9191905580506,MATH Level 5,0.113293051359517,11.3293051359517,GPQA,0.352348993288591,13.6465324384787,MUSR,0.428354166666667,12.8442708333333,MMLU-PRO,0.435505319148936,37.2783687943262,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-11,2024-11-11,1,zelk12/MT1-Gen2-gemma-2-9B (Merge),"",2,10.159,1.99599515181469 zelk12/MT1-Gen3-gemma-2-9B_bfloat16_5cc4ee1c70f08a5b1a195d43f044d9bf6fca29f5_True,zelk12/MT1-Gen3-gemma-2-9B,5cc4ee1c70f08a5b1a195d43f044d9bf6fca29f5,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,32.9649266979476,TRUE,IFEval,0.795969139660545,79.5969139660545,BBH,0.610155139201776,43.9903061254897,MATH Level 5,0.117824773413897,11.7824773413897,GPQA,0.348993288590604,13.1991051454139,MUSR,0.424322916666667,12.00703125,MMLU-PRO,0.434923537234043,37.2137263593381,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-01,2024-12-01,1,zelk12/MT1-Gen3-gemma-2-9B (Merge),"",0,10.159,1.94487662298927 zelk12/MT1-Gen4-gemma-2-9B_bfloat16_5eaf1ef67f32805c6fbc0b51418a8caf866661a2_True,zelk12/MT1-Gen4-gemma-2-9B,5eaf1ef67f32805c6fbc0b51418a8caf866661a2,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.5072355710121,TRUE,IFEval,0.794120710825055,79.4120710825055,BBH,0.605756767760905,43.1453681610688,MATH Level 5,0.0490936555891239,4.90936555891239,GPQA,0.347315436241611,12.9753914988814,MUSR,0.423114583333333,12.0893229166667,MMLU-PRO,0.42860704787234,36.5118942080378,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-14,2024-12-14,1,zelk12/MT1-Gen4-gemma-2-9B (Merge),gemma,1,9,1.74206227518399 +zelk12/MT1-Gen5-gemma-2-9B_bfloat16_4eb54f9a0a9f482537b0e79000ffe7fb9d024c38_True,zelk12/MT1-Gen5-gemma-2-9B,4eb54f9a0a9f482537b0e79000ffe7fb9d024c38,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,30.6361740982541,TRUE,IFEval,0.779482883194369,77.9482883194369,BBH,0.601745501763189,42.4967641989982,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.346476510067114,12.8635346756152,MUSR,0.419145833333333,11.4598958333333,MMLU-PRO,0.422207446808511,35.8008274231679,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-24,2024-12-24,1,zelk12/MT1-Gen5-gemma-2-9B (Merge),gemma,0,5.08,1.75523033656311 zelk12/MT1-gemma-2-9B_bfloat16_3a5e77518ca9c3c8ea2edac4c03bc220ee91f3ed_True,zelk12/MT1-gemma-2-9B,3a5e77518ca9c3c8ea2edac4c03bc220ee91f3ed,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,33.6338291770933,TRUE,IFEval,0.794670363524338,79.4670363524338,BBH,0.610874595075693,44.1615262166188,MATH Level 5,0.149546827794562,14.9546827794562,GPQA,0.345637583892617,12.751677852349,MUSR,0.432229166666667,13.1619791666667,MMLU-PRO,0.435754654255319,37.3060726950355,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-12,2024-10-14,1,zelk12/MT1-gemma-2-9B (Merge),"",1,10.159,3.3457193902416 zelk12/MT2-Gen1-gemma-2-9B_bfloat16_167abf8eb4ea01fecd42dc32ad68160c51a8685a_True,zelk12/MT2-Gen1-gemma-2-9B,167abf8eb4ea01fecd42dc32ad68160c51a8685a,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,32.4602232030711,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.610080202792074,44.1411031572748,MATH Level 5,0.101208459214502,10.1208459214502,GPQA,0.343120805369128,12.4161073825503,MUSR,0.424322916666667,12.00703125,MMLU-PRO,0.437666223404255,37.5184692671395,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-24,2024-10-27,1,zelk12/MT2-Gen1-gemma-2-9B (Merge),"",0,10.159,3.38320977682526 zelk12/MT2-Gen2-gemma-2-9B_bfloat16_24c487499b5833424ffb9932eed838bb254f61b4_True,zelk12/MT2-Gen2-gemma-2-9B,24c487499b5833424ffb9932eed838bb254f61b4,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,33.4711721257521,TRUE,IFEval,0.788900118352638,78.8900118352638,BBH,0.609291753193645,44.0445025622076,MATH Level 5,0.148036253776435,14.8036253776435,GPQA,0.346476510067114,12.8635346756152,MUSR,0.427020833333333,12.5776041666667,MMLU-PRO,0.438829787234043,37.6477541371158,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-12,2024-11-12,1,zelk12/MT2-Gen2-gemma-2-9B (Merge),"",3,10.159,2.0374413053929 zelk12/MT2-Gen3-gemma-2-9B_bfloat16_bb750c2b76328c6dbc9adf9ae3d09551f3723758_True,zelk12/MT2-Gen3-gemma-2-9B,bb750c2b76328c6dbc9adf9ae3d09551f3723758,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,32.9678950988867,TRUE,IFEval,0.781006617995807,78.1006617995807,BBH,0.610477206537393,44.0072740588439,MATH Level 5,0.132930513595166,13.2930513595166,GPQA,0.346476510067114,12.8635346756152,MUSR,0.423083333333333,12.0520833333333,MMLU-PRO,0.437416888297872,37.4907653664303,FALSE,FALSE,FALSE,FALSE,FALSE,2024-12-04,2024-12-04,1,zelk12/MT2-Gen3-gemma-2-9B (Merge),"",1,10.159,1.92437675479163 zelk12/MT2-Gen4-gemma-2-9B_bfloat16_7a07de3719c3b8b8e90e79a65798bcc4ef454fc6_True,zelk12/MT2-Gen4-gemma-2-9B,7a07de3719c3b8b8e90e79a65798bcc4ef454fc6,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.8609318658179,TRUE,IFEval,0.789599374105152,78.9599374105152,BBH,0.609655139201776,43.7783616810452,MATH Level 5,0.0830815709969789,8.30815709969789,GPQA,0.345637583892617,12.751677852349,MUSR,0.412541666666667,10.4677083333333,MMLU-PRO,0.432097739361702,36.8997488179669,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-15,2024-12-15,1,zelk12/MT2-Gen4-gemma-2-9B (Merge),gemma,1,9,1.7864357226101 +zelk12/MT2-Gen5-gemma-2-9B_bfloat16_94711cc263eab1464fa6b01c28ee5171b4467d84_True,zelk12/MT2-Gen5-gemma-2-9B,94711cc263eab1464fa6b01c28ee5171b4467d84,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.5945507760444,TRUE,IFEval,0.774911678790055,77.4911678790055,BBH,0.606393381752774,43.1242813733858,MATH Level 5,0.0634441087613293,6.34441087613293,GPQA,0.351510067114094,13.5346756152125,MUSR,0.424416666666667,12.3854166666667,MMLU-PRO,0.430186170212766,36.6873522458629,TRUE,TRUE,FALSE,FALSE,FALSE,2024-12-25,2024-12-25,1,zelk12/MT2-Gen5-gemma-2-9B (Merge),gemma,0,5.08,1.7621357118449 zelk12/MT2-gemma-2-9B_bfloat16_d20d7169ce0f53d586504c50b4b7dc470bf8a781_True,zelk12/MT2-gemma-2-9B,d20d7169ce0f53d586504c50b4b7dc470bf8a781,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,33.2824999153575,TRUE,IFEval,0.788575424318586,78.8575424318586,BBH,0.611511004530543,44.1674813698923,MATH Level 5,0.147280966767372,14.7280966767372,GPQA,0.347315436241611,12.9753914988814,MUSR,0.42165625,11.5403645833333,MMLU-PRO,0.436835106382979,37.4261229314421,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-14,2024-10-15,1,zelk12/MT2-gemma-2-9B (Merge),"",1,10.159,3.19410987112374 zelk12/MT3-Gen1-gemma-2-9B_bfloat16_cd78df9e67e2e710d8d305f5a03a92c01b1b425d_True,zelk12/MT3-Gen1-gemma-2-9B,cd78df9e67e2e710d8d305f5a03a92c01b1b425d,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,31.0548450771972,TRUE,IFEval,0.783779261249042,78.3779261249042,BBH,0.610676093203033,44.1194946874028,MATH Level 5,0.0324773413897281,3.24773413897281,GPQA,0.346476510067114,12.8635346756152,MUSR,0.415114583333333,10.7559895833333,MMLU-PRO,0.432679521276596,36.9643912529551,FALSE,FALSE,FALSE,FALSE,FALSE,2024-10-24,2024-10-28,1,zelk12/MT3-Gen1-gemma-2-9B (Merge),"",1,10.159,3.11366590171411 zelk12/MT3-Gen2-gemma-2-9B_bfloat16_e4ef057d20751d89934025e9088ba98d89b921b5_True,zelk12/MT3-Gen2-gemma-2-9B,e4ef057d20751d89934025e9088ba98d89b921b5,bfloat16,basemergesandmoerges,Original,Gemma2ForCausalLM,30.9636258974297,TRUE,IFEval,0.784328913948324,78.4328913948324,BBH,0.609147319467617,43.940225749255,MATH Level 5,0.020392749244713,2.0392749244713,GPQA,0.357382550335571,14.3176733780761,MUSR,0.411114583333333,10.02265625,MMLU-PRO,0.433261303191489,37.0290336879433,FALSE,FALSE,FALSE,FALSE,FALSE,2024-11-20,2024-11-20,1,zelk12/MT3-Gen2-gemma-2-9B (Merge),"",1,10.159,1.91910839859834 diff --git a/csv/merged.csv b/csv/merged.csv index 473a7a0..874fb40 100644 --- a/csv/merged.csv +++ b/csv/merged.csv @@ -1,34 +1,34 @@ key,id,model_name,model_sha,model_precision,model_type,model_weight_type,model_architecture,model_average_score,model_has_chat_template,evaluations_ifeval_name,evaluations_ifeval_value,evaluations_ifeval_normalized_score,evaluations_bbh_name,evaluations_bbh_value,evaluations_bbh_normalized_score,evaluations_math_name,evaluations_math_value,evaluations_math_normalized_score,evaluations_gpqa_name,evaluations_gpqa_value,evaluations_gpqa_normalized_score,evaluations_musr_name,evaluations_musr_value,evaluations_musr_normalized_score,evaluations_mmlu_pro_name,evaluations_mmlu_pro_value,evaluations_mmlu_pro_normalized_score,features_is_not_available_on_hub,features_is_merged,features_is_moe,features_is_flagged,features_is_highlighted_by_maintainer,metadata_upload_date,metadata_submission_date,metadata_generation,metadata_base_model,metadata_hub_license,metadata_hub_hearts,metadata_params_billions,metadata_co2_cost,rank,rank_stylectrl,model,arena_score,95_pct_ci,votes,organization,license,knowledge_cutoff,url -aya-expanse-32b,CohereForAI/aya-expanse-32b_float16_08b69cfa4240e2009c80ad304f000b491d1b8c38_True,CohereForAI/aya-expanse-32b,08b69cfa4240e2009c80ad304f000b491d1b8c38,float16,chatmodels,Original,CohereForCausalLM,29.3912190893162,TRUE,IFEval,0.730173716849072,73.0173716849072,BBH,0.564867009921211,38.7096114330142,MATH Level 5,0.13368580060423,13.368580060423,GPQA,0.325503355704698,10.0671140939597,MUSR,0.387270833333333,6.40885416666667,MMLU-PRO,0.41298204787234,34.7757830969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-32b,cc-by-nc-4.0,192,32.296,5.5177350999101,54,62,Aya-Expanse-32B,1209,+4/-5,23536,Cohere,CC-BY-NC-4.0,Unknown,https://huggingface.co/CohereForAI/aya-expanse-32b -aya-expanse-8b,CohereForAI/aya-expanse-8b_float16_b9848575c8731981dfcf2e1f3bfbcb917a2e585d_True,CohereForAI/aya-expanse-8b,b9848575c8731981dfcf2e1f3bfbcb917a2e585d,float16,chatmodels,Original,CohereForCausalLM,22.1422232448213,TRUE,IFEval,0.63585176221315,63.585176221315,BBH,0.497720305573641,28.5234825042885,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.302852348993289,7.04697986577182,MUSR,0.372885416666667,4.41067708333333,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-8b,cc-by-nc-4.0,307,8.028,1.1696890688757,72,79,Aya-Expanse-8B,1179,+8/-8,5426,Cohere,CC-BY-NC-4.0,Unknown,https://huggingface.co/CohereForAI/aya-expanse-8b +aya-expanse-32b,CohereForAI/aya-expanse-32b_float16_08b69cfa4240e2009c80ad304f000b491d1b8c38_True,CohereForAI/aya-expanse-32b,08b69cfa4240e2009c80ad304f000b491d1b8c38,float16,chatmodels,Original,CohereForCausalLM,29.3912190893162,TRUE,IFEval,0.730173716849072,73.0173716849072,BBH,0.564867009921211,38.7096114330142,MATH Level 5,0.13368580060423,13.368580060423,GPQA,0.325503355704698,10.0671140939597,MUSR,0.387270833333333,6.40885416666667,MMLU-PRO,0.41298204787234,34.7757830969267,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-32b,cc-by-nc-4.0,195,32.296,5.5177350999101,54,62,Aya-Expanse-32B,1209,+4/-5,23536,Cohere,CC-BY-NC-4.0,Unknown,https://huggingface.co/CohereForAI/aya-expanse-32b +aya-expanse-8b,CohereForAI/aya-expanse-8b_float16_b9848575c8731981dfcf2e1f3bfbcb917a2e585d_True,CohereForAI/aya-expanse-8b,b9848575c8731981dfcf2e1f3bfbcb917a2e585d,float16,chatmodels,Original,CohereForCausalLM,22.1422232448213,TRUE,IFEval,0.63585176221315,63.585176221315,BBH,0.497720305573641,28.5234825042885,MATH Level 5,0.0702416918429003,7.02416918429003,GPQA,0.302852348993289,7.04697986577182,MUSR,0.372885416666667,4.41067708333333,MMLU-PRO,0.300365691489362,22.2628546099291,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-23,2024-10-24,0,CohereForAI/aya-expanse-8b,cc-by-nc-4.0,309,8.028,1.1696890688757,72,79,Aya-Expanse-8B,1179,+8/-8,5426,Cohere,CC-BY-NC-4.0,Unknown,https://huggingface.co/CohereForAI/aya-expanse-8b deepseek-llm-67b-chat,deepseek-ai/deepseek-llm-67b-chat_bfloat16_79648bef7658bb824e4630740f6e1484c1b0620b_True,deepseek-ai/deepseek-llm-67b-chat,79648bef7658bb824e4630740f6e1484c1b0620b,bfloat16,chatmodels,Original,LlamaForCausalLM,26.9959289542937,TRUE,IFEval,0.558715319795919,55.8715319795919,BBH,0.524341617974236,33.2252419253453,MATH Level 5,0.0740181268882175,7.40181268882175,GPQA,0.316275167785235,8.83668903803132,MUSR,0.505864583333333,23.9330729166667,MMLU-PRO,0.394365026595745,32.707225177305,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-29,2024-06-12,0,deepseek-ai/deepseek-llm-67b-chat,other,177,67,59.8218086686963,126,118,DeepSeek-LLM-67B-Chat,1077,+9/-7,4985,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat dolly-v2-12b,databricks/dolly-v2-12b_bfloat16_19308160448536e378e3db21a73a751579ee7fdd_False,databricks/dolly-v2-12b,19308160448536e378e3db21a73a751579ee7fdd,bfloat16,fine-tunedondomain-specificdatasets,Original,GPTNeoXForCausalLM,6.3830238203141,FALSE,IFEval,0.235507342739487,23.5507342739487,BBH,0.331997316737713,6.37789413745296,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.240771812080537,0,MUSR,0.37390625,5.50494791666667,MMLU-PRO,0.112865691489362,1.42952127659574,TRUE,FALSE,FALSE,FALSE,TRUE,2023-04-11,2024-06-12,0,databricks/dolly-v2-12b,mit,1952,12,1.39711946227966,177,175,Dolly-V2-12B,822,+13/-9,3486,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b gemma-1.1-2b-it,google/gemma-1.1-2b-it_bfloat16_bf4924f313df5166dee1467161e886e55f2eb4d4_True,google/gemma-1.1-2b-it,bf4924f313df5166dee1467161e886e55f2eb4d4,bfloat16,chatmodels,Original,GemmaForCausalLM,7.77643528435205,TRUE,IFEval,0.306748316688608,30.6748316688608,BBH,0.318463497481492,5.86282672277435,MATH Level 5,0.00151057401812689,0.151057401812689,GPQA,0.269295302013423,2.57270693512304,MUSR,0.339395833333333,2.02447916666667,MMLU-PRO,0.148354388297872,5.3727098108747,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-2b-it,gemma,152,2.506,0.32921478142276,156,149,Gemma-1.1-2b-it,1021,+5/-4,11353,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it gemma-1.1-7b-it,google/gemma-1.1-7b-it_bfloat16_16128b0aeb50762ea96430c0c06a37941bf9f274_True,google/gemma-1.1-7b-it,16128b0aeb50762ea96430c0c06a37941bf9f274,bfloat16,chatmodels,Original,GemmaForCausalLM,17.4795862430713,TRUE,IFEval,0.503910734628563,50.3910734628563,BBH,0.393529796283325,15.9342093850132,MATH Level 5,0.0362537764350453,3.62537764350453,GPQA,0.293624161073826,5.8165548098434,MUSR,0.423020833333333,11.5109375,MMLU-PRO,0.258394281914894,17.5993646572104,TRUE,FALSE,FALSE,FALSE,TRUE,2024-03-26,2024-06-12,0,google/gemma-1.1-7b-it,gemma,267,8.538,0.578299189963354,124,116,Gemma-1.1-7B-it,1084,+3/-4,25072,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -gemma-2-27b-it,google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,473,27.227,4.82621118669274,50,44,Gemma-2-27B-it,1220,+2/-3,69149,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-27b-it -gemma-2-2b-it,google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,806,2.614,1.23474327420585,93,109,Gemma-2-2b-it,1142,+3/-3,38514,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it -gemma-2-9b-it,google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,602,9,5.01449702077493,70,64,Gemma-2-9B-it,1191,+3/-4,46948,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it +gemma-2-27b-it,google/gemma-2-27b-it_bfloat16_f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b_True,google/gemma-2-27b-it,f6c533e5eb013c7e31fc74ef042ac4f3fb5cf40b,bfloat16,chatmodels,Original,Gemma2ForCausalLM,32.3223187688799,TRUE,IFEval,0.797767700811624,79.7767700811624,BBH,0.64513874331688,49.2728421513039,MATH Level 5,0.00755287009063444,0.755287009063444,GPQA,0.375,16.6666666666667,MUSR,0.403302083333333,9.11276041666667,MMLU-PRO,0.445146276595745,38.3495862884161,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-08-07,1,google/gemma-2-27b,gemma,474,27.227,4.82621118669274,50,44,Gemma-2-27B-it,1220,+2/-3,69149,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-27b-it +gemma-2-2b-it,google/gemma-2-2b-it_bfloat16_2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f_True,google/gemma-2-2b-it,2b6ac3ff954ad896c115bbfa1b571cd93ea2c20f,bfloat16,fine-tunedondomain-specificdatasets,Original,InternLM2ForCausalLM,17.0469392949665,TRUE,IFEval,0.566833778817981,56.6833778817981,BBH,0.419923089142747,17.9807928815234,MATH Level 5,0.000755287009063444,0.0755287009063444,GPQA,0.274328859060403,3.24384787472036,MUSR,0.392885416666667,7.07734375,MMLU-PRO,0.25498670212766,17.2207446808511,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-07-31,1,google/gemma-2-2b,gemma,811,2.614,1.23474327420585,93,109,Gemma-2-2b-it,1142,+3/-3,38514,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it +gemma-2-9b-it,google/gemma-2-9b-it_bfloat16_1937c70277fcc5f7fb0fc772fc5bc69378996e71_True,google/gemma-2-9b-it,1937c70277fcc5f7fb0fc772fc5bc69378996e71,bfloat16,chatmodels,Original,Gemma2ForCausalLM,28.8627904641512,TRUE,IFEval,0.743562636027961,74.3562636027961,BBH,0.599034250416413,42.1366196836647,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.360738255033557,14.7651006711409,MUSR,0.407270833333333,9.7421875,MMLU-PRO,0.387549867021277,31.9499852245863,TRUE,FALSE,FALSE,FALSE,TRUE,2024-06-24,2024-07-11,1,google/gemma-2-9b,gemma,604,9,5.01449702077493,70,64,Gemma-2-9B-it,1191,+3/-4,46948,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it gemma-2-9b-it-simpo,princeton-nlp/gemma-2-9b-it-SimPO_bfloat16_8c87091f412e3aa6f74f66bd86c57fb81cbc3fde_True,princeton-nlp/gemma-2-9b-it-SimPO,8c87091f412e3aa6f74f66bd86c57fb81cbc3fde,bfloat16,chatmodels,Original,Gemma2ForCausalLM,21.1616516275693,TRUE,IFEval,0.320685780396016,32.0685780396016,BBH,0.583917992316212,40.0934299163717,MATH Level 5,0,0,GPQA,0.335570469798658,11.4093959731544,MUSR,0.412322916666667,10.3403645833333,MMLU-PRO,0.397523271276596,33.0581412529551,TRUE,FALSE,FALSE,FALSE,FALSE,2024-07-16,2024-08-10,2,google/gemma-2-9b,mit,137,9.242,2.76900372425403,50,44,Gemma-2-9B-it-SimPO,1216,+5/-7,10567,Princeton,MIT,2024/7,https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO -gemma-2b-it,google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,685,2.506,0.352950331047759,165,163,Gemma-2B-it,989,+7/-8,4922,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +gemma-2b-it,google/gemma-2b-it_bfloat16_de144fb2268dee1066f515465df532c05e699d48_True,google/gemma-2b-it,de144fb2268dee1066f515465df532c05e699d48,bfloat16,chatmodels,Original,GemmaForCausalLM,7.22145367714292,TRUE,IFEval,0.269029508371122,26.9029508371122,BBH,0.315081919887885,5.21430302216362,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.278523489932886,3.80313199105145,MUSR,0.334125,3.03229166666667,MMLU-PRO,0.13530585106383,3.92287234042553,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-08,2024-06-12,0,google/gemma-2b-it,gemma,686,2.506,0.352950331047759,165,163,Gemma-2B-it,989,+7/-8,4922,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it gemma-7b-it,google/gemma-7b-it_bfloat16_18329f019fb74ca4b24f97371785268543d687d2_True,google/gemma-7b-it,18329f019fb74ca4b24f97371785268543d687d2,bfloat16,chatmodels,Original,GemmaForCausalLM,12.8681419014102,TRUE,IFEval,0.386832493339894,38.6832493339894,BBH,0.364558292227017,11.8800913445494,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.284395973154362,4.58612975391499,MUSR,0.427427083333333,12.5283854166667,MMLU-PRO,0.169464760638298,7.71830673758865,TRUE,FALSE,FALSE,FALSE,TRUE,2024-02-13,2024-06-12,1,google/gemma-7b,gemma,1143,8.538,1.0999544452693,147,143,Gemma-7B-it,1037,+6/-6,9179,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it granite-3.0-2b-instruct,ibm-granite/granite-3.0-2b-instruct_bfloat16_342f92f4a0b4d6d83c0b61dc6c122e253a4efebd_True,ibm-granite/granite-3.0-2b-instruct,342f92f4a0b4d6d83c0b61dc6c122e253a4efebd,bfloat16,chatmodels,Original,GraniteForCausalLM,18.3205664133779,TRUE,IFEval,0.513977357854936,51.3977357854936,BBH,0.441197720626303,21.7378914109024,MATH Level 5,0.0876132930513595,8.76132930513595,GPQA,0.299496644295302,6.59955257270694,MUSR,0.351489583333333,1.26953125,MMLU-PRO,0.281416223404255,20.1573581560284,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,"",1,ibm-granite/granite-3.0-2b-instruct (Merge),apache-2.0,46,2.634,1.01894808156813,128,123,Granite-3.0-2B-Instruct,1074,+7/-6,7240,IBM,Apache 2.0,Unknown,https://huggingface.co/ibm-granite/granite-3.0-2b-instruct granite-3.0-8b-instruct,ibm-granite/granite-3.0-8b-instruct_bfloat16_e0a466fb25b9e07e9c2dc93380a360189700d1f8_True,ibm-granite/granite-3.0-8b-instruct,e0a466fb25b9e07e9c2dc93380a360189700d1f8,bfloat16,chatmodels,Original,GraniteForCausalLM,23.8640332348529,TRUE,IFEval,0.530963399335984,53.0963399335984,BBH,0.519187463184023,31.5881590647151,MATH Level 5,0.132175226586103,13.2175226586103,GPQA,0.332214765100671,10.9619686800895,MUSR,0.3900625,7.02447916666667,MMLU-PRO,0.345661569148936,27.2957299054374,TRUE,FALSE,FALSE,FALSE,TRUE,2024-10-02,2024-10-20,1,ibm-granite/granite-3.0-8b-instruct (Merge),apache-2.0,196,8.171,1.7129925870079,116,109,Granite-3.0-8B-Instruct,1094,+6/-7,7068,IBM,Apache 2.0,Unknown,https://huggingface.co/ibm-granite/granite-3.0-8b-instruct llama-13b,huggyllama/llama-13b_float16_bf57045473f207bb1de1ed035ace226f4d9f9bba_False,huggyllama/llama-13b,bf57045473f207bb1de1ed035ace226f4d9f9bba,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,9.29147946431344,FALSE,IFEval,0.241052629245956,24.1052629245956,BBH,0.398789255811746,16.1457073769258,MATH Level 5,0.0143504531722054,1.43504531722054,GPQA,0.25503355704698,0.671140939597318,MUSR,0.34621875,2.81067708333333,MMLU-PRO,0.195229388297872,10.581043144208,TRUE,FALSE,FALSE,FALSE,FALSE,2023-04-03,2024-07-04,0,huggyllama/llama-13b,other,138,13.016,1.1061405985716,178,176,LLaMA-13B,800,+14/-14,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 llama-3-8b-instruct,AI-Sweden-Models/Llama-3-8B-instruct_bfloat16_4e1c955228bdb4d69c1c4560e8d5872312a8f033_True,AI-Sweden-Models/Llama-3-8B-instruct,4e1c955228bdb4d69c1c4560e8d5872312a8f033,bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,13.7772044149452,TRUE,IFEval,0.240128414828211,24.0128414828211,BBH,0.41734601545153,18.3880956150275,MATH Level 5,0.00453172205438067,0.453172205438067,GPQA,0.265939597315436,2.12527964205817,MUSR,0.47709375,19.93671875,MMLU-PRO,0.259724069148936,17.7471187943262,TRUE,FALSE,FALSE,FALSE,FALSE,2024-06-01,2024-06-27,2,meta-llama/Meta-Llama-3-8B,llama3,10,8.03,1.16611088086752,88,91,Llama-3-8B-Instruct,1152,+3/-3,109267,Meta,Llama 3 Community,2023/3,https://llama.meta.com/llama3/ -llama-3.3-70b-instruct,meta-llama/Llama-3.3-70B-Instruct_bfloat16__False,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,36.8288410384085,FALSE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-09,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1284,70.554,38.2795370537265,28,20,Llama-3.3-70B-Instruct,1256,+5/-5,8907,Meta,Llama-3.3,Unknown,https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct -meta-llama-3.1-70b-instruct,meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,754,70.554,26.8020157168701,36,40,Meta-Llama-3.1-70B-Instruct,1248,+3/-3,58794,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -meta-llama-3.1-8b-instruct,meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3318,8.03,2.48701186834409,77,99,Meta-Llama-3.1-8B-Instruct,1176,+3/-3,52712,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +llama-3.3-70b-instruct,meta-llama/Llama-3.3-70B-Instruct_bfloat16__False,meta-llama/Llama-3.3-70B-Instruct,"",bfloat16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,36.8288410384085,FALSE,IFEval,0.899758197139146,89.9758197139146,BBH,0.691931282832581,56.5614107880222,MATH Level 5,0.00226586102719033,0.226586102719033,GPQA,0.328859060402685,10.5145413870246,MUSR,0.446125,15.565625,MMLU-PRO,0.533161569148936,48.1290632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-26,2024-12-09,1,meta-llama/Llama-3.3-70B-Instruct (Merge),llama3.3,1298,70.554,38.2795370537265,28,20,Llama-3.3-70B-Instruct,1256,+5/-5,8907,Meta,Llama-3.3,Unknown,https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct +meta-llama-3.1-70b-instruct,meta-llama/Meta-Llama-3.1-70B-Instruct_bfloat16_b9461463b511ed3c0762467538ea32cf7c9669f2_True,meta-llama/Meta-Llama-3.1-70B-Instruct,b9461463b511ed3c0762467538ea32cf7c9669f2,bfloat16,chatmodels,Original,LlamaForCausalLM,42.1763127975088,TRUE,IFEval,0.866885419575615,86.6885419575615,BBH,0.691728745366365,55.9279917389847,MATH Level 5,0.306646525679758,30.6646525679758,GPQA,0.356543624161074,14.2058165548098,MUSR,0.4580625,17.6911458333333,MMLU-PRO,0.530917553191489,47.8797281323877,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-16,2024-08-15,1,meta-llama/Meta-Llama-3.1-70B,llama3.1,755,70.554,26.8020157168701,36,40,Meta-Llama-3.1-70B-Instruct,1248,+3/-3,58794,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +meta-llama-3.1-8b-instruct,meta-llama/Meta-Llama-3.1-8B-Instruct_bfloat16_df34336b42332c6d360959e259cd6271c6a09fd4_True,meta-llama/Meta-Llama-3.1-8B-Instruct,df34336b42332c6d360959e259cd6271c6a09fd4,bfloat16,chatmodels,Original,LlamaForCausalLM,28.2044584981019,TRUE,IFEval,0.785577822400121,78.5577822400121,BBH,0.507326783896146,29.8927563524528,MATH Level 5,0.193353474320242,19.3353474320242,GPQA,0.26761744966443,2.3489932885906,MUSR,0.386989583333333,8.40703125,MMLU-PRO,0.376163563829787,30.6848404255319,TRUE,FALSE,FALSE,FALSE,TRUE,2024-07-18,2024-08-15,1,meta-llama/Meta-Llama-3.1-8B,llama3.1,3325,8.03,2.48701186834409,77,99,Meta-Llama-3.1-8B-Instruct,1176,+3/-3,52712,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ mistral-7b-instruct-v0.1,mistralai/Mistral-7B-Instruct-v0.1_bfloat16_73068f3702d050a2fd5aa2ca1e612e5036429398_True,mistralai/Mistral-7B-Instruct-v0.1,73068f3702d050a2fd5aa2ca1e612e5036429398,bfloat16,chatmodels,Original,MistralForCausalLM,12.6957006941243,TRUE,IFEval,0.448706099815157,44.8706099815157,BBH,0.33548084759811,7.64702053582754,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.25,0,MUSR,0.384760416666667,6.12838541666667,MMLU-PRO,0.241439494680851,15.7154994089835,TRUE,FALSE,FALSE,FALSE,TRUE,2023-09-27,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,1538,7.242,1.21604471748007,160,157,Mistral-7B-Instruct-v0.1,1008,+6/-5,9143,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 -mistral-7b-instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2600,7.242,0.534406629050985,129,134,Mistral-7B-Instruct-v0.2,1072,+5/-4,20066,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +mistral-7b-instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2_bfloat16_41b61a33a2483885c981aa79e0df6b32407ed873_True,mistralai/Mistral-7B-Instruct-v0.2,41b61a33a2483885c981aa79e0df6b32407ed873,bfloat16,chatmodels,Original,MistralForCausalLM,18.4575391254667,TRUE,IFEval,0.549622778671702,54.9622778671702,BBH,0.445973552032928,22.9106019367136,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.276006711409396,3.4675615212528,MUSR,0.396604166666667,7.60885416666667,MMLU-PRO,0.271692154255319,19.0769060283688,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-11,2024-06-12,0,mistralai/Mistral-7B-Instruct-v0.2,apache-2.0,2601,7.242,0.534406629050985,129,134,Mistral-7B-Instruct-v0.2,1072,+5/-4,20066,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 mixtral-8x22b-instruct-v0.1,mistralai/Mixtral-8x22B-Instruct-v0.1_bfloat16_b0c3516041d014f640267b14feb4e9a84c8e8c71_True,mistralai/Mixtral-8x22B-Instruct-v0.1,b0c3516041d014f640267b14feb4e9a84c8e8c71,bfloat16,chatmodels,Original,MixtralForCausalLM,33.885680288082,TRUE,IFEval,0.718358400156031,71.8358400156031,BBH,0.612492492627202,44.1143455872484,MATH Level 5,0.187311178247734,18.7311178247734,GPQA,0.373322147651007,16.4429530201342,MUSR,0.431114583333333,13.4893229166667,MMLU-PRO,0.448304521276596,38.7005023640662,TRUE,FALSE,TRUE,FALSE,TRUE,2024-04-16,2024-06-12,1,mistralai/Mixtral-8x22B-v0.1,apache-2.0,696,140.621,47.147578592378,90,85,Mixtral-8x22b-Instruct-v0.1,1148,+3/-3,53823,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -mixtral-8x7b-instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4235,46.703,13.7649393661468,109,110,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76152,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mixtral-8x7b-instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1_bfloat16_1e637f2d7cb0a9d6fb1922f305cb784995190a83_True,mistralai/Mixtral-8x7B-Instruct-v0.1,1e637f2d7cb0a9d6fb1922f305cb784995190a83,bfloat16,chatmodels,Original,MixtralForCausalLM,23.8422789394817,TRUE,IFEval,0.559914360563305,55.9914360563305,BBH,0.496236540133565,29.7423983809673,MATH Level 5,0.0929003021148036,9.29003021148036,GPQA,0.302852348993289,7.04697986577182,MUSR,0.420322916666667,11.0736979166667,MMLU-PRO,0.369182180851064,29.9091312056738,TRUE,FALSE,TRUE,FALSE,TRUE,2023-12-10,2024-06-12,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,4241,46.703,13.7649393661468,109,110,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76152,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ nous-hermes-2-mixtral-8x7b-dpo,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO_bfloat16_286ae6737d048ad1d965c2e830864df02db50f2f_True,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,286ae6737d048ad1d965c2e830864df02db50f2f,bfloat16,chatmodels,Original,MixtralForCausalLM,27.290249854483,TRUE,IFEval,0.58968980083955,58.968980083955,BBH,0.553885138403382,37.1077837913399,MATH Level 5,0.118580060422961,11.8580060422961,GPQA,0.321308724832215,9.50782997762864,MUSR,0.459541666666667,16.6760416666667,MMLU-PRO,0.366605718085106,29.6228575650118,TRUE,FALSE,TRUE,FALSE,TRUE,2024-01-11,2024-07-27,1,mistralai/Mixtral-8x7B-v0.1,apache-2.0,420,46.703,12.8651437241499,121,130,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3835,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO openchat-3.5-0106,openchat/openchat-3.5-0106_bfloat16_ff058fda49726ecf4ea53dc1635f917cdb8ba36b_True,openchat/openchat-3.5-0106,ff058fda49726ecf4ea53dc1635f917cdb8ba36b,bfloat16,fine-tunedondomain-specificdatasets,Original,MistralForCausalLM,22.6586834330757,TRUE,IFEval,0.595135351977198,59.5135351977198,BBH,0.461697870839606,24.0387112139116,MATH Level 5,0.074773413897281,7.4773413897281,GPQA,0.307885906040268,7.71812080536913,MUSR,0.4254375,11.7463541666667,MMLU-PRO,0.329122340425532,25.4580378250591,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-07,2024-06-27,1,mistralai/Mistral-7B-v0.1,apache-2.0,348,7.242,2.35495886433684,121,114,OpenChat-3.5-0106,1091,+4/-5,12985,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 openhermes-2.5-mistral-7b,teknium/OpenHermes-2.5-Mistral-7B_bfloat16_24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33_True,teknium/OpenHermes-2.5-Mistral-7B,24c0bea14d53e6f67f1fbe2eca5bfe7cae389b33,bfloat16,chatmodels,Original,MistralForCausalLM,21.2668365601522,TRUE,IFEval,0.557141717310071,55.7141717310071,BBH,0.487001325992498,27.7700263678076,MATH Level 5,0.047583081570997,4.7583081570997,GPQA,0.283557046979866,4.47427293064877,MUSR,0.424197916666667,12.0580729166667,MMLU-PRO,0.305435505319149,22.8261672576832,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-29,2024-06-12,1,mistralai/Mistral-7B-v0.1,apache-2.0,818,7.242,0.472783300310566,128,119,OpenHermes-2.5-Mistral-7B,1074,+8/-8,5089,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B phi-3-medium-4k-instruct,microsoft/Phi-3-medium-4k-instruct_bfloat16_d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc_True,microsoft/Phi-3-medium-4k-instruct,d194e4e74ffad5a5e193e26af25bcfc80c7f1ffc,bfloat16,chatmodels,Original,Phi3ForCausalLM,32.8962495702928,TRUE,IFEval,0.642271395452954,64.2271395452954,BBH,0.641246489055555,49.3806100742202,MATH Level 5,0.183534743202417,18.3534743202417,GPQA,0.336409395973154,11.5212527964206,MUSR,0.42575,13.0520833333333,MMLU-PRO,0.467586436170213,40.8429373522459,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-12,0,microsoft/Phi-3-medium-4k-instruct,mit,211,13.96,1.45526252332937,102,109,Phi-3-Medium-4k-Instruct,1123,+4/-4,26122,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -phi-3-mini-128k-instruct,microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1617,3.821,24.2222515926888,147,143,Phi-3-Mini-128k-Instruct,1037,+4/-4,21636,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1092,3.821,0.804074829912372,131,139,Phi-3-Mini-4k-Instruct,1066,+4/-4,21097,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1092,3.821,0.786699265454341,131,139,Phi-3-Mini-4k-Instruct,1066,+4/-4,21097,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-128k-instruct,microsoft/Phi-3-mini-128k-instruct_bfloat16_5be6479b4bc06a081e8f4c6ece294241ccd32dec_True,microsoft/Phi-3-mini-128k-instruct,5be6479b4bc06a081e8f4c6ece294241ccd32dec,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.6262872732554,TRUE,IFEval,0.597633168880792,59.7633168880792,BBH,0.557453179267985,37.0997666322403,MATH Level 5,0.0974320241691843,9.74320241691843,GPQA,0.317953020134228,9.06040268456376,MUSR,0.3936875,7.7109375,MMLU-PRO,0.373420877659575,30.3800975177305,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-08-21,0,microsoft/Phi-3-mini-128k-instruct,mit,1618,3.821,24.2222515926888,147,143,Phi-3-Mini-128k-Instruct,1037,+4/-4,21636,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ +phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_bfloat16_ff07dc01615f8113924aed013115ab2abd32115b_True,microsoft/Phi-3-mini-4k-instruct,ff07dc01615f8113924aed013115ab2abd32115b,bfloat16,chatmodels,Original,Phi3ForCausalLM,25.9677326380416,TRUE,IFEval,0.561288492311511,56.1288492311511,BBH,0.567597262633488,39.2693352377728,MATH Level 5,0.11631419939577,11.631419939577,GPQA,0.319630872483222,9.2841163310962,MUSR,0.395020833333333,7.64427083333334,MMLU-PRO,0.386635638297872,31.8484042553192,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-06-12,0,microsoft/Phi-3-mini-4k-instruct,mit,1093,3.821,0.804074829912372,131,139,Phi-3-Mini-4k-Instruct,1066,+4/-4,21097,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-4k-instruct,microsoft/Phi-3-mini-4k-instruct_float16_c1358f8a35e6d2af81890deffbbfa575b978c62f_True,microsoft/Phi-3-mini-4k-instruct,c1358f8a35e6d2af81890deffbbfa575b978c62f,float16,chatmodels,Original,Phi3ForCausalLM,27.4111166417796,TRUE,IFEval,0.547674614467391,54.7674614467391,BBH,0.549071891949582,36.5598553051879,MATH Level 5,0.154833836858006,15.4833836858006,GPQA,0.332214765100671,10.9619686800895,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.402177526595745,33.5752807328605,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-22,2024-07-02,0,microsoft/Phi-3-mini-4k-instruct,mit,1093,3.821,0.786699265454341,131,139,Phi-3-Mini-4k-Instruct,1066,+4/-4,21097,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct phi-3-mini-4k-instruct,unsloth/Phi-3-mini-4k-instruct_float16_636c707430a5509c80b1aa51d05c127ed339a975_True,unsloth/Phi-3-mini-4k-instruct,636c707430a5509c80b1aa51d05c127ed339a975,float16,basemergesandmoerges,Original,MistralForCausalLM,27.1783743374799,TRUE,IFEval,0.544027624480822,54.4027624480822,BBH,0.550023946744103,36.732473265614,MATH Level 5,0.154078549848943,15.4078549848943,GPQA,0.322986577181208,9.73154362416107,MUSR,0.428416666666667,13.11875,MMLU-PRO,0.403091755319149,33.6768617021277,TRUE,FALSE,FALSE,FALSE,FALSE,2024-04-29,2024-11-25,0,unsloth/Phi-3-mini-4k-instruct,mit,41,3.821,0.469533108024419,131,139,Phi-3-Mini-4k-Instruct,1066,+4/-4,21097,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct phi-3-small-8k-instruct,microsoft/Phi-3-small-8k-instruct_bfloat16_1535ae26fb4faada95c6950e8bc6e867cdad6b00_True,microsoft/Phi-3-small-8k-instruct,1535ae26fb4faada95c6950e8bc6e867cdad6b00,bfloat16,chatmodels,Original,Phi3SmallForCausalLM,29.6709218521057,TRUE,IFEval,0.649665110794913,64.9665110794913,BBH,0.620836488087056,46.2055703663891,MATH Level 5,0.0284301430770108,2.84301430770108,GPQA,0.312080536912752,8.27740492170022,MUSR,0.455791666666667,16.7739583333333,MMLU-PRO,0.45063164893617,38.9590721040189,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-07,2024-06-13,0,microsoft/Phi-3-small-8k-instruct,mit,159,7.392,1.0254536035218,113,116,Phi-3-Small-8k-Instruct,1102,+4/-4,18503,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct qwen1.5-110b-chat,Qwen/Qwen1.5-110B-Chat_bfloat16_85f86cec25901f2dbd870a86e06756903c9a876a_True,Qwen/Qwen1.5-110B-Chat,85f86cec25901f2dbd870a86e06756903c9a876a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,29.2248366843256,TRUE,IFEval,0.593886443525402,59.3886443525402,BBH,0.618380038558863,44.9845452561663,MATH Level 5,0,0,GPQA,0.341442953020134,12.1923937360179,MUSR,0.452166666666667,16.2875,MMLU-PRO,0.482463430851064,42.4959367612293,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-25,2024-06-12,0,Qwen/Qwen1.5-110B-Chat,other,123,111.21,72.5652930561157,85,79,Qwen1.5-110B-Chat,1161,+3/-4,27458,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ @@ -36,10 +36,10 @@ qwen1.5-14b-chat,Qwen/Qwen1.5-14B-Chat_bfloat16_9492b22871f43e975435455f5c616c77 qwen1.5-32b-chat,Qwen/Qwen1.5-32B-Chat_bfloat16_0997b012af6ddd5465d40465a8415535b2f06cfc_True,Qwen/Qwen1.5-32B-Chat,0997b012af6ddd5465d40465a8415535b2f06cfc,bfloat16,chatmodels,Original,Qwen2ForCausalLM,27.1930170704966,TRUE,IFEval,0.553219900973861,55.3219900973861,BBH,0.606689975793023,44.5548540239164,MATH Level 5,0.0717522658610272,7.17522658610272,GPQA,0.306208053691275,7.49440715883669,MUSR,0.415979166666667,10.1973958333333,MMLU-PRO,0.445728058510638,38.4142287234043,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-03,2024-06-12,0,Qwen/Qwen1.5-32B-Chat,other,108,32.512,46.0594497310076,101,103,Qwen1.5-32B-Chat,1125,+4/-4,22762,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ qwen1.5-4b-chat,Qwen/Qwen1.5-4B-Chat_bfloat16_a7a4d4945d28bac955554c9abd2f74a71ebbf22f_True,Qwen/Qwen1.5-4B-Chat,a7a4d4945d28bac955554c9abd2f74a71ebbf22f,bfloat16,chatmodels,Original,Qwen2ForCausalLM,12.3377534239841,TRUE,IFEval,0.315665766832006,31.5665766832006,BBH,0.400554856114861,16.2970785289083,MATH Level 5,0.0105740181268882,1.05740181268882,GPQA,0.266778523489933,2.23713646532438,MUSR,0.39778125,7.35598958333333,MMLU-PRO,0.239611037234043,15.5123374704492,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-4B-Chat,other,38,3.95,0.866150647838799,165,161,Qwen1.5-4B-Chat,988,+7/-8,7812,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ qwen1.5-7b-chat,Qwen/Qwen1.5-7B-Chat_bfloat16_5f4f5e69ac7f1d508f8369e977de208b4803444b_True,Qwen/Qwen1.5-7B-Chat,5f4f5e69ac7f1d508f8369e977de208b4803444b,bfloat16,chatmodels,Original,Qwen2ForCausalLM,16.5761729315825,TRUE,IFEval,0.437115741787347,43.7115741787347,BBH,0.451005311652135,22.3791295999528,MATH Level 5,0,0,GPQA,0.302852348993289,7.04697986577182,MUSR,0.37790625,4.63828125,MMLU-PRO,0.295129654255319,21.6810726950355,TRUE,FALSE,FALSE,FALSE,TRUE,2024-01-30,2024-06-12,0,Qwen/Qwen1.5-7B-Chat,other,164,7.721,1.07882659669136,129,134,Qwen1.5-7B-Chat,1070,+9/-10,4866,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen2-72b-instruct,Qwen/Qwen2-72B-Instruct_bfloat16_1af63c698f59c4235668ec9c1395468cb7cd7e79_False,Qwen/Qwen2-72B-Instruct,1af63c698f59c4235668ec9c1395468cb7cd7e79,bfloat16,chatmodels,Original,Qwen2ForCausalLM,42.9143041555209,FALSE,IFEval,0.7989168738946,79.89168738946,BBH,0.697730968386067,57.483009118763,MATH Level 5,0.376888217522659,37.6888217522659,GPQA,0.37248322147651,16.331096196868,MUSR,0.456010416666667,17.16796875,MMLU-PRO,0.540309175531915,48.9232417257683,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-28,2024-06-26,1,Qwen/Qwen2-72B,other,691,72.706,37.5539744227,70,63,Qwen2-72B-Instruct,1187,+3/-3,38963,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ -qwen2.5-72b-instruct,Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,629,72.706,33.0067683243991,29,35,Qwen2.5-72B-Instruct,1258,+4/-4,36753,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ -qwen2.5-coder-32b-instruct,Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1364,32,4.69438966297979,49,53,Qwen2.5-Coder-32B-Instruct,1217,+7/-7,5748,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct -qwq-32b-preview,Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1416,32.764,10.2103897762396,86,119,QwQ-32B-Preview,1152,+8/-11,3294,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/QwQ-32B-Preview +qwen2-72b-instruct,Qwen/Qwen2-72B-Instruct_bfloat16_1af63c698f59c4235668ec9c1395468cb7cd7e79_False,Qwen/Qwen2-72B-Instruct,1af63c698f59c4235668ec9c1395468cb7cd7e79,bfloat16,chatmodels,Original,Qwen2ForCausalLM,42.9143041555209,FALSE,IFEval,0.7989168738946,79.89168738946,BBH,0.697730968386067,57.483009118763,MATH Level 5,0.376888217522659,37.6888217522659,GPQA,0.37248322147651,16.331096196868,MUSR,0.456010416666667,17.16796875,MMLU-PRO,0.540309175531915,48.9232417257683,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-28,2024-06-26,1,Qwen/Qwen2-72B,other,692,72.706,37.5539744227,70,63,Qwen2-72B-Instruct,1187,+3/-3,38963,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ +qwen2.5-72b-instruct,Qwen/Qwen2.5-72B-Instruct_bfloat16_a13fff9ad76700c7ecff2769f75943ba8395b4a7_True,Qwen/Qwen2.5-72B-Instruct,a13fff9ad76700c7ecff2769f75943ba8395b4a7,bfloat16,chatmodels,Original,Qwen2ForCausalLM,38.2120812616148,TRUE,IFEval,0.863837949972739,86.3837949972739,BBH,0.727274732174482,61.8732556687879,MATH Level 5,0.0120845921450151,1.20845921450151,GPQA,0.375,16.6666666666667,MUSR,0.420604166666667,11.7421875,MMLU-PRO,0.562583111702128,51.3981235224587,TRUE,FALSE,FALSE,FALSE,TRUE,2024-09-16,2024-10-16,1,Qwen/Qwen2.5-72B,other,632,72.706,33.0067683243991,29,35,Qwen2.5-72B-Instruct,1258,+4/-4,36753,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ +qwen2.5-coder-32b-instruct,Qwen/Qwen2.5-Coder-32B-Instruct_float16_b47205940b83b5b484577359f71ee7b88472df67_False,Qwen/Qwen2.5-Coder-32B-Instruct,b47205940b83b5b484577359f71ee7b88472df67,float16,chatmodels,Original,Qwen2ForCausalLM,38.7525412608276,FALSE,IFEval,0.726526726862503,72.6526726862503,BBH,0.662522222240513,52.2665152094361,MATH Level 5,0.427492447129909,42.7492447129909,GPQA,0.348993288590604,13.1991051454139,MUSR,0.438583333333333,13.7229166666667,MMLU-PRO,0.441323138297872,37.924793144208,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-06,2024-12-10,1,Qwen/Qwen2.5-Coder-32B-Instruct (Merge),apache-2.0,1368,32,4.69438966297979,49,53,Qwen2.5-Coder-32B-Instruct,1217,+7/-7,5748,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct +qwq-32b-preview,Qwen/QwQ-32B-Preview_bfloat16_1032e81cb936c486aae1d33da75b2fbcd5deed4a_True,Qwen/QwQ-32B-Preview,1032e81cb936c486aae1d33da75b2fbcd5deed4a,bfloat16,chatmodels,Original,Qwen2ForCausalLM,30.444123257489,TRUE,IFEval,0.403543708471301,40.3543708471301,BBH,0.669138148225274,53.3876763517132,MATH Level 5,0.228851963746224,22.8851963746224,GPQA,0.281879194630873,4.25055928411634,MUSR,0.410989583333333,9.80703125,MMLU-PRO,0.56781914893617,51.9799054373523,TRUE,FALSE,FALSE,FALSE,TRUE,2024-11-27,2024-11-29,2,Qwen/Qwen2.5-32B,apache-2.0,1425,32.764,10.2103897762396,86,119,QwQ-32B-Preview,1152,+8/-11,3294,Alibaba,Apache 2.0,Unknown,https://huggingface.co/Qwen/QwQ-32B-Preview solar-10.7b-instruct-v1.0,upstage/SOLAR-10.7B-Instruct-v1.0_float16_c08c25ed66414a878fe0401a3596d536c083606c_True,upstage/SOLAR-10.7B-Instruct-v1.0,c08c25ed66414a878fe0401a3596d536c083606c,float16,chatmodels,Original,LlamaForCausalLM,19.6282553318946,TRUE,IFEval,0.473660997265035,47.3660997265035,BBH,0.516249494144699,31.8724018880021,MATH Level 5,0,0,GPQA,0.308724832214765,7.82997762863535,MUSR,0.3899375,6.9421875,MMLU-PRO,0.313829787234043,23.7588652482269,TRUE,FALSE,FALSE,FALSE,TRUE,2023-12-12,2024-06-12,1,upstage/SOLAR-10.7B-Instruct-v1.0 (Merge),cc-by-nc-4.0,619,10.732,0.782775785638588,130,134,SOLAR-10.7B-Instruct-v1.0,1062,+10/-9,4289,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 starling-lm-7b-alpha,berkeley-nest/Starling-LM-7B-alpha_bfloat16_1dddf3b95bc1391f6307299eb1c162c194bde9bd_True,berkeley-nest/Starling-LM-7B-alpha,1dddf3b95bc1391f6307299eb1c162c194bde9bd,bfloat16,chatmodels,Original,MistralForCausalLM,20.8267729304501,TRUE,IFEval,0.548049176185854,54.8049176185854,BBH,0.4440065261164,21.9540280871593,MATH Level 5,0.0830815709969789,8.30815709969789,GPQA,0.296979865771812,6.26398210290828,MUSR,0.412010416666667,9.50130208333333,MMLU-PRO,0.317154255319149,24.1282505910166,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-25,2024-06-12,0,berkeley-nest/Starling-LM-7B-alpha,apache-2.0,556,7.242,0.551628886692049,121,123,Starling-LM-7B-alpha,1089,+4/-6,10415,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha wizardlm-13b-v1.2,WizardLMTeam/WizardLM-13B-V1.2_float16_cf5f40382559f19e13874e45b39575171ca46ef8_False,WizardLMTeam/WizardLM-13B-V1.2,cf5f40382559f19e13874e45b39575171ca46ef8,float16,fine-tunedondomain-specificdatasets,Original,LlamaForCausalLM,15.164944624066,FALSE,IFEval,0.339246532533677,33.9246532533677,BBH,0.446199943646005,22.8886549780445,MATH Level 5,0.0181268882175227,1.81268882175227,GPQA,0.260906040268456,1.45413870246085,MUSR,0.43784375,14.03046875,MMLU-PRO,0.251911569148936,16.8790632387707,TRUE,FALSE,FALSE,FALSE,TRUE,2023-07-25,2024-06-12,0,WizardLMTeam/WizardLM-13B-V1.2,llama2,224,13,3.51945813008333,136,134,WizardLM-13b-v1.2,1059,+9/-6,7182,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 @@ -47,5 +47,5 @@ wizardlm-70b-v1.0,WizardLMTeam/WizardLM-70B-V1.0_float16_54aaecaff7d0790eb9f0ece yi-1.5-34b-chat,01-ai/Yi-1.5-34B-Chat_bfloat16_f3128b2d02d82989daae566c0a7eadc621ca3254_True,01-ai/Yi-1.5-34B-Chat,f3128b2d02d82989daae566c0a7eadc621ca3254,bfloat16,chatmodels,Original,LlamaForCausalLM,32.8922333485004,TRUE,IFEval,0.606675842320598,60.6675842320598,BBH,0.608374831027182,44.2628259810057,MATH Level 5,0.249244712990937,24.9244712990937,GPQA,0.36493288590604,15.324384787472,MUSR,0.428197916666667,13.0580729166667,MMLU-PRO,0.452044547872341,39.1160608747045,TRUE,FALSE,FALSE,FALSE,TRUE,2024-05-10,2024-06-12,0,01-ai/Yi-1.5-34B-Chat,apache-2.0,258,34.389,11.2119219336639,86,98,Yi-1.5-34B-Chat,1157,+3/-4,25152,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat yi-34b-chat,01-ai/Yi-34B-Chat_bfloat16_2e528b6a80fb064a0a746c5ca43114b135e30464_True,01-ai/Yi-34B-Chat,2e528b6a80fb064a0a746c5ca43114b135e30464,bfloat16,chatmodels,Original,LlamaForCausalLM,23.9623121996312,TRUE,IFEval,0.469888783982057,46.9888783982057,BBH,0.556087291076616,37.6239875972435,MATH Level 5,0.0468277945619335,4.68277945619335,GPQA,0.338087248322148,11.744966442953,MUSR,0.39784375,8.36380208333334,MMLU-PRO,0.409325132978723,34.3694592198582,TRUE,FALSE,FALSE,FALSE,TRUE,2023-11-22,2024-06-12,0,01-ai/Yi-34B-Chat,apache-2.0,345,34.389,12.5628478449908,107,114,Yi-34B-Chat,1111,+4/-5,15932,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat zephyr-7b-alpha,HuggingFaceH4/zephyr-7b-alpha_bfloat16_2ce2d025864af849b3e5029e2ec9d568eeda892d_True,HuggingFaceH4/zephyr-7b-alpha,2ce2d025864af849b3e5029e2ec9d568eeda892d,bfloat16,chatmodels,Original,MistralForCausalLM,18.5718642203846,TRUE,IFEval,0.519148082642943,51.9148082642943,BBH,0.458786350590441,23.9552914270685,MATH Level 5,0.0173716012084592,1.73716012084592,GPQA,0.297818791946309,6.3758389261745,MUSR,0.394958333333333,7.503125,MMLU-PRO,0.279504654255319,19.9449615839244,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-09,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1103,7.242,0.79567519919312,142,139,Zephyr-7B-alpha,1041,+14/-14,1814,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha -zephyr-7b-beta,HuggingFaceH4/zephyr-7b-beta_bfloat16_b70e0c9a2d9e14bd1e812d3c398e5f313e93b473_True,HuggingFaceH4/zephyr-7b-beta,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,bfloat16,chatmodels,Original,MistralForCausalLM,17.767060993735,TRUE,IFEval,0.495043152169577,49.5043152169577,BBH,0.431582191918003,21.4875421828067,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.290268456375839,5.36912751677852,MUSR,0.392541666666667,7.734375,MMLU-PRO,0.278091755319149,19.7879728132388,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-26,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1621,7.242,0.555023090869454,142,142,Zephyr-7B-beta,1053,+5/-5,11333,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +zephyr-7b-beta,HuggingFaceH4/zephyr-7b-beta_bfloat16_b70e0c9a2d9e14bd1e812d3c398e5f313e93b473_True,HuggingFaceH4/zephyr-7b-beta,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,bfloat16,chatmodels,Original,MistralForCausalLM,17.767060993735,TRUE,IFEval,0.495043152169577,49.5043152169577,BBH,0.431582191918003,21.4875421828067,MATH Level 5,0.027190332326284,2.7190332326284,GPQA,0.290268456375839,5.36912751677852,MUSR,0.392541666666667,7.734375,MMLU-PRO,0.278091755319149,19.7879728132388,TRUE,FALSE,FALSE,FALSE,TRUE,2023-10-26,2024-06-12,1,mistralai/Mistral-7B-v0.1,mit,1627,7.242,0.555023090869454,142,142,Zephyr-7B-beta,1053,+5/-5,11333,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta zephyr-orpo-141b-a35b-v0.1,HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1_float16_a3be084543d278e61b64cd600f28157afc79ffd3_True,HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1,a3be084543d278e61b64cd600f28157afc79ffd3,float16,chatmodels,Original,MixtralForCausalLM,34.0630228005823,TRUE,IFEval,0.65108911022753,65.108911022753,BBH,0.629043972852409,47.5037962865412,MATH Level 5,0.200906344410876,20.0906344410876,GPQA,0.378355704697987,17.1140939597315,MUSR,0.446520833333333,14.7151041666667,MMLU-PRO,0.458610372340426,39.8455969267139,TRUE,FALSE,FALSE,FALSE,TRUE,2024-04-10,2024-06-12,1,mistral-community/Mixtral-8x22B-v0.1,apache-2.0,262,140.621,42.0677864230678,101,97,Zephyr-ORPO-141b-A35b-v0.1,1127,+7/-10,4862,HuggingFace,Apache 2.0,2024/4,https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1