diff --git a/csv/huggingface_v2.csv b/csv/huggingface_v2.csv index c2a73dd..9b88ffc 100644 --- a/csv/huggingface_v2.csv +++ b/csv/huggingface_v2.csv @@ -1,10 +1,11 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpqa_raw,musr,musr_raw,mmlupro,mmlupro_raw,type,architecture,weight_type,precision,not_merged,hub_license,params_b,hub_hearts,available_on_the_hub,model_sha,flagged,moe,submission_date,upload_to_hub_date,chat_template,maintainers_highlight,fullname,url 💬,MaziyarPanahi/Qwen2-72B-Instruct-v0.1,43.61,81.63,0.82,57.33,0.7,36.03,0.36,17.45,0.38,20.15,0.47,49.05,0.54,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,13,TRUE,0369c39770f45f2464587918f2dbdb8449ea3a0d,TRUE,TRUE,2024-06-26,2024-06-08,TRUE,FALSE,MaziyarPanahi/Qwen2-72B-Instruct-v0.1,https://huggingface.co/MaziyarPanahi/Qwen2-72B-Instruct-v0.1 -💬,Qwen/Qwen2-72B-Instruct,42.49,79.89,0.8,57.48,0.7,35.12,0.35,16.33,0.37,17.17,0.46,48.92,0.54,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,562,TRUE,1af63c698f59c4235668ec9c1395468cb7cd7e79,TRUE,TRUE,2024-06-26,2024-05-28,FALSE,TRUE,Qwen/Qwen2-72B-Instruct,https://huggingface.co/Qwen/Qwen2-72B-Instruct +💬,Qwen/Qwen2-72B-Instruct,42.49,79.89,0.8,57.48,0.7,35.12,0.35,16.33,0.37,17.17,0.46,48.92,0.54,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,563,TRUE,1af63c698f59c4235668ec9c1395468cb7cd7e79,TRUE,TRUE,2024-06-26,2024-05-28,FALSE,TRUE,Qwen/Qwen2-72B-Instruct,https://huggingface.co/Qwen/Qwen2-72B-Instruct 🔶,pankajmathur/orca_mini_v7_72b,39.06,59.3,0.59,55.06,0.68,26.44,0.26,18.01,0.39,24.21,0.51,51.35,0.56,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,72,6,TRUE,447f11912cfa496e32e188a55214043a05760d3a,TRUE,TRUE,2024-06-26,2024-06-26,FALSE,FALSE,pankajmathur/orca_mini_v7_72b,https://huggingface.co/pankajmathur/orca_mini_v7_72b 💬,MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.2,37.98,82.08,0.82,48.57,0.64,22.96,0.23,12.19,0.34,15.3,0.44,46.74,0.52,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,70,13,TRUE,95366b974baedee4d95c1e841bc3d15e94753804,TRUE,TRUE,2024-06-26,2024-04-27,TRUE,FALSE,MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.2,https://huggingface.co/MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.2 🔶,VAGOsolutions/Llama-3-SauerkrautLM-70b-Instruct,37.82,80.45,0.8,52.03,0.67,21.68,0.22,10.4,0.33,13.54,0.43,48.8,0.54,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,70,15,TRUE,707cfd1a93875247c0223e0c7e3d86d58c432318,TRUE,TRUE,2024-06-26,2024-04-24,TRUE,FALSE,VAGOsolutions/Llama-3-SauerkrautLM-70b-Instruct,https://huggingface.co/VAGOsolutions/Llama-3-SauerkrautLM-70b-Instruct -💬,meta-llama/Meta-Llama-3-70B-Instruct,36.18,80.99,0.81,50.19,0.65,23.34,0.23,4.92,0.29,10.92,0.42,46.74,0.52,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,70,1340,TRUE,7129260dd854a80eb10ace5f61c20324b472b31c,TRUE,TRUE,2024-06-12,2024-04-17,TRUE,TRUE,meta-llama/Meta-Llama-3-70B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instruct +💬,meta-llama/Meta-Llama-3-70B-Instruct,36.18,80.99,0.81,50.19,0.65,23.34,0.23,4.92,0.29,10.92,0.42,46.74,0.52,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,70,1343,TRUE,7129260dd854a80eb10ace5f61c20324b472b31c,TRUE,TRUE,2024-06-12,2024-04-17,TRUE,TRUE,meta-llama/Meta-Llama-3-70B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instruct +💬,meta-llama/Meta-Llama-3.1-70B-Instruct,35.97,84.28,0.84,54.45,0.68,2.72,0.03,8.84,0.32,17.32,0.46,48.19,0.53,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,bfloat16,TRUE,"",0,0,TRUE,b9461463b511ed3c0762467538ea32cf7c9669f2,TRUE,TRUE,"","",FALSE,TRUE,meta-llama/Meta-Llama-3.1-70B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3.1-70B-Instruct 🔶,Sao10K/L3-70B-Euryale-v2.1,35.35,73.84,0.74,48.7,0.65,20.85,0.21,10.85,0.33,12.25,0.42,45.6,0.51,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,70,90,TRUE,36ad832b771cd783ea7ad00ed39e61f679b1a7c6,TRUE,TRUE,2024-07-01,2024-06-11,TRUE,FALSE,Sao10K/L3-70B-Euryale-v2.1,https://huggingface.co/Sao10K/L3-70B-Euryale-v2.1 🔶,migtissera/Llama-3-70B-Synthia-v3.5,35.2,60.76,0.61,49.12,0.65,18.96,0.19,18.34,0.39,23.39,0.49,40.65,0.47,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,llama3,70,5,TRUE,8744db0bccfc18f1847633da9d29fc89b35b4190,TRUE,TRUE,2024-06-26,2024-05-26,TRUE,FALSE,migtissera/Llama-3-70B-Synthia-v3.5,https://huggingface.co/migtissera/Llama-3-70B-Synthia-v3.5 🟢,Qwen/Qwen2-72B,35.13,38.24,0.38,51.86,0.66,29.15,0.29,19.24,0.39,19.73,0.47,52.56,0.57,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,158,TRUE,87993795c78576318087f70b43fbf530eb7789e7,TRUE,TRUE,2024-06-26,2024-05-22,FALSE,TRUE,Qwen/Qwen2-72B,https://huggingface.co/Qwen/Qwen2-72B @@ -18,7 +19,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.4,32.18,50.27,0.5,48.4,0.64,22.66,0.23,11.97,0.34,13.1,0.43,46.71,0.52,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,70,10,TRUE,cb03e4d810b82d86e7cb01ab146bade09a5d06d1,TRUE,TRUE,2024-06-26,2024-04-28,TRUE,FALSE,MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.4,https://huggingface.co/MaziyarPanahi/Llama-3-70B-Instruct-DPO-v0.4 💬,cognitivecomputations/dolphin-2.9.2-qwen2-72b,32,40.38,0.4,47.7,0.63,21.37,0.21,16,0.37,17.04,0.45,49.52,0.55,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,46,TRUE,e79582577c2bf2af304221af0e8308b7e7d46ca1,TRUE,TRUE,2024-06-27,2024-05-27,TRUE,TRUE,cognitivecomputations/dolphin-2.9.2-qwen2-72b,https://huggingface.co/cognitivecomputations/dolphin-2.9.2-qwen2-72b 💬,MTSAIR/MultiVerse_70B,31.73,52.49,0.52,46.14,0.62,16.16,0.16,13.87,0.35,18.82,0.47,42.89,0.49,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,72,37,TRUE,063430cdc4d972a0884e3e3e3d45ea4afbdf71a2,TRUE,TRUE,2024-06-29,2024-03-25,FALSE,FALSE,MTSAIR/MultiVerse_70B,https://huggingface.co/MTSAIR/MultiVerse_70B -💬,CohereForAI/c4ai-command-r-plus,30.86,76.64,0.77,39.92,0.58,7.55,0.08,7.38,0.31,20.42,0.48,33.24,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",CohereForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,103,1593,TRUE,fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca,TRUE,TRUE,2024-06-13,2024-04-03,TRUE,TRUE,CohereForAI/c4ai-command-r-plus,https://huggingface.co/CohereForAI/c4ai-command-r-plus +💬,CohereForAI/c4ai-command-r-plus,30.86,76.64,0.77,39.92,0.58,7.55,0.08,7.38,0.31,20.42,0.48,33.24,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",CohereForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,103,1594,TRUE,fa1bd7fb1572ceb861bbbbecfa8af83b29fa8cca,TRUE,TRUE,2024-06-13,2024-04-03,TRUE,TRUE,CohereForAI/c4ai-command-r-plus,https://huggingface.co/CohereForAI/c4ai-command-r-plus 💬,internlm/internlm2_5-7b-chat,30.46,61.4,0.61,57.67,0.71,8.31,0.08,10.63,0.33,14.35,0.44,30.42,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",InternLM2ForCausalLM,Original,float16,TRUE,other,7,102,TRUE,bebb00121ee105b823647c3ba2b1e152652edc33,TRUE,TRUE,2024-07-03,2024-06-27,TRUE,TRUE,internlm/internlm2_5-7b-chat,https://huggingface.co/internlm/internlm2_5-7b-chat 🟢,Qwen/Qwen1.5-110B,29.56,34.22,0.34,44.28,0.61,23.04,0.23,13.65,0.35,13.71,0.44,48.45,0.54,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,111,87,TRUE,16659038ecdcc771c1293cf47020fa7cc2750ee8,TRUE,TRUE,2024-06-13,2024-04-25,FALSE,TRUE,Qwen/Qwen1.5-110B,https://huggingface.co/Qwen/Qwen1.5-110B 🔶,abacusai/Smaug-72B-v0.1,29.56,51.7,0.52,42.42,0.59,17.75,0.18,9.62,0.32,15.39,0.45,40.46,0.46,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,72,460,TRUE,a1d657156f82c24b670158406378648233487011,TRUE,TRUE,2024-06-12,2024-02-02,FALSE,TRUE,abacusai/Smaug-72B-v0.1,https://huggingface.co/abacusai/Smaug-72B-v0.1 @@ -27,18 +28,20 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,microsoft/Phi-3-small-128k-instruct,28.75,63.44,0.63,45.57,0.62,0,0,9.84,0.32,14.7,0.44,38.94,0.45,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3SmallForCausalLM,Original,bfloat16,TRUE,mit,7,145,TRUE,f80aaa30bfc64c2b8ab214b541d9050e97163bc4,TRUE,TRUE,2024-06-13,2024-05-07,TRUE,TRUE,microsoft/Phi-3-small-128k-instruct,https://huggingface.co/microsoft/Phi-3-small-128k-instruct 💬,Azure99/blossom-v5.1-34b,28.36,56.97,0.57,44.13,0.61,14.43,0.14,7.94,0.31,7.3,0.39,39.4,0.45,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,3,TRUE,2c803204f5dbf4ce37e2df98eb0205cdc53de10d,TRUE,TRUE,2024-07-01,2024-05-19,TRUE,FALSE,Azure99/blossom-v5.1-34b,https://huggingface.co/Azure99/blossom-v5.1-34b 💬,01-ai/Yi-1.5-9B-Chat,27.71,60.46,0.6,36.95,0.56,11.63,0.12,11.3,0.33,12.84,0.43,33.06,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,113,TRUE,bc87d8557c98dc1e5fdef6ec23ed31088c4d3f35,TRUE,TRUE,2024-06-12,2024-05-10,TRUE,TRUE,01-ai/Yi-1.5-9B-Chat,https://huggingface.co/01-ai/Yi-1.5-9B-Chat -💬,jpacifico/Chocolatine-3B-Instruct-DPO-Revised,27.63,56.23,0.56,37.16,0.55,14.5,0.15,9.62,0.32,15.1,0.45,33.21,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,float16,TRUE,mit,3,5,TRUE,c403df6c0f78148cfb477972455cbd859149311a,TRUE,TRUE,2024-07-19,2024-07-17,TRUE,FALSE,jpacifico/Chocolatine-3B-Instruct-DPO-Revised,https://huggingface.co/jpacifico/Chocolatine-3B-Instruct-DPO-Revised -💬,microsoft/Phi-3-mini-4k-instruct,27.2,54.77,0.55,36.56,0.55,14.2,0.14,10.96,0.33,13.12,0.43,33.58,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,float16,TRUE,mit,3,887,TRUE,c1358f8a35e6d2af81890deffbbfa575b978c62f,TRUE,TRUE,2024-07-02,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +💬,jpacifico/Chocolatine-3B-Instruct-DPO-Revised,27.63,56.23,0.56,37.16,0.55,14.5,0.15,9.62,0.32,15.1,0.45,33.21,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,float16,TRUE,mit,3,6,TRUE,c403df6c0f78148cfb477972455cbd859149311a,TRUE,TRUE,2024-07-19,2024-07-17,TRUE,FALSE,jpacifico/Chocolatine-3B-Instruct-DPO-Revised,https://huggingface.co/jpacifico/Chocolatine-3B-Instruct-DPO-Revised +💬,microsoft/Phi-3-mini-4k-instruct,27.2,54.77,0.55,36.56,0.55,14.2,0.14,10.96,0.33,13.12,0.43,33.58,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,float16,TRUE,mit,3,888,TRUE,c1358f8a35e6d2af81890deffbbfa575b978c62f,TRUE,TRUE,2024-07-02,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct 💬,Qwen/Qwen1.5-32B-Chat,27.1,55.32,0.55,44.55,0.61,6.65,0.07,7.49,0.31,10.2,0.42,38.41,0.45,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,104,TRUE,0997b012af6ddd5465d40465a8415535b2f06cfc,TRUE,TRUE,2024-06-12,2024-04-03,TRUE,TRUE,Qwen/Qwen1.5-32B-Chat,https://huggingface.co/Qwen/Qwen1.5-32B-Chat -💬,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,26.95,58.7,0.59,37.17,0.55,10.27,0.1,9.62,0.32,16.28,0.46,29.63,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,400,TRUE,286ae6737d048ad1d965c2e830864df02db50f2f,TRUE,FALSE,2024-06-12,2024-01-11,TRUE,TRUE,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +💬,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,26.95,58.7,0.59,37.17,0.55,10.27,0.1,9.62,0.32,16.28,0.46,29.63,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,401,TRUE,286ae6737d048ad1d965c2e830864df02db50f2f,TRUE,FALSE,2024-06-12,2024-01-11,TRUE,TRUE,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO 💬,deepseek-ai/deepseek-llm-67b-chat,26.87,55.87,0.56,33.23,0.52,6.65,0.07,8.84,0.32,23.93,0.51,32.71,0.39,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,67,171,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2024-06-12,2023-11-29,TRUE,TRUE,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat 🔶,MaziyarPanahi/Llama-3-8B-Instruct-v0.8,26.75,75.12,0.75,28.27,0.5,7.1,0.07,7.38,0.31,10.92,0.42,31.68,0.39,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,8,3,TRUE,bd80951b7ae97f633ed48b80334af8df96b49f36,TRUE,TRUE,2024-07-11,2024-05-01,TRUE,FALSE,MaziyarPanahi/Llama-3-8B-Instruct-v0.8,https://huggingface.co/MaziyarPanahi/Llama-3-8B-Instruct-v0.8 🟢,Qwen/Qwen1.5-32B,26.69,32.97,0.33,38.98,0.57,26.66,0.27,10.63,0.33,12.04,0.43,38.89,0.45,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,77,TRUE,cefef80dc06a65f89d1d71d0adbc56d335ca2490,TRUE,TRUE,2024-06-13,2024-04-01,FALSE,TRUE,Qwen/Qwen1.5-32B,https://huggingface.co/Qwen/Qwen1.5-32B 🔶,MaziyarPanahi/Llama-3-8B-Instruct-v0.10,26.66,76.67,0.77,27.92,0.49,4.91,0.05,7.83,0.31,10.81,0.42,31.8,0.39,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,8,3,TRUE,4411eb9f6f5e4c462a6bdbc64c26dcc123100b66,TRUE,TRUE,2024-06-26,2024-06-04,TRUE,FALSE,MaziyarPanahi/Llama-3-8B-Instruct-v0.10,https://huggingface.co/MaziyarPanahi/Llama-3-8B-Instruct-v0.10 +💬,meta-llama/Meta-Llama-3.1-8B-Instruct,26.59,77.4,0.77,28.85,0.5,15.71,0.16,2.46,0.27,4.6,0.37,30.52,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,bfloat16,TRUE,"",0,0,TRUE,df34336b42332c6d360959e259cd6271c6a09fd4,TRUE,TRUE,"","",FALSE,TRUE,meta-llama/Meta-Llama-3.1-8B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3.1-8B-Instruct 🟢,01-ai/Yi-1.5-34B-32K,26.4,31.19,0.31,43.38,0.6,13.44,0.13,15.1,0.36,14.08,0.44,41.21,0.47,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,34,TRUE,2c03a29761e4174f20347a60fbe229be4383d48b,TRUE,TRUE,2024-06-12,2024-05-15,FALSE,TRUE,01-ai/Yi-1.5-34B-32K,https://huggingface.co/01-ai/Yi-1.5-34B-32K 🟢,meta-llama/Meta-Llama-3-70B,26.37,16.03,0.16,48.71,0.65,16.54,0.17,19.69,0.4,16.01,0.45,41.21,0.47,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,70,774,TRUE,b4d08b7db49d488da3ac49adf25a6b9ac01ae338,TRUE,TRUE,2024-06-12,2024-04-17,FALSE,TRUE,meta-llama/Meta-Llama-3-70B,https://huggingface.co/meta-llama/Meta-Llama-3-70B -💬,microsoft/Phi-3-mini-4k-instruct,25.97,56.13,0.56,39.27,0.57,11.63,0.12,9.28,0.32,7.64,0.4,31.85,0.39,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,887,TRUE,ff07dc01615f8113924aed013115ab2abd32115b,TRUE,TRUE,2024-06-12,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +💬,microsoft/Phi-3-mini-4k-instruct,25.97,56.13,0.56,39.27,0.57,11.63,0.12,9.28,0.32,7.64,0.4,31.85,0.39,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,888,TRUE,ff07dc01615f8113924aed013115ab2abd32115b,TRUE,TRUE,2024-06-12,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct 🟢,dnhkng/Medium,25.94,44.06,0.44,47.73,0.63,7.78,0.08,10.4,0.33,8.73,0.41,36.96,0.43,🟢 pretrained,Phi3ForCausalLM,Original,bfloat16,TRUE,mit,18,2,TRUE,de09a79e6b2efdcc97490a37b770764e62749fd0,TRUE,TRUE,2024-07-17,2024-07-17,FALSE,FALSE,dnhkng/Medium,https://huggingface.co/dnhkng/Medium +🟢,meta-llama/Meta-Llama-3.1-70B,25.91,16.84,0.17,46.4,0.63,16.69,0.17,18.34,0.39,16.58,0.46,40.6,0.47,🟢 pretrained,Unknown,Original,bfloat16,TRUE,"",0,0,TRUE,f7d3cc45ed4ff669a354baf2e0f05e65799a0bee,TRUE,TRUE,"","",FALSE,TRUE,meta-llama/Meta-Llama-3.1-70B,https://huggingface.co/meta-llama/Meta-Llama-3.1-70B 🤝,Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B,25.76,71.23,0.71,32.49,0.53,10.12,0.1,4.92,0.29,5.55,0.37,30.26,0.37,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,llama3,8,9,TRUE,b46c066ea8387264858dc3461f382e7b42fd9c48,TRUE,TRUE,2024-07-02,2024-06-26,TRUE,FALSE,Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B,https://huggingface.co/Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B 🔶,Sao10K/L3-8B-Stheno-v3.2,25.76,68.73,0.69,32.02,0.52,8.53,0.09,8.05,0.31,6.45,0.38,30.76,0.38,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,8,174,TRUE,4bb828f6e1b1efd648c39b1ad682c44ff260f018,TRUE,TRUE,2024-06-30,2024-06-05,TRUE,FALSE,Sao10K/L3-8B-Stheno-v3.2,https://huggingface.co/Sao10K/L3-8B-Stheno-v3.2 🔶,Nitral-AI/Hathor_Stable-v0.2-L3-8B,25.7,71.75,0.72,32.83,0.53,9.21,0.09,4.92,0.29,5.56,0.38,29.96,0.37,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,8,38,TRUE,1c9f391c3e349f8ba51b5696290ee6db6a2b63fd,TRUE,TRUE,2024-07-02,2024-06-09,TRUE,FALSE,Nitral-AI/Hathor_Stable-v0.2-L3-8B,https://huggingface.co/Nitral-AI/Hathor_Stable-v0.2-L3-8B @@ -46,7 +49,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🟢,mistral-community/mixtral-8x22B-v0.3,25.55,25.83,0.26,45.73,0.63,16.84,0.17,17,0.38,7.46,0.4,40.44,0.46,🟢 pretrained,MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,3,TRUE,211b177b79ab5ef245ee334d106c27623e786882,TRUE,FALSE,2024-06-13,2024-05-25,FALSE,TRUE,mistral-community/mixtral-8x22B-v0.3,https://huggingface.co/mistral-community/mixtral-8x22B-v0.3 🔶,arcee-ai/Arcee-Spark,25.54,56.21,0.56,37.14,0.55,12.31,0.12,7.61,0.31,8.6,0.4,31.36,0.38,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,73,TRUE,3fe368ea5fd32bc4a8d1bcf42510416f7fa28668,TRUE,TRUE,2024-06-26,2024-06-22,TRUE,FALSE,arcee-ai/Arcee-Spark,https://huggingface.co/arcee-ai/Arcee-Spark 🟢,mistralai/Mixtral-8x22B-v0.1,25.49,25.83,0.26,45.59,0.62,16.84,0.17,16.78,0.38,7.46,0.4,40.44,0.46,🟢 pretrained,MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,173,TRUE,b03e260818710044a2f088d88fab12bb220884fb,TRUE,FALSE,2024-06-12,2024-04-16,FALSE,TRUE,mistralai/Mixtral-8x22B-v0.1,https://huggingface.co/mistralai/Mixtral-8x22B-v0.1 -💬,microsoft/Phi-3-mini-128k-instruct,25.49,59.76,0.6,37.1,0.56,8.91,0.09,9.06,0.32,7.71,0.39,30.38,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,1492,TRUE,5be6479b4bc06a081e8f4c6ece294241ccd32dec,TRUE,TRUE,2024-06-12,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct +💬,microsoft/Phi-3-mini-128k-instruct,25.49,59.76,0.6,37.1,0.56,8.91,0.09,9.06,0.32,7.71,0.39,30.38,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,1493,TRUE,5be6479b4bc06a081e8f4c6ece294241ccd32dec,TRUE,TRUE,2024-06-12,2024-04-22,TRUE,TRUE,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct 🟢,01-ai/Yi-1.5-34B,25.43,28.41,0.28,42.75,0.6,14.05,0.14,15.44,0.37,11.22,0.42,40.73,0.47,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,44,TRUE,4b486f81c935a2dadde84c6baa1e1370d40a098f,TRUE,TRUE,2024-06-12,2024-05-11,FALSE,TRUE,01-ai/Yi-1.5-34B,https://huggingface.co/01-ai/Yi-1.5-34B 💬,CohereForAI/c4ai-command-r-v01,25.35,67.48,0.67,34.56,0.54,0,0,7.61,0.31,16.13,0.45,26.33,0.34,"💬 chat models (RLHF, DPO, IFT, ...)",CohereForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,34,1033,TRUE,16881ccde1c68bbc7041280e6a66637bc46bfe88,TRUE,TRUE,2024-06-13,2024-03-11,TRUE,TRUE,CohereForAI/c4ai-command-r-v01,https://huggingface.co/CohereForAI/c4ai-command-r-v01 💬,arcee-ai/Arcee-Spark,25.33,57.18,0.57,36.92,0.55,10.73,0.11,7.49,0.31,8.4,0.4,31.26,0.38,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,apache-2.0,7,73,TRUE,3fe368ea5fd32bc4a8d1bcf42510416f7fa28668,TRUE,TRUE,2024-06-26,2024-06-22,TRUE,FALSE,arcee-ai/Arcee-Spark,https://huggingface.co/arcee-ai/Arcee-Spark @@ -54,7 +57,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,databricks/dbrx-instruct,25.2,54.16,0.54,35.96,0.54,6.87,0.07,12.19,0.34,12.2,0.43,29.81,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",DbrxForCausalLM,Original,bfloat16,TRUE,other,131,1090,TRUE,c0a9245908c187da8f43a81e538e67ff360904ea,TRUE,TRUE,2024-06-12,2024-03-26,TRUE,TRUE,databricks/dbrx-instruct,https://huggingface.co/databricks/dbrx-instruct 🟢,Qwen/Qwen2-57B-A14B,25.03,31.13,0.31,38.88,0.56,18.66,0.19,7.49,0.31,10.54,0.42,43.51,0.49,🟢 pretrained,Qwen2MoeForCausalLM,Original,bfloat16,TRUE,apache-2.0,57,41,TRUE,973e466c39ba76372a2ae464dbca0af3f5a5a2a9,TRUE,FALSE,2024-06-13,2024-05-22,FALSE,TRUE,Qwen/Qwen2-57B-A14B,https://huggingface.co/Qwen/Qwen2-57B-A14B 🔶,jpacifico/Chocolatine-3B-Instruct-DPO-v1.0,25,37.37,0.37,36.55,0.55,15.26,0.15,8.72,0.32,19.47,0.48,32.63,0.39,🔶 fine-tuned on domain-specific datasets,Phi3ForCausalLM,Original,float16,TRUE,apache-2.0,3,2,TRUE,98d049b8f8c305cfba81adae498a95e6b5647d4a,TRUE,TRUE,2024-07-11,2024-07-11,FALSE,FALSE,jpacifico/Chocolatine-3B-Instruct-DPO-v1.0,https://huggingface.co/jpacifico/Chocolatine-3B-Instruct-DPO-v1.0 -💬,Qwen/Qwen2-7B-Instruct,24.76,56.79,0.57,37.81,0.55,8.61,0.09,6.38,0.3,7.37,0.39,31.64,0.38,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,410,TRUE,41c66b0be1c3081f13defc6bdf946c2ef240d6a6,TRUE,TRUE,2024-06-12,2024-06-04,TRUE,TRUE,Qwen/Qwen2-7B-Instruct,https://huggingface.co/Qwen/Qwen2-7B-Instruct +💬,Qwen/Qwen2-7B-Instruct,24.76,56.79,0.57,37.81,0.55,8.61,0.09,6.38,0.3,7.37,0.39,31.64,0.38,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,413,TRUE,41c66b0be1c3081f13defc6bdf946c2ef240d6a6,TRUE,TRUE,2024-06-12,2024-06-04,TRUE,TRUE,Qwen/Qwen2-7B-Instruct,https://huggingface.co/Qwen/Qwen2-7B-Instruct 🤝,HiroseKoichi/Llama-Salad-4x8B-V3,24.75,66.54,0.67,31.93,0.52,8.53,0.09,7.05,0.3,6.45,0.37,27.98,0.35,🤝 base merges and moerges,MixtralForCausalLM,Original,bfloat16,FALSE,llama3,24,4,TRUE,a343915429779efbd1478f01ba1f7fd9d8d226c0,TRUE,FALSE,2024-06-26,2024-06-17,TRUE,FALSE,HiroseKoichi/Llama-Salad-4x8B-V3,https://huggingface.co/HiroseKoichi/Llama-Salad-4x8B-V3 💬,Azure99/blossom-v5.1-9b,24.69,50.86,0.51,34.2,0.53,10.5,0.1,11.41,0.34,8.02,0.4,33.16,0.4,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,1,TRUE,6044a3dc1e04529fe883aa513d37f266a320d793,TRUE,TRUE,2024-07-01,2024-05-15,TRUE,FALSE,Azure99/blossom-v5.1-9b,https://huggingface.co/Azure99/blossom-v5.1-9b 🔶,NousResearch/Hermes-2-Theta-Llama-3-8B,24.62,65.18,0.65,32.05,0.52,8.69,0.09,7.16,0.3,8.36,0.39,26.32,0.34,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,183,TRUE,885173e97ab8572b444f7db1290d5d0386e26816,TRUE,TRUE,2024-07-11,2024-05-05,TRUE,TRUE,NousResearch/Hermes-2-Theta-Llama-3-8B,https://huggingface.co/NousResearch/Hermes-2-Theta-Llama-3-8B @@ -67,14 +70,14 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🤝,PJMixers/LLaMa-3-CursedStock-v2.0-8B,24.03,63.31,0.63,32.56,0.53,8.61,0.09,3.24,0.27,8.04,0.39,28.4,0.36,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,llama3,8,8,TRUE,d47cc29df363f71ffaf6cd21ac4bdeefa27359db,TRUE,TRUE,2024-06-27,2024-06-26,TRUE,FALSE,PJMixers/LLaMa-3-CursedStock-v2.0-8B,https://huggingface.co/PJMixers/LLaMa-3-CursedStock-v2.0-8B 🔶,Weyaxi/Einstein-v7-Qwen2-7B,24.01,41,0.41,32.84,0.52,15.18,0.15,6.6,0.3,14.06,0.44,34.4,0.41,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,7,31,TRUE,d5a2f245bf98a40d196821bc378e10f35b4da81a,TRUE,TRUE,2024-06-26,2024-06-24,TRUE,FALSE,Weyaxi/Einstein-v7-Qwen2-7B,https://huggingface.co/Weyaxi/Einstein-v7-Qwen2-7B 💬,vicgalle/Roleplay-Llama-3-8B,23.94,73.2,0.73,28.55,0.5,8.69,0.09,1.45,0.26,1.68,0.35,30.09,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,8,32,TRUE,57297eb57dcc2c116f061d9dda341094203da01b,TRUE,TRUE,2024-06-26,2024-04-19,TRUE,FALSE,vicgalle/Roleplay-Llama-3-8B,https://huggingface.co/vicgalle/Roleplay-Llama-3-8B -💬,meta-llama/Meta-Llama-3-8B-Instruct,23.91,74.08,0.74,28.24,0.5,8.69,0.09,1.23,0.26,1.6,0.36,29.6,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,3173,TRUE,e1945c40cd546c78e41f1151f4db032b271faeaa,TRUE,TRUE,2024-06-12,2024-04-17,TRUE,TRUE,meta-llama/Meta-Llama-3-8B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct +💬,meta-llama/Meta-Llama-3-8B-Instruct,23.91,74.08,0.74,28.24,0.5,8.69,0.09,1.23,0.26,1.6,0.36,29.6,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,3178,TRUE,e1945c40cd546c78e41f1151f4db032b271faeaa,TRUE,TRUE,2024-06-12,2024-04-17,TRUE,TRUE,meta-llama/Meta-Llama-3-8B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct 💬,01-ai/Yi-34B-Chat,23.9,46.99,0.47,37.62,0.56,4.31,0.04,11.74,0.34,8.36,0.4,34.37,0.41,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,338,TRUE,2e528b6a80fb064a0a746c5ca43114b135e30464,TRUE,TRUE,2024-06-12,2023-11-22,TRUE,TRUE,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat 💬,abacusai/Smaug-34B-v0.1,23.76,50.16,0.5,34.26,0.54,0,0,10.63,0.33,8.13,0.4,39.37,0.45,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,58,TRUE,34d54c65a0247d5eb694973106c816d9c0ad3fc2,TRUE,TRUE,2024-06-12,2024-01-25,TRUE,TRUE,abacusai/Smaug-34B-v0.1,https://huggingface.co/abacusai/Smaug-34B-v0.1 🟢,Qwen/Qwen2-7B,23.66,31.49,0.31,34.71,0.53,18.81,0.19,7.27,0.3,14.32,0.44,35.37,0.42,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,98,TRUE,453ed1575b739b5b03ce3758b23befdb0967f40e,TRUE,TRUE,2024-06-09,2024-06-04,FALSE,TRUE,Qwen/Qwen2-7B,https://huggingface.co/Qwen/Qwen2-7B 💬,NousResearch/Nous-Hermes-2-SOLAR-10.7B,23.32,52.79,0.53,34.99,0.54,5.21,0.05,5.82,0.29,13.83,0.44,27.31,0.35,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,10,201,TRUE,14c1fbe2f71acdcd58247b30d5439bd572d52386,TRUE,TRUE,2024-06-12,2024-01-01,TRUE,TRUE,NousResearch/Nous-Hermes-2-SOLAR-10.7B,https://huggingface.co/NousResearch/Nous-Hermes-2-SOLAR-10.7B 🔶,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,23.31,68.28,0.68,29.74,0.51,7.33,0.07,2.01,0.27,3.09,0.37,29.38,0.36,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,71,TRUE,f73dafc2923acd56f115f21f76e9d14f8d19a63e,TRUE,TRUE,2024-07-02,2024-06-25,TRUE,FALSE,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,https://huggingface.co/UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3 💬,MaziyarPanahi/Phi-3-mini-4k-instruct-v0.2,23.21,50.69,0.51,37.73,0.55,2.34,0.02,9.51,0.32,7.7,0.4,31.27,0.38,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,2,TRUE,c0a366a4c01d7e724ceba7e2f2c19251983423fe,TRUE,TRUE,2024-06-26,2024-05-10,TRUE,FALSE,MaziyarPanahi/Phi-3-mini-4k-instruct-v0.2,https://huggingface.co/MaziyarPanahi/Phi-3-mini-4k-instruct-v0.2 -💬,google/gemma-2-9b-it,23.18,76.95,0.77,38.55,0.57,0,0,12.42,0.34,9.38,0.4,1.78,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",Gemma2ForCausalLM,Original,bfloat16,TRUE,gemma,9,290,TRUE,1937c70277fcc5f7fb0fc772fc5bc69378996e71,TRUE,TRUE,2024-07-11,2024-06-24,TRUE,TRUE,google/gemma-2-9b-it,https://huggingface.co/google/gemma-2-9b-it +💬,google/gemma-2-9b-it,23.18,76.95,0.77,38.55,0.57,0,0,12.42,0.34,9.38,0.4,1.78,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",Gemma2ForCausalLM,Original,bfloat16,TRUE,gemma,9,291,TRUE,1937c70277fcc5f7fb0fc772fc5bc69378996e71,TRUE,TRUE,2024-07-11,2024-06-24,TRUE,TRUE,google/gemma-2-9b-it,https://huggingface.co/google/gemma-2-9b-it 💬,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,23.06,67.03,0.67,29.72,0.51,7.18,0.07,2.01,0.27,2.89,0.36,29.53,0.37,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,8,71,TRUE,f73dafc2923acd56f115f21f76e9d14f8d19a63e,TRUE,TRUE,2024-06-28,2024-06-25,TRUE,FALSE,UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3,https://huggingface.co/UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3 💬,MaziyarPanahi/Phi-3-mini-4k-instruct-v0.3,23.02,49.26,0.49,37.66,0.55,2.95,0.03,9.06,0.32,7.75,0.4,31.42,0.38,"💬 chat models (RLHF, DPO, IFT, ...)",Phi3ForCausalLM,Original,bfloat16,TRUE,mit,3,9,TRUE,e1f70c3724c728aadd1c7c1bb279487494f7059e,TRUE,TRUE,2024-06-26,2024-05-10,TRUE,FALSE,MaziyarPanahi/Phi-3-mini-4k-instruct-v0.3,https://huggingface.co/MaziyarPanahi/Phi-3-mini-4k-instruct-v0.3 💬,LLM360/K2-Chat,22.93,51.52,0.52,33.79,0.54,1.59,0.02,7.49,0.31,16.82,0.46,26.34,0.34,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,65,31,TRUE,5454f2d28031c9127e4227c873ca2f154e02e4c7,TRUE,TRUE,2024-06-12,2024-05-22,TRUE,TRUE,LLM360/K2-Chat,https://huggingface.co/LLM360/K2-Chat @@ -120,7 +123,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🤝,maldv/badger-lambda-llama-3-8b,20.76,48.61,0.49,28.1,0.5,8.31,0.08,4.25,0.28,4.52,0.38,30.74,0.38,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,8,8,TRUE,8ef157d0d3c12212ca5e70d354869aed90e03f22,TRUE,TRUE,2024-06-26,2024-06-10,TRUE,FALSE,maldv/badger-lambda-llama-3-8b,https://huggingface.co/maldv/badger-lambda-llama-3-8b 🤝,nlpguy/StarFusion-alpha1,20.68,56.45,0.56,21.93,0.44,6.42,0.06,6.04,0.3,8.88,0.41,24.34,0.32,🤝 base merges and moerges,MistralForCausalLM,Original,bfloat16,FALSE,apache-2.0,7,0,TRUE,dccad965a710d7bee001b6387c8307e7c320291e,TRUE,TRUE,2024-06-26,2024-04-13,TRUE,FALSE,nlpguy/StarFusion-alpha1,https://huggingface.co/nlpguy/StarFusion-alpha1 💬,berkeley-nest/Starling-LM-7B-alpha,20.64,54.8,0.55,21.95,0.44,7.18,0.07,6.26,0.3,9.5,0.41,24.13,0.32,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,552,TRUE,1dddf3b95bc1391f6307299eb1c162c194bde9bd,TRUE,TRUE,2024-06-12,2023-11-25,TRUE,TRUE,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -🔶,meta-llama/Meta-Llama-3-8B-Instruct,20.48,47.82,0.48,26.8,0.49,8.38,0.08,5.7,0.29,5.4,0.38,28.79,0.36,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,llama3,8,3173,TRUE,e1945c40cd546c78e41f1151f4db032b271faeaa,TRUE,TRUE,2024-07-08,2024-04-17,FALSE,TRUE,meta-llama/Meta-Llama-3-8B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct +🔶,meta-llama/Meta-Llama-3-8B-Instruct,20.48,47.82,0.48,26.8,0.49,8.38,0.08,5.7,0.29,5.4,0.38,28.79,0.36,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,llama3,8,3178,TRUE,e1945c40cd546c78e41f1151f4db032b271faeaa,TRUE,TRUE,2024-07-08,2024-04-17,FALSE,TRUE,meta-llama/Meta-Llama-3-8B-Instruct,https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct 🔶,SanjiWatsuki/Kunoichi-DPO-v2-7B,20.41,54.31,0.54,20.9,0.44,6.57,0.07,6.15,0.3,11.09,0.42,23.41,0.31,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,7,72,TRUE,5278247beb482c4fceff2294570236d68b74d132,TRUE,TRUE,2024-06-28,2024-01-13,TRUE,FALSE,SanjiWatsuki/Kunoichi-DPO-v2-7B,https://huggingface.co/SanjiWatsuki/Kunoichi-DPO-v2-7B 🔶,pankajmathur/orca_mini_v6_8b_dpo,20.29,38.83,0.39,32.48,0.52,5.51,0.06,6.82,0.3,9.26,0.41,28.85,0.36,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,1,TRUE,ebb11b63839d38e8c03c7ecac012e047fcb2346e,TRUE,TRUE,2024-06-26,2024-06-21,FALSE,FALSE,pankajmathur/orca_mini_v6_8b_dpo,https://huggingface.co/pankajmathur/orca_mini_v6_8b_dpo 🟢,Qwen/Qwen1.5-14B,20.22,29.05,0.29,30.06,0.51,16.47,0.16,5.93,0.29,10.46,0.42,29.37,0.36,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,14,36,TRUE,dce4b190d34470818e5bec2a92cb8233aaa02ca2,TRUE,TRUE,2024-06-13,2024-01-22,FALSE,TRUE,Qwen/Qwen1.5-14B,https://huggingface.co/Qwen/Qwen1.5-14B @@ -153,18 +156,18 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🤝,johnsutor/Llama-3-8B-Instruct_ties-density-0.3,18.69,36.26,0.36,27.72,0.49,5.74,0.06,6.15,0.3,10.48,0.4,25.79,0.33,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,apache-2.0,8,0,TRUE,8d051f3eec3fc93a4521073c2d290c4ff9144fc1,TRUE,TRUE,2024-06-26,2024-06-07,FALSE,FALSE,johnsutor/Llama-3-8B-Instruct_ties-density-0.3,https://huggingface.co/johnsutor/Llama-3-8B-Instruct_ties-density-0.3 💬,HuggingFaceH4/zephyr-7b-alpha,18.52,51.91,0.52,23.89,0.46,1.51,0.02,6.38,0.3,7.5,0.39,19.94,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1084,TRUE,2ce2d025864af849b3e5029e2ec9d568eeda892d,TRUE,TRUE,2024-06-12,2023-10-09,TRUE,TRUE,HuggingFaceH4/zephyr-7b-alpha,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha 🤝,johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.01,18.48,27.9,0.28,27.22,0.49,0,0,5.93,0.29,24.24,0.52,25.61,0.33,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,apache-2.0,8,0,TRUE,c88c6b65f751156e7bc04c738947387eb55747e9,TRUE,TRUE,2024-06-26,2024-06-08,FALSE,FALSE,johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.01,https://huggingface.co/johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.01 -💬,mistralai/Mistral-7B-Instruct-v0.2,18.44,54.96,0.55,22.91,0.45,2.64,0.03,3.47,0.28,7.61,0.4,19.08,0.27,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2426,TRUE,41b61a33a2483885c981aa79e0df6b32407ed873,TRUE,TRUE,2024-06-12,2023-12-11,TRUE,TRUE,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +💬,mistralai/Mistral-7B-Instruct-v0.2,18.44,54.96,0.55,22.91,0.45,2.64,0.03,3.47,0.28,7.61,0.4,19.08,0.27,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2430,TRUE,41b61a33a2483885c981aa79e0df6b32407ed873,TRUE,TRUE,2024-06-12,2023-12-11,TRUE,TRUE,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 🤝,johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.01,18.44,28.14,0.28,27.16,0.49,0,0,5.37,0.29,24.47,0.52,25.5,0.33,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,apache-2.0,8,0,TRUE,61f4b44fb917cdb46f0ade9f8fc2a382e0cf67af,TRUE,TRUE,2024-06-26,2024-06-08,FALSE,FALSE,johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.01,https://huggingface.co/johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.01 💬,argilla/notus-7b-v1,18.37,50.82,0.51,22.75,0.45,2.57,0.03,5.26,0.29,6.59,0.34,22.26,0.3,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,mit,7,118,TRUE,30172203a2d41cb487bf7e2b92a821080783b2c9,TRUE,TRUE,2024-06-27,2023-11-16,TRUE,TRUE,argilla/notus-7b-v1,https://huggingface.co/argilla/notus-7b-v1 -💬,cognitivecomputations/dolphin-2.9-llama3-8b,18.3,38.5,0.39,27.86,0.49,5.06,0.05,4.92,0.29,13.79,0.44,19.68,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,8,376,TRUE,5aeb036f9215c558b483a654a8c6e1cc22e841bf,TRUE,TRUE,2024-06-12,2024-04-20,TRUE,TRUE,cognitivecomputations/dolphin-2.9-llama3-8b,https://huggingface.co/cognitivecomputations/dolphin-2.9-llama3-8b +💬,cognitivecomputations/dolphin-2.9-llama3-8b,18.3,38.5,0.39,27.86,0.49,5.06,0.05,4.92,0.29,13.79,0.44,19.68,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,8,377,TRUE,5aeb036f9215c558b483a654a8c6e1cc22e841bf,TRUE,TRUE,2024-06-12,2024-04-20,TRUE,TRUE,cognitivecomputations/dolphin-2.9-llama3-8b,https://huggingface.co/cognitivecomputations/dolphin-2.9-llama3-8b 🟢,meta-llama/Llama-2-70b-hf,18.25,24.07,0.24,35.9,0.55,2.49,0.02,7.05,0.3,9.78,0.41,30.2,0.37,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,llama2,68,821,TRUE,3aba440b59558f995867ba6e1f58f21d0336b5bb,TRUE,TRUE,2024-06-12,2023-07-11,FALSE,TRUE,meta-llama/Llama-2-70b-hf,https://huggingface.co/meta-llama/Llama-2-70b-hf 🔶,microsoft/Orca-2-13b,18.14,31.28,0.31,27.31,0.49,0.98,0.01,4.03,0.28,25.79,0.51,19.44,0.27,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,13,658,TRUE,2539ff53e6baa4cc603774ad5a2d646f4041ea4e,TRUE,TRUE,2024-06-12,2023-11-14,FALSE,TRUE,microsoft/Orca-2-13b,https://huggingface.co/microsoft/Orca-2-13b 💬,gradientai/Llama-3-8B-Instruct-Gradient-1048k,18.12,44.56,0.45,21.01,0.43,4.38,0.04,3.69,0.28,13.52,0.43,21.56,0.29,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,657,TRUE,8697fb25cb77c852311e03b4464b8467471d56a4,TRUE,TRUE,2024-06-12,2024-04-29,TRUE,TRUE,gradientai/Llama-3-8B-Instruct-Gradient-1048k,https://huggingface.co/gradientai/Llama-3-8B-Instruct-Gradient-1048k 🔶,uukuguy/speechless-code-mistral-7b-v1.0,18.09,36.65,0.37,24.09,0.46,4.61,0.05,4.59,0.28,14.77,0.45,23.84,0.31,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,17,TRUE,1862e0a712efc6002112e9c1235a197d58419b37,TRUE,TRUE,2024-06-26,2023-10-10,FALSE,FALSE,uukuguy/speechless-code-mistral-7b-v1.0,https://huggingface.co/uukuguy/speechless-code-mistral-7b-v1.0 🟢,THUDM/glm-4-9b,18.01,14.26,0.14,35.81,0.55,0,0,8.84,0.32,14.19,0.44,34.94,0.41,🟢 pretrained,ChatGLMModelM,Original,bfloat16,TRUE,other,9,86,TRUE,99a140996f9d4f197842fb6b1aab217a42e27ef3,TRUE,TRUE,2024-07-04,2024-06-04,FALSE,FALSE,THUDM/glm-4-9b,https://huggingface.co/THUDM/glm-4-9b 🔶,Intel/neural-chat-7b-v3,17.94,27.78,0.28,30.21,0.5,2.19,0.02,5.59,0.29,23.02,0.51,18.87,0.27,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,65,TRUE,fc679274dfcd28a8b6087634f71af7ed2a0659c4,TRUE,TRUE,2024-06-12,2023-10-25,FALSE,TRUE,Intel/neural-chat-7b-v3,https://huggingface.co/Intel/neural-chat-7b-v3 -🔶,collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2,17.89,38.09,0.38,23.65,0.46,5.36,0.05,11.07,0.33,1.6,0.34,27.56,0.35,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,3,TRUE,2560556d655d0ecaefec10f579c92292d65fb28b,TRUE,TRUE,2024-06-27,2024-06-10,FALSE,FALSE,collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2,https://huggingface.co/collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2 -💬,HuggingFaceH4/zephyr-7b-beta,17.72,49.5,0.5,21.49,0.43,2.42,0.02,5.37,0.29,7.73,0.39,19.79,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1529,TRUE,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,TRUE,TRUE,2024-06-12,2023-10-26,TRUE,TRUE,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +🔶,collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2,17.89,38.09,0.38,23.65,0.46,5.36,0.05,11.07,0.33,1.6,0.34,27.56,0.35,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,"",8,0,FALSE,2560556d655d0ecaefec10f579c92292d65fb28b,TRUE,TRUE,2024-06-27,"",FALSE,FALSE,collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2,https://huggingface.co/collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2 +💬,HuggingFaceH4/zephyr-7b-beta,17.72,49.5,0.5,21.49,0.43,2.42,0.02,5.37,0.29,7.73,0.39,19.79,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1530,TRUE,b70e0c9a2d9e14bd1e812d3c398e5f313e93b473,TRUE,TRUE,2024-06-12,2023-10-26,TRUE,TRUE,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta 💬,Open-Orca/Mistral-7B-OpenOrca,17.62,49.78,0.5,25.84,0.48,2.95,0.03,2.91,0.27,5.89,0.39,18.37,0.27,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,665,TRUE,4a37328cef00f524d3791b1c0cc559a3cc6af14d,TRUE,TRUE,2024-06-12,2023-09-29,TRUE,TRUE,Open-Orca/Mistral-7B-OpenOrca,https://huggingface.co/Open-Orca/Mistral-7B-OpenOrca 🟢,01-ai/Yi-9B,17.61,27.09,0.27,27.63,0.49,4.38,0.04,9.06,0.32,8.91,0.41,28.6,0.36,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,182,TRUE,b4a466d95091696285409f1dcca3028543cb39da,TRUE,TRUE,2024-06-12,2024-03-01,FALSE,TRUE,01-ai/Yi-9B,https://huggingface.co/01-ai/Yi-9B 💬,mlabonne/AlphaMonarch-7B,17.59,49.39,0.49,23.95,0.46,3.85,0.04,2.68,0.27,9.32,0.41,16.36,0.25,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,float16,FALSE,cc-by-nc-4.0,7,146,TRUE,3de065d84411d74e5b3590f67f52b0b71faf6161,TRUE,TRUE,2024-06-12,2024-02-14,TRUE,TRUE,mlabonne/AlphaMonarch-7B,https://huggingface.co/mlabonne/AlphaMonarch-7B @@ -189,10 +192,10 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,stabilityai/stablelm-2-12b-chat,16.22,40.82,0.41,25.25,0.47,2.04,0.02,2.24,0.27,7.73,0.39,19.27,0.27,"💬 chat models (RLHF, DPO, IFT, ...)",StableLmForCausalLM,Original,bfloat16,TRUE,other,12,83,TRUE,b6b62cd451b84e848514c00fafa66d9ead9297c5,TRUE,TRUE,2024-06-12,2024-04-04,TRUE,TRUE,stabilityai/stablelm-2-12b-chat,https://huggingface.co/stabilityai/stablelm-2-12b-chat 💬,CohereForAI/aya-23-8B,15.97,46.99,0.47,20.2,0.43,1.44,0.01,4.59,0.28,8.42,0.39,14.2,0.23,"💬 chat models (RLHF, DPO, IFT, ...)",CohereForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,8,328,TRUE,ec151d218a24031eb039d92fb83d10445427efc9,TRUE,TRUE,2024-06-12,2024-05-19,TRUE,TRUE,CohereForAI/aya-23-8B,https://huggingface.co/CohereForAI/aya-23-8B 🔶,pankajmathur/model_007_13b_v2,15.86,30.56,0.31,25.45,0.47,1.21,0.01,4.47,0.28,17.2,0.46,16.23,0.25,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama2,13,4,TRUE,2c6ddf25cdb134f22e2543121b5a36b41342a9e2,TRUE,TRUE,2024-06-26,2023-08-12,FALSE,FALSE,pankajmathur/model_007_13b_v2,https://huggingface.co/pankajmathur/model_007_13b_v2 -💬,HuggingFaceH4/zephyr-7b-gemma-v0.1,15.83,33.64,0.34,24.05,0.46,6.65,0.07,5.93,0.29,4.18,0.37,20.53,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,other,8,120,TRUE,03b3427d0ed07d2e0f86c0a7e53d82d4beef9540,TRUE,TRUE,2024-06-12,2024-03-01,TRUE,TRUE,HuggingFaceH4/zephyr-7b-gemma-v0.1,https://huggingface.co/HuggingFaceH4/zephyr-7b-gemma-v0.1 +💬,HuggingFaceH4/zephyr-7b-gemma-v0.1,15.83,33.64,0.34,24.05,0.46,6.65,0.07,5.93,0.29,4.18,0.37,20.53,0.28,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,other,8,121,TRUE,03b3427d0ed07d2e0f86c0a7e53d82d4beef9540,TRUE,TRUE,2024-06-12,2024-03-01,TRUE,TRUE,HuggingFaceH4/zephyr-7b-gemma-v0.1,https://huggingface.co/HuggingFaceH4/zephyr-7b-gemma-v0.1 🟩,hon9kon9ize/CantoneseLLMChat-v0.5,15.73,32.31,0.32,20.76,0.43,2.79,0.03,3.69,0.28,18.13,0.47,16.71,0.25,🟩 continuously pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,4,TRUE,812eb4f168c3ea258ebb220393401db9578e0f67,TRUE,TRUE,2024-07-07,2024-07-01,FALSE,FALSE,hon9kon9ize/CantoneseLLMChat-v0.5,https://huggingface.co/hon9kon9ize/CantoneseLLMChat-v0.5 🟢,NousResearch/Yarn-Solar-10b-32k,15.62,19.42,0.19,28.99,0.5,2.42,0.02,7.05,0.3,10.6,0.41,25.25,0.33,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,10,10,TRUE,ec3158b5276ac6644ddbdb36ccf6f9a106c98ede,TRUE,TRUE,2024-06-12,2024-01-17,FALSE,TRUE,NousResearch/Yarn-Solar-10b-32k,https://huggingface.co/NousResearch/Yarn-Solar-10b-32k -🟢,microsoft/phi-2,15.45,27.39,0.27,28.04,0.49,2.42,0.02,2.91,0.27,13.84,0.41,18.09,0.26,🟢 pretrained,PhiForCausalLM,Original,float16,TRUE,mit,2,3207,TRUE,ef382358ec9e382308935a992d908de099b64c23,TRUE,TRUE,2024-06-09,2023-12-13,FALSE,TRUE,microsoft/phi-2,https://huggingface.co/microsoft/phi-2 +🟢,microsoft/phi-2,15.45,27.39,0.27,28.04,0.49,2.42,0.02,2.91,0.27,13.84,0.41,18.09,0.26,🟢 pretrained,PhiForCausalLM,Original,float16,TRUE,mit,2,3208,TRUE,ef382358ec9e382308935a992d908de099b64c23,TRUE,TRUE,2024-06-09,2023-12-13,FALSE,TRUE,microsoft/phi-2,https://huggingface.co/microsoft/phi-2 🤝,win10/Breeze-13B-32k-Instruct-v1_0,15.4,35.84,0.36,25.26,0.46,0.91,0.01,1.9,0.26,11.06,0.42,17.42,0.26,🤝 base merges and moerges,MistralForCausalLM,Original,bfloat16,FALSE,apache-2.0,12,0,TRUE,220c957cf5d9c534a4ef75c11a18221c461de40a,TRUE,TRUE,2024-06-26,2024-06-26,TRUE,FALSE,win10/Breeze-13B-32k-Instruct-v1_0,https://huggingface.co/win10/Breeze-13B-32k-Instruct-v1_0 🤝,mlabonne/phixtral-2x2_8,15.39,34.31,0.34,28.5,0.49,2.57,0.03,2.01,0.27,7.71,0.36,17.23,0.26,🤝 base merges and moerges,PhiForCausalLM,Original,float16,TRUE,mit,4,146,TRUE,7744a977d83f132ae5808d8c3b70157031f7de44,TRUE,FALSE,2024-06-12,2024-01-07,TRUE,TRUE,mlabonne/phixtral-2x2_8,https://huggingface.co/mlabonne/phixtral-2x2_8 🟢,google/gemma-7b,15.28,26.59,0.27,21.12,0.44,6.42,0.06,4.92,0.29,10.98,0.41,21.64,0.29,🟢 pretrained,GemmaForCausalLM,Original,bfloat16,TRUE,gemma,8,2977,TRUE,a0eac5b80dba224e6ed79d306df50b1e92c2125d,TRUE,TRUE,2024-06-08,2024-02-08,FALSE,TRUE,google/gemma-7b,https://huggingface.co/google/gemma-7b @@ -208,25 +211,26 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,Qwen/Qwen1.5-MoE-A2.7B-Chat,14.82,37.95,0.38,20.04,0.43,0,0,3.24,0.27,6.33,0.39,21.37,0.29,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2MoeForCausalLM,Original,bfloat16,TRUE,other,14,109,TRUE,ec052fda178e241c7c443468d2fa1db6618996be,TRUE,FALSE,2024-06-12,2024-03-14,TRUE,TRUE,Qwen/Qwen1.5-MoE-A2.7B-Chat,https://huggingface.co/Qwen/Qwen1.5-MoE-A2.7B-Chat 💬,deepseek-ai/deepseek-llm-7b-chat,14.77,41.71,0.42,11.26,0.36,1.74,0.02,2.13,0.27,19.21,0.47,12.59,0.21,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,7,72,TRUE,afbda8b347ec881666061fa67447046fc5164ec8,TRUE,TRUE,2024-06-12,2023-11-29,TRUE,TRUE,deepseek-ai/deepseek-llm-7b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-7b-chat 🔶,VAGOsolutions/SauerkrautLM-Gemma-7b,14.5,34.07,0.34,18.49,0.42,4.91,0.05,4.81,0.29,2.93,0.36,21.79,0.3,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,bfloat16,TRUE,other,8,13,TRUE,4296bdabf82e900235b094e5348be03ebb0ec891,TRUE,TRUE,2024-06-26,2024-02-27,TRUE,FALSE,VAGOsolutions/SauerkrautLM-Gemma-7b,https://huggingface.co/VAGOsolutions/SauerkrautLM-Gemma-7b -🟢,mistralai/Mistral-7B-v0.1,14.5,23.86,0.24,22.02,0.44,2.49,0.02,5.59,0.29,10.68,0.41,22.36,0.3,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,3314,TRUE,26bca36bde8333b5d7f72e9ed20ccda6a618af24,TRUE,TRUE,2024-06-12,2023-09-20,FALSE,TRUE,mistralai/Mistral-7B-v0.1,https://huggingface.co/mistralai/Mistral-7B-v0.1 +🟢,mistralai/Mistral-7B-v0.1,14.5,23.86,0.24,22.02,0.44,2.49,0.02,5.59,0.29,10.68,0.41,22.36,0.3,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,3316,TRUE,26bca36bde8333b5d7f72e9ed20ccda6a618af24,TRUE,TRUE,2024-06-12,2023-09-20,FALSE,TRUE,mistralai/Mistral-7B-v0.1,https://huggingface.co/mistralai/Mistral-7B-v0.1 🔶,teknium/CollectiveCognition-v1.1-Mistral-7B,14.23,27.9,0.28,23.48,0.45,2.95,0.03,4.92,0.29,5.73,0.39,20.41,0.28,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,78,TRUE,5f57f70ec99450c70da2540e94dd7fd67be4b23c,TRUE,TRUE,2024-06-12,2023-10-04,FALSE,TRUE,teknium/CollectiveCognition-v1.1-Mistral-7B,https://huggingface.co/teknium/CollectiveCognition-v1.1-Mistral-7B 🔶,TencentARC/Mistral_Pro_8B_v0.1,14.2,21.15,0.21,22.89,0.45,5.66,0.06,4.03,0.28,11.83,0.42,19.61,0.28,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,8,64,TRUE,366f159fc5b314ba2a955209d2bca4600f84dac0,TRUE,TRUE,2024-06-12,2024-02-22,FALSE,TRUE,TencentARC/Mistral_Pro_8B_v0.1,https://huggingface.co/TencentARC/Mistral_Pro_8B_v0.1 🟢,tklohj/WindyFloLLM,14.17,26.69,0.27,24.4,0.46,1.13,0.01,3.36,0.28,11.86,0.43,17.57,0.26,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,"",13,0,FALSE,21f4241ab3f091d1d309e9076a8d8e3f014908a8,TRUE,TRUE,2024-07-10,2024-06-30,FALSE,FALSE,tklohj/WindyFloLLM,https://huggingface.co/tklohj/WindyFloLLM -🟢,mistralai/Mistral-7B-v0.3,14.17,22.66,0.23,24.04,0.45,2.64,0.03,5.59,0.29,8.36,0.4,21.7,0.3,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,320,TRUE,b67d6a03ca097c5122fa65904fce0413500bf8c8,TRUE,TRUE,2024-06-12,2024-05-22,FALSE,TRUE,mistralai/Mistral-7B-v0.3,https://huggingface.co/mistralai/Mistral-7B-v0.3 +🟢,mistralai/Mistral-7B-v0.3,14.17,22.66,0.23,24.04,0.45,2.64,0.03,5.59,0.29,8.36,0.4,21.7,0.3,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,321,TRUE,b67d6a03ca097c5122fa65904fce0413500bf8c8,TRUE,TRUE,2024-06-12,2024-05-22,FALSE,TRUE,mistralai/Mistral-7B-v0.3,https://huggingface.co/mistralai/Mistral-7B-v0.3 🔶,microsoft/Orca-2-7b,14.15,21.99,0.22,22.57,0.45,0.83,0.01,0.78,0.26,24.09,0.5,14.65,0.23,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,7,209,TRUE,60e31e6bdcf582ad103b807cb74b73ee1d2c4b17,TRUE,TRUE,2024-06-12,2023-11-14,FALSE,TRUE,microsoft/Orca-2-7b,https://huggingface.co/microsoft/Orca-2-7b 🟢,mistral-community/Mistral-7B-v0.2,14.15,22.66,0.23,23.95,0.45,2.64,0.03,5.59,0.29,8.36,0.4,21.7,0.3,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,230,TRUE,2c3e624962b1a3f3fbf52e15969565caa7bc064a,TRUE,TRUE,2024-06-12,2024-03-23,FALSE,TRUE,mistral-community/Mistral-7B-v0.2,https://huggingface.co/mistral-community/Mistral-7B-v0.2 💬,01-ai/Yi-6B-Chat,14,33.95,0.34,17,0.41,0.68,0.01,5.93,0.29,3.57,0.37,22.9,0.31,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,62,TRUE,01f7fabb6cfb26efeb764da4a0a19cad2c754232,TRUE,TRUE,2024-06-12,2023-11-22,TRUE,TRUE,01-ai/Yi-6B-Chat,https://huggingface.co/01-ai/Yi-6B-Chat -💬,Qwen/Qwen2-1.5B-Instruct,13.92,33.71,0.34,13.7,0.39,5.82,0.06,1.57,0.26,12.03,0.43,16.68,0.25,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,70,TRUE,ba1cf1846d7df0a0591d6c00649f57e798519da8,TRUE,TRUE,2024-06-12,2024-06-03,TRUE,TRUE,Qwen/Qwen2-1.5B-Instruct,https://huggingface.co/Qwen/Qwen2-1.5B-Instruct +💬,Qwen/Qwen2-1.5B-Instruct,13.92,33.71,0.34,13.7,0.39,5.82,0.06,1.57,0.26,12.03,0.43,16.68,0.25,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,71,TRUE,ba1cf1846d7df0a0591d6c00649f57e798519da8,TRUE,TRUE,2024-06-12,2024-06-03,TRUE,TRUE,Qwen/Qwen2-1.5B-Instruct,https://huggingface.co/Qwen/Qwen2-1.5B-Instruct 🟢,stabilityai/stablelm-2-12b,13.86,15.69,0.16,22.69,0.45,3.47,0.03,3.8,0.28,14.49,0.45,23.02,0.31,🟢 pretrained,StableLmForCausalLM,Original,bfloat16,TRUE,other,12,108,TRUE,fead13ddbf4492970666650c3cd6f85f485411ec,TRUE,TRUE,2024-06-12,2024-03-21,FALSE,TRUE,stabilityai/stablelm-2-12b,https://huggingface.co/stabilityai/stablelm-2-12b 🔶,xinchen9/llama3-b8-ft-dis,13.85,15.46,0.15,24.73,0.46,3.17,0.03,8.39,0.31,6.41,0.37,24.93,0.32,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,apache-2.0,8,0,TRUE,e4da730f28f79543262de37908943c35f8df81fe,TRUE,TRUE,2024-07-11,2024-06-28,FALSE,FALSE,xinchen9/llama3-b8-ft-dis,https://huggingface.co/xinchen9/llama3-b8-ft-dis 🔶,openchat/openchat_v3.2,13.81,29.81,0.3,20.32,0.43,1.13,0.01,2.68,0.27,13.1,0.43,15.8,0.24,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama2,13,42,TRUE,acc7ce92558681e749678648189812f15c1465fe,TRUE,TRUE,2024-06-12,2023-07-30,FALSE,TRUE,openchat/openchat_v3.2,https://huggingface.co/openchat/openchat_v3.2 +🟢,meta-llama/Meta-Llama-3.1-8B,13.78,12.7,0.13,25.29,0.47,4.61,0.05,6.15,0.3,8.98,0.38,24.95,0.32,🟢 pretrained,Unknown,Original,bfloat16,TRUE,"",0,0,TRUE,e5c39e551424c763dbc3e58e32ef2999d33a6d8d,TRUE,TRUE,"","",FALSE,TRUE,meta-llama/Meta-Llama-3.1-8B,https://huggingface.co/meta-llama/Meta-Llama-3.1-8B 🔶,AI-Sweden-Models/Llama-3-8B-instruct,13.78,24.01,0.24,18.39,0.42,0.45,0,2.13,0.27,19.94,0.48,17.75,0.26,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,7,TRUE,4e1c955228bdb4d69c1c4560e8d5872312a8f033,TRUE,TRUE,2024-06-27,2024-06-01,TRUE,FALSE,AI-Sweden-Models/Llama-3-8B-instruct,https://huggingface.co/AI-Sweden-Models/Llama-3-8B-instruct 🟢,tiiuae/falcon-11B,13.78,32.61,0.33,21.94,0.44,2.34,0.02,2.8,0.27,7.53,0.4,15.44,0.24,🟢 pretrained,FalconForCausalLM,Original,bfloat16,TRUE,unknown,11,192,TRUE,066e3bf4e2d9aaeefa129af0a6d39727d27816b3,TRUE,TRUE,2024-06-09,2024-05-09,FALSE,TRUE,tiiuae/falcon-11B,https://huggingface.co/tiiuae/falcon-11B 🟢,01-ai/Yi-6B,13.6,28.93,0.29,19.41,0.43,1.51,0.02,2.57,0.27,7.04,0.39,22.12,0.3,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,367,TRUE,7f7fb7662fd8ec09029364f408053c954986c8e5,TRUE,TRUE,2024-06-12,2023-11-01,FALSE,TRUE,01-ai/Yi-6B,https://huggingface.co/01-ai/Yi-6B 💬,mistralai/Mistral-7B-Instruct-v0.1,13.57,45.02,0.45,13.79,0.38,1.51,0.02,0,0.24,5.77,0.38,15.34,0.24,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,1472,TRUE,86370fc1f5e0aa51b50dcdf6eada80697b570099,TRUE,TRUE,2024-06-27,2023-09-27,TRUE,TRUE,mistralai/Mistral-7B-Instruct-v0.1,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 🔶,pankajmathur/orca_mini_v3_7b,13.52,28.21,0.28,17.84,0.41,0.3,0,0,0.25,22.71,0.5,12.04,0.21,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,7,40,TRUE,6252eb7ca29da8d951ae7d2bca948bf84e04a2b9,TRUE,TRUE,2024-06-26,2023-08-07,FALSE,FALSE,pankajmathur/orca_mini_v3_7b,https://huggingface.co/pankajmathur/orca_mini_v3_7b 🟢,NousResearch/Yarn-Mistral-7b-64k,13.43,20.8,0.21,20.23,0.43,3.02,0.03,5.37,0.29,9.88,0.41,21.27,0.29,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,49,TRUE,0273c624561fcecc8e8f4030492a9307aa60f945,TRUE,TRUE,2024-06-12,2023-10-31,FALSE,TRUE,NousResearch/Yarn-Mistral-7b-64k,https://huggingface.co/NousResearch/Yarn-Mistral-7b-64k -🟢,meta-llama/Meta-Llama-3-8B,13.41,14.55,0.15,24.5,0.46,3.25,0.03,7.38,0.31,6.24,0.36,24.55,0.32,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,5375,TRUE,62bd457b6fe961a42a631306577e622c83876cb6,TRUE,TRUE,2024-06-12,2024-04-17,FALSE,TRUE,meta-llama/Meta-Llama-3-8B,https://huggingface.co/meta-llama/Meta-Llama-3-8B +🟢,meta-llama/Meta-Llama-3-8B,13.41,14.55,0.15,24.5,0.46,3.25,0.03,7.38,0.31,6.24,0.36,24.55,0.32,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,5382,TRUE,62bd457b6fe961a42a631306577e622c83876cb6,TRUE,TRUE,2024-06-12,2024-04-17,FALSE,TRUE,meta-llama/Meta-Llama-3-8B,https://huggingface.co/meta-llama/Meta-Llama-3-8B 🟢,google/recurrentgemma-9b,13.26,30.76,0.31,14.8,0.39,4.83,0.05,4.7,0.29,6.6,0.38,17.88,0.26,🟢 pretrained,RecurrentGemmaForCausalLM,Original,bfloat16,TRUE,gemma,9,56,TRUE,7b0ed98fb889ba8bdfa7c690f08f2e57a7c48dae,TRUE,TRUE,2024-07-04,2024-06-07,FALSE,TRUE,google/recurrentgemma-9b,https://huggingface.co/google/recurrentgemma-9b 🟢,NousResearch/Yarn-Mistral-7b-128k,13.16,19.34,0.19,20.63,0.43,2.49,0.02,6.49,0.3,8.95,0.41,21.03,0.29,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,568,TRUE,d09f1f8ed437d61c1aff94c1beabee554843dcdd,TRUE,TRUE,2024-06-12,2023-10-31,FALSE,TRUE,NousResearch/Yarn-Mistral-7b-128k,https://huggingface.co/NousResearch/Yarn-Mistral-7b-128k 🔶,pankajmathur/orca_mini_v5_8b_orpo,12.88,8.24,0.08,27.88,0.5,5.97,0.06,4.59,0.28,8.97,0.41,21.63,0.29,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,1,TRUE,4cdc018043ef439f15bd8a09c4f09c6bc528dfc7,TRUE,TRUE,2024-06-26,2024-05-31,FALSE,FALSE,pankajmathur/orca_mini_v5_8b_orpo,https://huggingface.co/pankajmathur/orca_mini_v5_8b_orpo @@ -235,7 +239,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,meta-llama/Llama-2-70b-chat-hf,12.73,49.58,0.5,4.61,0.3,0.91,0.01,1.9,0.26,3.48,0.37,15.92,0.24,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,llama2,68,2124,TRUE,e9149a12809580e8602995856f8098ce973d1080,TRUE,TRUE,2024-06-12,2023-07-14,TRUE,TRUE,meta-llama/Llama-2-70b-chat-hf,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf 🔶,Sao10K/L3-8B-Stheno-v3.3-32K,12.57,46.04,0.46,13.51,0.38,0.98,0.01,0.89,0.26,4.07,0.37,9.95,0.19,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,8,39,TRUE,1a59d163e079c7e7f1542553d085853119960f0c,TRUE,TRUE,2024-06-26,2024-06-22,TRUE,FALSE,Sao10K/L3-8B-Stheno-v3.3-32K,https://huggingface.co/Sao10K/L3-8B-Stheno-v3.3-32K 🟢,Qwen/Qwen1.5-MoE-A2.7B,12.42,26.6,0.27,18.84,0.41,0.15,0,1.23,0.26,7.97,0.4,19.75,0.28,🟢 pretrained,Qwen2MoeForCausalLM,Original,bfloat16,TRUE,other,14,182,TRUE,1a758c50ecb6350748b9ce0a99d2352fd9fc11c9,TRUE,FALSE,2024-06-13,2024-02-29,FALSE,TRUE,Qwen/Qwen1.5-MoE-A2.7B,https://huggingface.co/Qwen/Qwen1.5-MoE-A2.7B -💬,stabilityai/stablelm-zephyr-3b,12.33,36.83,0.37,14.76,0.39,4.08,0.04,0,0.24,9.79,0.42,8.53,0.18,"💬 chat models (RLHF, DPO, IFT, ...)",StableLmForCausalLM,Original,bfloat16,TRUE,other,2,237,TRUE,a14f62d95754d96aea2be6e24c0f6966636797b9,TRUE,TRUE,2024-06-12,2023-11-21,TRUE,TRUE,stabilityai/stablelm-zephyr-3b,https://huggingface.co/stabilityai/stablelm-zephyr-3b +💬,stabilityai/stablelm-zephyr-3b,12.33,36.83,0.37,14.76,0.39,4.08,0.04,0,0.24,9.79,0.42,8.53,0.18,"💬 chat models (RLHF, DPO, IFT, ...)",StableLmForCausalLM,Original,bfloat16,TRUE,other,2,236,TRUE,a14f62d95754d96aea2be6e24c0f6966636797b9,TRUE,TRUE,2024-06-12,2023-11-21,TRUE,TRUE,stabilityai/stablelm-zephyr-3b,https://huggingface.co/stabilityai/stablelm-zephyr-3b 💬,Qwen/Qwen1.5-4B-Chat,12.33,31.57,0.32,16.3,0.4,0.98,0.01,2.24,0.27,7.36,0.4,15.51,0.24,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,3,34,TRUE,a7a4d4945d28bac955554c9abd2f74a71ebbf22f,TRUE,TRUE,2024-06-12,2024-01-30,TRUE,TRUE,Qwen/Qwen1.5-4B-Chat,https://huggingface.co/Qwen/Qwen1.5-4B-Chat 🟢,bigcode/starcoder2-15b,12.21,27.35,0.27,20.24,0.44,4.83,0.05,2.91,0.27,2.93,0.35,15.03,0.24,🟢 pretrained,Starcoder2ForCausalLM,Original,bfloat16,TRUE,bigcode-openrail-m,15,540,TRUE,46d44742909c03ac8cee08eb03fdebce02e193ec,TRUE,TRUE,2024-06-09,2024-02-20,FALSE,TRUE,bigcode/starcoder2-15b,https://huggingface.co/bigcode/starcoder2-15b 💬,Enno-Ai/EnnoAi-Pro-Llama-3-8B,12.17,31.95,0.32,17.51,0.42,0.15,0,1.57,0.26,9.08,0.41,12.79,0.22,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,creativeml-openrail-m,8,0,TRUE,6a5d745bdd304753244fe601e2a958d37d13cd71,TRUE,TRUE,2024-07-08,2024-07-01,TRUE,FALSE,Enno-Ai/EnnoAi-Pro-Llama-3-8B,https://huggingface.co/Enno-Ai/EnnoAi-Pro-Llama-3-8B @@ -250,6 +254,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,meta-llama/Llama-2-13b-chat-hf,11,39.85,0.4,7.16,0.33,0.6,0.01,0,0.23,8.16,0.4,10.26,0.19,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,llama2,13,998,TRUE,a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8,TRUE,TRUE,2024-06-12,2023-07-13,TRUE,TRUE,meta-llama/Llama-2-13b-chat-hf,https://huggingface.co/meta-llama/Llama-2-13b-chat-hf 🟢,meta-llama/Llama-2-13b-hf,10.99,24.82,0.25,17.22,0.41,1.06,0.01,4.14,0.28,3.39,0.35,15.31,0.24,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,llama2,13,563,TRUE,5c31dfb671ce7cfe2d7bb7c04375e44c55e815b1,TRUE,TRUE,2024-06-12,2023-07-13,FALSE,TRUE,meta-llama/Llama-2-13b-hf,https://huggingface.co/meta-llama/Llama-2-13b-hf 💬,THUDM/glm-4-9b-chat,10.97,0,0,25.21,0.47,0,0,8.5,0.31,8.06,0.4,24.07,0.32,"💬 chat models (RLHF, DPO, IFT, ...)",ChatGLMModelM,Original,bfloat16,TRUE,other,9,478,TRUE,04419001bc63e05e70991ade6da1f91c4aeec278,TRUE,TRUE,2024-07-09,2024-06-04,TRUE,FALSE,THUDM/glm-4-9b-chat,https://huggingface.co/THUDM/glm-4-9b-chat +🔶,Josephgflowers/Cinder-Phi-2-V1-F16-gguf,10.86,23.57,0.24,22.45,0.44,0,0,4.25,0.28,1.97,0.34,12.9,0.22,🔶 fine-tuned on domain-specific datasets,PhiForCausalLM,Original,float16,TRUE,mit,2,4,TRUE,85629ec9b18efee31d07630664e7a3815121badf,TRUE,TRUE,2024-06-26,2024-02-25,TRUE,FALSE,Josephgflowers/Cinder-Phi-2-V1-F16-gguf,https://huggingface.co/Josephgflowers/Cinder-Phi-2-V1-F16-gguf 🔶,lmsys/vicuna-7b-v1.5,10.78,23.52,0.24,15.15,0.39,0.76,0.01,1.12,0.26,11.42,0.42,12.74,0.21,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,llama2,7,268,TRUE,3321f76e3f527bd14065daf69dad9344000a201d,TRUE,TRUE,2024-06-12,2023-07-29,FALSE,TRUE,lmsys/vicuna-7b-v1.5,https://huggingface.co/lmsys/vicuna-7b-v1.5 💬,allenai/OLMo-7B-Instruct-hf,10.73,34.73,0.35,13.16,0.37,0.68,0.01,2.8,0.27,4.33,0.38,8.69,0.18,"💬 chat models (RLHF, DPO, IFT, ...)",OlmoForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,2ea947518df93433aa71219f29b36c72ac63be95,TRUE,TRUE,2024-06-27,2024-06-04,TRUE,TRUE,allenai/OLMo-7B-Instruct-hf,https://huggingface.co/allenai/OLMo-7B-Instruct-hf 💬,internlm/internlm2-chat-1_8b,10.5,23.87,0.24,20.67,0.45,2.42,0.02,2.13,0.27,4.61,0.36,9.33,0.18,"💬 chat models (RLHF, DPO, IFT, ...)",InternLM2ForCausalLM,Original,bfloat16,TRUE,other,1,25,TRUE,4e226eeb354499f4d34ef4c27f6939f377475cc1,TRUE,TRUE,2024-06-12,2024-01-30,TRUE,TRUE,internlm/internlm2-chat-1_8b,https://huggingface.co/internlm/internlm2-chat-1_8b @@ -261,13 +266,13 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🔶,skymizer/Llama2-7b-sft-chat-custom-template-dpo,10.07,23.53,0.24,11.24,0.37,0.98,0.01,0,0.24,14.12,0.44,10.52,0.19,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama2,6,0,TRUE,22302ebd8c551a5f302fcb8366cc61fdeedf0e00,TRUE,TRUE,2024-07-01,2024-06-11,FALSE,FALSE,skymizer/Llama2-7b-sft-chat-custom-template-dpo,https://huggingface.co/skymizer/Llama2-7b-sft-chat-custom-template-dpo 🟩,pszemraj/Mistral-v0.3-6B,10.03,24.54,0.25,13.52,0.38,0.83,0.01,2.01,0.27,6.61,0.39,12.7,0.21,🟩 continuously pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,5,1,TRUE,ae11a699012b83996361f04808f4d45debf3b01c,TRUE,TRUE,2024-06-26,2024-05-25,FALSE,FALSE,pszemraj/Mistral-v0.3-6B,https://huggingface.co/pszemraj/Mistral-v0.3-6B 🔶,teknium/OpenHermes-7B,9.48,18.13,0.18,12.08,0.36,1.06,0.01,2.57,0.27,12.68,0.43,10.37,0.19,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,mit,7,13,TRUE,9f55d6eb15f1edd52ee1fd863a220aa682e78a00,TRUE,TRUE,2024-06-12,2023-09-14,FALSE,TRUE,teknium/OpenHermes-7B,https://huggingface.co/teknium/OpenHermes-7B -💬,meta-llama/Llama-2-7b-chat-hf,9.4,39.65,0.4,4.49,0.31,0.68,0.01,0.56,0.25,3.48,0.37,7.52,0.17,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,llama2,6,3707,TRUE,f5db02db724555f92da89c216ac04704f23d4590,TRUE,TRUE,2024-06-12,2023-07-13,TRUE,TRUE,meta-llama/Llama-2-7b-chat-hf,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf +💬,meta-llama/Llama-2-7b-chat-hf,9.4,39.65,0.4,4.49,0.31,0.68,0.01,0.56,0.25,3.48,0.37,7.52,0.17,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,llama2,6,3708,TRUE,f5db02db724555f92da89c216ac04704f23d4590,TRUE,TRUE,2024-06-12,2023-07-13,TRUE,TRUE,meta-llama/Llama-2-7b-chat-hf,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf 🔶,NousResearch/Nous-Hermes-llama-2-7b,9.28,17.29,0.17,13.79,0.38,0.68,0.01,1.79,0.26,11.68,0.43,10.44,0.19,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,mit,6,67,TRUE,b7c3ec54b754175e006ef75696a2ba3802697078,TRUE,TRUE,2024-06-12,2023-07-25,FALSE,TRUE,NousResearch/Nous-Hermes-llama-2-7b,https://huggingface.co/NousResearch/Nous-Hermes-llama-2-7b 💬,stabilityai/stablelm-2-zephyr-1_6b,9.26,32.79,0.33,6.71,0.34,2.11,0.02,0,0.24,5.99,0.35,7.93,0.17,"💬 chat models (RLHF, DPO, IFT, ...)",StableLmForCausalLM,Original,float16,TRUE,other,1,174,TRUE,2f275b1127d59fc31e4f7c7426d528768ada9ea4,TRUE,TRUE,2024-06-12,2024-01-19,TRUE,TRUE,stabilityai/stablelm-2-zephyr-1_6b,https://huggingface.co/stabilityai/stablelm-2-zephyr-1_6b 🟢,Qwen/Qwen1.5-1.8B,9.12,21.54,0.22,9.76,0.35,2.27,0.02,7.38,0.31,3.96,0.36,9.8,0.19,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,1,43,TRUE,7846de7ed421727b318d6605a0bfab659da2c067,TRUE,TRUE,2024-06-13,2024-01-22,FALSE,TRUE,Qwen/Qwen1.5-1.8B,https://huggingface.co/Qwen/Qwen1.5-1.8B 💬,Qwen/Qwen1.5-1.8B-Chat,9.01,20.19,0.2,5.91,0.33,0.45,0,6.38,0.3,12.18,0.43,8.93,0.18,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,1,43,TRUE,e482ee3f73c375a627a16fdf66fd0c8279743ca6,TRUE,TRUE,2024-06-12,2024-01-30,TRUE,TRUE,Qwen/Qwen1.5-1.8B-Chat,https://huggingface.co/Qwen/Qwen1.5-1.8B-Chat 🔶,TencentARC/LLaMA-Pro-8B,8.78,22.77,0.23,9.29,0.35,1.66,0.02,1.34,0.26,8.59,0.4,9.01,0.18,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama2,8,170,TRUE,7115e7179060e0623d1ee9ff4476faed7e478d8c,TRUE,TRUE,2024-06-12,2024-01-05,FALSE,TRUE,TencentARC/LLaMA-Pro-8B,https://huggingface.co/TencentARC/LLaMA-Pro-8B -🟢,meta-llama/Llama-2-7b-hf,8.72,25.19,0.25,10.35,0.35,1.21,0.01,2.24,0.27,3.76,0.37,9.57,0.19,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,llama2,6,1588,TRUE,01c7f73d771dfac7d292323805ebc428287df4f9,TRUE,TRUE,2024-06-12,2023-07-13,FALSE,TRUE,meta-llama/Llama-2-7b-hf,https://huggingface.co/meta-llama/Llama-2-7b-hf +🟢,meta-llama/Llama-2-7b-hf,8.72,25.19,0.25,10.35,0.35,1.21,0.01,2.24,0.27,3.76,0.37,9.57,0.19,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,llama2,6,1589,TRUE,01c7f73d771dfac7d292323805ebc428287df4f9,TRUE,TRUE,2024-06-12,2023-07-13,FALSE,TRUE,meta-llama/Llama-2-7b-hf,https://huggingface.co/meta-llama/Llama-2-7b-hf 💬,stabilityai/stablelm-2-1_6b-chat,8.63,30.6,0.31,7.49,0.34,1.06,0.01,0,0.25,5.71,0.36,6.91,0.16,"💬 chat models (RLHF, DPO, IFT, ...)",StableLmForCausalLM,Original,bfloat16,TRUE,other,1,26,TRUE,f3fe67057c2789ae1bb1fe42b038da99840d4f13,TRUE,TRUE,2024-06-12,2024-04-08,TRUE,TRUE,stabilityai/stablelm-2-1_6b-chat,https://huggingface.co/stabilityai/stablelm-2-1_6b-chat 🟢,internlm/internlm2-1_8b,8.58,21.98,0.22,13.63,0.39,1.13,0.01,0,0.25,8.23,0.38,6.54,0.16,🟢 pretrained,InternLM2ForCausalLM,Original,bfloat16,TRUE,other,8,25,TRUE,c24f301c7374ad9f9b58d1ea80f68b5f57cbca13,TRUE,TRUE,2024-06-12,2024-01-30,FALSE,TRUE,internlm/internlm2-1_8b,https://huggingface.co/internlm/internlm2-1_8b 🟢,NousResearch/Yarn-Llama-2-13b-128k,8.39,16.55,0.17,13.51,0.38,1.13,0.01,1.12,0.26,3.39,0.35,14.67,0.23,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,"",13,113,TRUE,4e3e87a067f64f8814c83dd5e3bad92dcf8a2391,TRUE,TRUE,2024-06-13,2023-08-30,FALSE,TRUE,NousResearch/Yarn-Llama-2-13b-128k,https://huggingface.co/NousResearch/Yarn-Llama-2-13b-128k @@ -278,19 +283,19 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,google/recurrentgemma-2b-it,8.06,29.49,0.29,8.11,0.33,1.74,0.02,1.01,0.26,3.62,0.34,4.41,0.14,"💬 chat models (RLHF, DPO, IFT, ...)",RecurrentGemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,101,TRUE,150248167d171fbdf4b02e7d28a4b3d749e570f6,TRUE,TRUE,2024-06-12,2024-04-08,TRUE,TRUE,google/recurrentgemma-2b-it,https://huggingface.co/google/recurrentgemma-2b-it 💬,google/gemma-1.1-2b-it,7.78,30.67,0.31,5.86,0.32,0.15,0,2.57,0.27,2.02,0.34,5.37,0.15,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,133,TRUE,bf4924f313df5166dee1467161e886e55f2eb4d4,TRUE,TRUE,2024-06-12,2024-03-26,TRUE,TRUE,google/gemma-1.1-2b-it,https://huggingface.co/google/gemma-1.1-2b-it 🟢,ibm-granite/granite-7b-base,7.75,24.14,0.24,9.05,0.35,0.6,0.01,0,0.25,3.4,0.36,9.27,0.18,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,21,TRUE,23fcb4cb5b69f8a122fb944491e9f1ad664ba37b,TRUE,TRUE,2024-06-12,2024-04-19,FALSE,TRUE,ibm-granite/granite-7b-base,https://huggingface.co/ibm-granite/granite-7b-base -🟢,tensoropera/Fox-1-1.6B,7.69,27.66,0.28,7.4,0.33,1.28,0.01,1.79,0.26,3.87,0.35,4.13,0.14,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,20,TRUE,6389dde4d7e52aa1200ad954c565f03c7fdcf8db,TRUE,TRUE,2024-06-29,2024-06-13,FALSE,FALSE,tensoropera/Fox-1-1.6B,https://huggingface.co/tensoropera/Fox-1-1.6B +🟢,tensoropera/Fox-1-1.6B,7.69,27.66,0.28,7.4,0.33,1.28,0.01,1.79,0.26,3.87,0.35,4.13,0.14,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,21,TRUE,6389dde4d7e52aa1200ad954c565f03c7fdcf8db,TRUE,TRUE,2024-06-29,2024-06-13,FALSE,FALSE,tensoropera/Fox-1-1.6B,https://huggingface.co/tensoropera/Fox-1-1.6B 🔶,VAGOsolutions/SauerkrautLM-Gemma-2b,7.58,24.75,0.25,9.13,0.34,1.96,0.02,0.89,0.26,3.51,0.37,5.21,0.15,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,bfloat16,TRUE,other,2,8,TRUE,f9d5575c23da96f33ce77dea3b0776746b9469bc,TRUE,TRUE,2024-06-26,2024-03-06,TRUE,FALSE,VAGOsolutions/SauerkrautLM-Gemma-2b,https://huggingface.co/VAGOsolutions/SauerkrautLM-Gemma-2b 🟢,deepseek-ai/deepseek-moe-16b-base,7.37,24.5,0.24,8.36,0.34,1.81,0.02,0.56,0.25,3.36,0.37,5.61,0.15,🟢 pretrained,DeepseekForCausalLM,Original,bfloat16,TRUE,other,16,77,TRUE,521d2bc4fb69a3f3ae565310fcc3b65f97af2580,TRUE,FALSE,2024-06-12,2024-01-08,FALSE,TRUE,deepseek-ai/deepseek-moe-16b-base,https://huggingface.co/deepseek-ai/deepseek-moe-16b-base 🟢,google/gemma-2b,7.27,20.38,0.2,8.25,0.34,2.72,0.03,0.67,0.26,7.56,0.4,4.06,0.14,🟢 pretrained,GemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,805,TRUE,2ac59a5d7bf4e1425010f0d457dde7d146658953,TRUE,TRUE,2024-06-12,2024-02-08,FALSE,TRUE,google/gemma-2b,https://huggingface.co/google/gemma-2b 🟢,stabilityai/stablelm-3b-4e1t,7.26,22.03,0.22,9.01,0.35,0.68,0.01,0,0.24,4.42,0.38,7.43,0.17,🟢 pretrained,StableLmForCausalLM,Original,bfloat16,TRUE,cc-by-sa-4.0,2,305,TRUE,fa4a6a92fca83c3b4223a3c9bf792887090ebfba,TRUE,TRUE,2024-06-12,2023-09-29,FALSE,TRUE,stabilityai/stablelm-3b-4e1t,https://huggingface.co/stabilityai/stablelm-3b-4e1t -💬,google/gemma-2b-it,7.22,26.9,0.27,5.21,0.32,0.45,0,3.8,0.28,3.03,0.33,3.92,0.14,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,592,TRUE,de144fb2268dee1066f515465df532c05e699d48,TRUE,TRUE,2024-06-12,2024-02-08,TRUE,TRUE,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it +💬,google/gemma-2b-it,7.22,26.9,0.27,5.21,0.32,0.45,0,3.8,0.28,3.03,0.33,3.92,0.14,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,593,TRUE,de144fb2268dee1066f515465df532c05e699d48,TRUE,TRUE,2024-06-12,2024-02-08,TRUE,TRUE,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it 🔶,cgato/TheSalt-L3-8b-v0.3.2,7.19,27.05,0.27,2.61,0.3,3.47,0.03,2.13,0.27,6.3,0.39,1.55,0.11,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,8,1,TRUE,5cf08e2bf9590ebcd14ba021e113def28c65afa2,TRUE,TRUE,2024-06-26,2024-06-18,TRUE,FALSE,cgato/TheSalt-L3-8b-v0.3.2,https://huggingface.co/cgato/TheSalt-L3-8b-v0.3.2 🟢,NousResearch/Yarn-Llama-2-7b-64k,7.12,17,0.17,7.04,0.33,0.98,0.01,1.9,0.26,6.93,0.39,8.87,0.18,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,"",7,23,TRUE,08491431ac3b50add7443f5d4c02850801d877be,TRUE,TRUE,2024-06-13,2023-08-30,FALSE,TRUE,NousResearch/Yarn-Llama-2-7b-64k,https://huggingface.co/NousResearch/Yarn-Llama-2-7b-64k 🟢,Qwen/Qwen2-0.5B,7.06,18.67,0.19,7.99,0.33,2.57,0.03,0.78,0.26,4.6,0.38,7.76,0.17,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,58,TRUE,ff3a49fac17555b8dfc4db6709f480cc8f16a9fe,TRUE,TRUE,2024-06-09,2024-05-31,FALSE,TRUE,Qwen/Qwen2-0.5B,https://huggingface.co/Qwen/Qwen2-0.5B 🟢,microsoft/phi-1_5,7.06,20.33,0.2,7.47,0.34,1.13,0.01,2.35,0.27,3.39,0.34,7.68,0.17,🟢 pretrained,PhiForCausalLM,Original,float16,TRUE,mit,1,1296,TRUE,675aa382d814580b22651a30acb1a585d7c25963,TRUE,TRUE,2024-06-09,2023-09-10,FALSE,TRUE,microsoft/phi-1_5,https://huggingface.co/microsoft/phi-1_5 🟢,google/recurrentgemma-2b,6.94,30.02,0.3,5.01,0.32,1.66,0.02,0,0.25,2.94,0.34,1.99,0.12,🟢 pretrained,RecurrentGemmaForCausalLM,Original,bfloat16,TRUE,gemma,2,89,TRUE,195f13c55b371fc721eda0662c00c64642c70e17,TRUE,TRUE,2024-06-13,2024-04-06,FALSE,TRUE,google/recurrentgemma-2b,https://huggingface.co/google/recurrentgemma-2b 🟢,databricks/dolly-v1-6b,6.89,22.24,0.22,4.78,0.32,1.36,0.01,1.9,0.26,8.12,0.4,2.95,0.13,🟢 pretrained,GPTJForCausalLM,Original,bfloat16,TRUE,cc-by-nc-4.0,6,310,TRUE,c9a85b3a322b402e20c839c702c725afe0cb454d,TRUE,TRUE,2024-06-12,2023-03-23,FALSE,TRUE,databricks/dolly-v1-6b,https://huggingface.co/databricks/dolly-v1-6b -🟢,HuggingFaceTB/SmolLM-135M,6.84,21.25,0.21,3.29,0.3,0.68,0.01,1.12,0.26,13.34,0.44,1.36,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,61,TRUE,eec6e461571fba3e197a57c298f60b75422eae02,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-135M,https://huggingface.co/HuggingFaceTB/SmolLM-135M +🟢,HuggingFaceTB/SmolLM-135M,6.84,21.25,0.21,3.29,0.3,0.68,0.01,1.12,0.26,13.34,0.44,1.36,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,62,TRUE,eec6e461571fba3e197a57c298f60b75422eae02,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-135M,https://huggingface.co/HuggingFaceTB/SmolLM-135M 🔶,togethercomputer/GPT-JT-6B-v1,6.83,20.61,0.21,7.32,0.33,0.76,0.01,1.45,0.26,3.87,0.37,6.95,0.16,🔶 fine-tuned on domain-specific datasets,GPTJForCausalLM,Original,float16,TRUE,apache-2.0,6,302,TRUE,f34aa35f906895602c1f86f5685e598afdea8051,TRUE,TRUE,2024-06-12,2022-11-24,FALSE,TRUE,togethercomputer/GPT-JT-6B-v1,https://huggingface.co/togethercomputer/GPT-JT-6B-v1 🟢,allenai/OLMo-7B-hf,6.78,27.19,0.27,5.76,0.33,0.68,0.01,3.02,0.27,2.08,0.35,1.92,0.12,🟢 pretrained,OlmoForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,8,TRUE,687d934d36a05417048d0fe7482f24f389fef6aa,TRUE,TRUE,2024-06-27,2024-04-12,FALSE,TRUE,allenai/OLMo-7B-hf,https://huggingface.co/allenai/OLMo-7B-hf 🔶,togethercomputer/LLaMA-2-7B-32K,6.71,18.65,0.19,8.09,0.34,0.68,0.01,0,0.25,4.32,0.38,8.53,0.18,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,llama2,7,526,TRUE,46c24bb5aef59722fa7aa6d75e832afd1d64b980,TRUE,TRUE,2024-06-12,2023-07-26,FALSE,TRUE,togethercomputer/LLaMA-2-7B-32K,https://huggingface.co/togethercomputer/LLaMA-2-7B-32K @@ -298,9 +303,9 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🟢,EleutherAI/gpt-j-6b,6.55,25.22,0.25,4.91,0.32,1.21,0.01,0,0.25,5.25,0.37,2.68,0.12,🟢 pretrained,GPTJForCausalLM,Original,bfloat16,TRUE,apache-2.0,6,1388,TRUE,47e169305d2e8376be1d31e765533382721b2cc1,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,EleutherAI/gpt-j-6b,https://huggingface.co/EleutherAI/gpt-j-6b 🔶,winglian/llama-3-8b-256k-PoSE,6.55,29.09,0.29,5.5,0.32,1.44,0.01,1.01,0.26,0.94,0.33,1.29,0.11,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,"",8,41,FALSE,93e7b0b6433c96583ffcef3bc47203e6fdcbbe8b,TRUE,TRUE,2024-06-26,2024-04-26,TRUE,FALSE,winglian/llama-3-8b-256k-PoSE,https://huggingface.co/winglian/llama-3-8b-256k-PoSE 🟢,bigcode/starcoder2-3b,6.54,20.37,0.2,8.91,0.35,1.44,0.01,0,0.24,1.43,0.34,7.07,0.16,🟢 pretrained,Starcoder2ForCausalLM,Original,bfloat16,TRUE,bigcode-openrail-m,3,125,TRUE,733247c55e3f73af49ce8e9c7949bf14af205928,TRUE,TRUE,2024-06-09,2023-11-29,FALSE,TRUE,bigcode/starcoder2-3b,https://huggingface.co/bigcode/starcoder2-3b -🟢,gpt2,6.54,18.08,0.18,2.67,0.3,0.23,0,1.12,0.26,15.35,0.45,1.77,0.12,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,2096,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-09,2022-03-02,FALSE,TRUE,gpt2,https://huggingface.co/gpt2 +🟢,gpt2,6.54,18.08,0.18,2.67,0.3,0.23,0,1.12,0.26,15.35,0.45,1.77,0.12,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,2102,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-09,2022-03-02,FALSE,TRUE,gpt2,https://huggingface.co/gpt2 🟩,BEE-spoke-data/smol_llama-220M-GQA-fineweb_edu,6.52,19.88,0.2,2.31,0.29,0,0,1.23,0.26,14.26,0.44,1.41,0.11,🟩 continuously pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,1,TRUE,dec16b41d5e94070dbc1f8449a554373fd4cc1d1,TRUE,TRUE,2024-06-26,2024-06-08,FALSE,FALSE,BEE-spoke-data/smol_llama-220M-GQA-fineweb_edu,https://huggingface.co/BEE-spoke-data/smol_llama-220M-GQA-fineweb_edu -🟢,openai-community/gpt2,6.51,17.93,0.18,2.67,0.3,0.23,0,1.12,0.26,15.35,0.45,1.77,0.12,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,2096,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,openai-community/gpt2,https://huggingface.co/openai-community/gpt2 +🟢,openai-community/gpt2,6.51,17.93,0.18,2.67,0.3,0.23,0,1.12,0.26,15.35,0.45,1.77,0.12,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,2102,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,openai-community/gpt2,https://huggingface.co/openai-community/gpt2 🟢,allenai/OLMo-1B-hf,6.47,21.82,0.22,3.2,0.31,0.76,0.01,1.57,0.26,9.56,0.41,1.93,0.12,🟢 pretrained,OlmoForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,10,TRUE,8e995430edd24416ccfa98b5b283fa07b0c9f1a9,TRUE,TRUE,2024-06-12,2024-04-12,FALSE,TRUE,allenai/OLMo-1B-hf,https://huggingface.co/allenai/OLMo-1B-hf 🟢,BEE-spoke-data/smol_llama-220M-GQA,6.4,23.86,0.24,3.04,0.3,0,0,0.78,0.26,9.07,0.41,1.66,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,11,TRUE,8845b1d3c0bc73522ef2700aab467183cbdca9f7,TRUE,TRUE,2024-06-26,2023-12-22,FALSE,FALSE,BEE-spoke-data/smol_llama-220M-GQA,https://huggingface.co/BEE-spoke-data/smol_llama-220M-GQA 💬,Qwen/Qwen2-0.5B-Instruct,6.39,22.47,0.22,5.88,0.32,1.66,0.02,0,0.25,2.41,0.34,5.9,0.15,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,103,TRUE,c291d6fce4804a1d39305f388dd32897d1f7acc4,TRUE,TRUE,2024-06-12,2024-06-03,TRUE,TRUE,Qwen/Qwen2-0.5B-Instruct,https://huggingface.co/Qwen/Qwen2-0.5B-Instruct @@ -308,10 +313,10 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🟢,EleutherAI/gpt-neo-2.7B,6.34,25.9,0.26,4.18,0.31,0.53,0.01,2.13,0.27,3.52,0.36,1.81,0.12,🟢 pretrained,GPTNeoForCausalLM,Original,bfloat16,TRUE,mit,2,399,TRUE,e24fa291132763e59f4a5422741b424fb5d59056,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,EleutherAI/gpt-neo-2.7B,https://huggingface.co/EleutherAI/gpt-neo-2.7B 🔶,togethercomputer/RedPajama-INCITE-7B-Instruct,6.33,20.55,0.21,7.91,0.34,1.36,0.01,0.11,0.25,5.03,0.37,3.03,0.13,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,7,104,TRUE,7f36397b9985a3f981cdb618f8fec1c565ca5927,TRUE,TRUE,2024-06-12,2023-05-05,FALSE,TRUE,togethercomputer/RedPajama-INCITE-7B-Instruct,https://huggingface.co/togethercomputer/RedPajama-INCITE-7B-Instruct 🟢,facebook/opt-30b,6.2,24.53,0.25,3.5,0.31,0.6,0.01,2.57,0.27,4.19,0.36,1.82,0.12,🟢 pretrained,OPTForCausalLM,Original,float16,TRUE,other,30,133,TRUE,ceea0a90ac0f6fae7c2c34bcb40477438c152546,TRUE,TRUE,2024-06-12,2022-05-11,FALSE,TRUE,facebook/opt-30b,https://huggingface.co/facebook/opt-30b -🟢,HuggingFaceTB/SmolLM-360M,6.15,21.34,0.21,3.28,0.31,0.45,0,2.35,0.27,8.09,0.4,1.37,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,24,TRUE,318cc630b73730bfd712e5873063156ffb8936b5,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-360M,https://huggingface.co/HuggingFaceTB/SmolLM-360M +🟢,HuggingFaceTB/SmolLM-360M,6.15,21.34,0.21,3.28,0.31,0.45,0,2.35,0.27,8.09,0.4,1.37,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,25,TRUE,318cc630b73730bfd712e5873063156ffb8936b5,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-360M,https://huggingface.co/HuggingFaceTB/SmolLM-360M 🟢,EleutherAI/gpt-neox-20b,5.99,25.87,0.26,4.93,0.32,0.6,0.01,0,0.24,2.82,0.36,1.73,0.12,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,20,504,TRUE,c292233c833e336628618a88a648727eb3dff0a7,TRUE,TRUE,2024-06-09,2022-04-07,FALSE,TRUE,EleutherAI/gpt-neox-20b,https://huggingface.co/EleutherAI/gpt-neox-20b 🟢,mosaicml/mpt-7b,5.98,21.52,0.22,6.55,0.33,1.28,0.01,1.34,0.26,2.9,0.37,2.29,0.12,🟢 pretrained,MPTForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,1151,TRUE,039e37745f00858f0e01e988383a8c4393b1a4f5,TRUE,TRUE,2024-06-08,2023-05-05,FALSE,TRUE,mosaicml/mpt-7b,https://huggingface.co/mosaicml/mpt-7b -🟢,gpt2,5.98,8.33,0.08,9.2,0.31,0,0,0,0.23,18.33,0.43,0,0.1,🟢 pretrained,GPT2LMHeadModel,Original,float16,TRUE,mit,0,2096,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-26,2022-03-02,FALSE,TRUE,gpt2,https://huggingface.co/gpt2 +🟢,gpt2,5.98,8.33,0.08,9.2,0.31,0,0,0,0.23,18.33,0.43,0,0.1,🟢 pretrained,GPT2LMHeadModel,Original,float16,TRUE,mit,0,2102,TRUE,607a30d783dfa663caf39e06633721c8d4cfcd7e,TRUE,TRUE,2024-06-26,2022-03-02,FALSE,TRUE,gpt2,https://huggingface.co/gpt2 🟢,EleutherAI/pythia-12b,5.93,24.71,0.25,4.99,0.32,0.91,0.01,0,0.25,3.79,0.36,1.21,0.11,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,12,129,TRUE,35c9d7f32fbb108fb8b5bdd574eb03369d1eed49,TRUE,TRUE,2024-06-12,2023-02-28,FALSE,TRUE,EleutherAI/pythia-12b,https://huggingface.co/EleutherAI/pythia-12b 🟢,EleutherAI/pythia-6.9b,5.85,22.81,0.23,5.88,0.32,0.76,0.01,0.22,0.25,3.81,0.36,1.63,0.11,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,6,41,TRUE,f271943e880e60c0c715fd10e4dc74ec4e31eb44,TRUE,TRUE,2024-06-12,2023-02-14,FALSE,TRUE,EleutherAI/pythia-6.9b,https://huggingface.co/EleutherAI/pythia-6.9b 🔶,Josephgflowers/TinyLlama-Cinder-Agent-v1,5.82,26.7,0.27,3.8,0.31,0.38,0,0,0.24,2.23,0.34,1.79,0.12,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,mit,1,0,TRUE,a9cd8b48bfe30f29bb1f819213da9a4c41eee67f,TRUE,TRUE,2024-06-26,2024-05-21,TRUE,FALSE,Josephgflowers/TinyLlama-Cinder-Agent-v1,https://huggingface.co/Josephgflowers/TinyLlama-Cinder-Agent-v1 @@ -323,18 +328,18 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 💬,Qwen/Qwen1.5-0.5B-Chat,5.56,18.07,0.18,4.32,0.32,0,0,2.57,0.27,6.06,0.38,2.36,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,0,72,TRUE,4d14e384a4b037942bb3f3016665157c8bcb70ea,TRUE,TRUE,2024-06-12,2024-01-31,TRUE,TRUE,Qwen/Qwen1.5-0.5B-Chat,https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat 🟢,microsoft/phi-1,5.52,20.68,0.21,4.27,0.31,0.68,0.01,2.01,0.27,3.7,0.35,1.8,0.12,🟢 pretrained,PhiForCausalLM,Original,bfloat16,TRUE,mit,1,199,TRUE,b9ac0e6d78d43970ecf88e9e0154b3a7da20ed89,TRUE,TRUE,2024-06-13,2023-09-10,FALSE,TRUE,microsoft/phi-1,https://huggingface.co/microsoft/phi-1 🔶,pankajmathur/orca_mini_v2_7b,5.5,13.58,0.14,10.2,0.35,1.13,0.01,0,0.25,2.08,0.36,6.02,0.15,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-sa-4.0,7,36,TRUE,66d3f32a4a6bca0a2a261f1bdb54d2582028f75f,TRUE,TRUE,2024-06-26,2023-07-03,FALSE,FALSE,pankajmathur/orca_mini_v2_7b,https://huggingface.co/pankajmathur/orca_mini_v2_7b -🟢,openai-community/gpt2-large,5.48,20.48,0.2,3.25,0.31,0.68,0.01,1.23,0.26,5.66,0.38,1.58,0.11,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,243,TRUE,32b71b12589c2f8d625668d2335a01cac3249519,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,openai-community/gpt2-large,https://huggingface.co/openai-community/gpt2-large +🟢,openai-community/gpt2-large,5.48,20.48,0.2,3.25,0.31,0.68,0.01,1.23,0.26,5.66,0.38,1.58,0.11,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,242,TRUE,32b71b12589c2f8d625668d2335a01cac3249519,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,openai-community/gpt2-large,https://huggingface.co/openai-community/gpt2-large 🟢,togethercomputer/RedPajama-INCITE-7B-Base,5.46,20.82,0.21,5.09,0.32,0.98,0.01,0.67,0.26,3.02,0.36,2.19,0.12,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,7,93,TRUE,78f7e482443971f4873ba3239f0ac810a367833b,TRUE,TRUE,2024-06-12,2023-05-04,FALSE,TRUE,togethercomputer/RedPajama-INCITE-7B-Base,https://huggingface.co/togethercomputer/RedPajama-INCITE-7B-Base 🔶,databricks/dolly-v2-3b,5.45,22.47,0.22,3.32,0.31,0.6,0.01,1.45,0.26,3.22,0.33,1.61,0.11,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,bfloat16,TRUE,mit,3,284,TRUE,f6c9be08f16fe4d3a719bee0a4a7c7415b5c65df,TRUE,TRUE,2024-06-12,2023-04-13,FALSE,TRUE,databricks/dolly-v2-3b,https://huggingface.co/databricks/dolly-v2-3b 🟢,EleutherAI/pythia-2.8b,5.44,21.73,0.22,5.08,0.32,0.68,0.01,0,0.25,3.64,0.35,1.52,0.11,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,2,28,TRUE,2a259cdd96a4beb1cdf467512e3904197345f6a9,TRUE,TRUE,2024-06-12,2023-02-13,FALSE,TRUE,EleutherAI/pythia-2.8b,https://huggingface.co/EleutherAI/pythia-2.8b 🟢,togethercomputer/RedPajama-INCITE-Base-3B-v1,5.43,22.94,0.23,3.52,0.31,0.91,0.01,0,0.24,4,0.37,1.24,0.11,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,3,91,TRUE,094fbdd0c911feb485ce55de1952ab2e75277e1e,TRUE,TRUE,2024-06-12,2023-05-04,FALSE,TRUE,togethercomputer/RedPajama-INCITE-Base-3B-v1,https://huggingface.co/togethercomputer/RedPajama-INCITE-Base-3B-v1 -🟢,HuggingFaceTB/SmolLM-1.7B,5.43,23.62,0.24,4.41,0.32,0.76,0.01,0,0.24,2.13,0.34,1.64,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,85,TRUE,673a07602ca1191e5bc2ddda428e2f608a0a14c0,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-1.7B,https://huggingface.co/HuggingFaceTB/SmolLM-1.7B +🟢,HuggingFaceTB/SmolLM-1.7B,5.43,23.62,0.24,4.41,0.32,0.76,0.01,0,0.24,2.13,0.34,1.64,0.11,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,89,TRUE,673a07602ca1191e5bc2ddda428e2f608a0a14c0,TRUE,TRUE,2024-07-18,2024-07-14,FALSE,FALSE,HuggingFaceTB/SmolLM-1.7B,https://huggingface.co/HuggingFaceTB/SmolLM-1.7B 🔶,PygmalionAI/pygmalion-6b,5.39,20.91,0.21,5.09,0.32,0.6,0.01,0,0.25,3.71,0.37,2.04,0.12,🔶 fine-tuned on domain-specific datasets,GPTJForCausalLM,Original,float16,TRUE,creativeml-openrail-m,6,725,TRUE,2a0d74449c8fbf0378194e95f64aa92e16297294,TRUE,TRUE,2024-06-12,2023-01-07,FALSE,TRUE,PygmalionAI/pygmalion-6b,https://huggingface.co/PygmalionAI/pygmalion-6b 🟢,EleutherAI/gpt-neo-1.3B,5.33,20.79,0.21,3.02,0.3,0.68,0.01,0.78,0.26,4.87,0.38,1.82,0.12,🟢 pretrained,GPTNeoForCausalLM,Original,bfloat16,TRUE,mit,1,247,TRUE,dbe59a7f4a88d01d1ba9798d78dbe3fe038792c8,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,EleutherAI/gpt-neo-1.3B,https://huggingface.co/EleutherAI/gpt-neo-1.3B 🟢,facebook/opt-1.3b,5.25,23.83,0.24,3.65,0.31,0.76,0.01,0,0.24,2.08,0.34,1.19,0.11,🟢 pretrained,OPTForCausalLM,Original,float16,TRUE,other,1,142,TRUE,3f5c25d0bc631cb57ac65913f76e22c2dfb61d62,TRUE,TRUE,2024-06-12,2022-05-11,FALSE,TRUE,facebook/opt-1.3b,https://huggingface.co/facebook/opt-1.3b 💬,microsoft/DialoGPT-medium,5.25,14.79,0.15,2.56,0.3,0,0,0.56,0.25,12.28,0.43,1.32,0.11,"💬 chat models (RLHF, DPO, IFT, ...)",GPT2LMHeadModel,Original,bfloat16,TRUE,mit,0,307,TRUE,7b40bb0f92c45fefa957d088000d8648e5c7fa33,TRUE,TRUE,2024-06-13,2022-03-02,TRUE,TRUE,microsoft/DialoGPT-medium,https://huggingface.co/microsoft/DialoGPT-medium 🟢,stabilityai/stablelm-2-1_6b,5.22,11.57,0.12,8.63,0.34,0.15,0,0,0.25,5.79,0.39,5.15,0.15,🟢 pretrained,StableLmForCausalLM,Original,float16,TRUE,other,1,174,TRUE,8879812cccd176fbbe9ceb747b815bcc7d6499f8,TRUE,TRUE,2024-06-12,2024-01-18,FALSE,TRUE,stabilityai/stablelm-2-1_6b,https://huggingface.co/stabilityai/stablelm-2-1_6b -💬,HuggingFaceTB/SmolLM-1.7B-Instruct,5.14,23.48,0.23,2.08,0.29,0,0,1.34,0.26,2.08,0.35,1.85,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,58,TRUE,0ad161e59935a9a691dfde2818df8b98786f30a7,TRUE,TRUE,2024-07-18,2024-07-15,TRUE,FALSE,HuggingFaceTB/SmolLM-1.7B-Instruct,https://huggingface.co/HuggingFaceTB/SmolLM-1.7B-Instruct +💬,HuggingFaceTB/SmolLM-1.7B-Instruct,5.14,23.48,0.23,2.08,0.29,0,0,1.34,0.26,2.08,0.35,1.85,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,59,TRUE,0ad161e59935a9a691dfde2818df8b98786f30a7,TRUE,TRUE,2024-07-18,2024-07-15,TRUE,FALSE,HuggingFaceTB/SmolLM-1.7B-Instruct,https://huggingface.co/HuggingFaceTB/SmolLM-1.7B-Instruct 🟢,Qwen/Qwen1.5-0.5B,5.14,17.06,0.17,5.04,0.32,0.45,0,0.56,0.25,4.3,0.36,3.41,0.13,🟢 pretrained,Qwen2ForCausalLM,Original,bfloat16,TRUE,other,0,136,TRUE,8f445e3628f3500ee69f24e1303c9f10f5342a39,TRUE,TRUE,2024-06-13,2024-01-22,FALSE,TRUE,Qwen/Qwen1.5-0.5B,https://huggingface.co/Qwen/Qwen1.5-0.5B 🟢,EleutherAI/pythia-410m,5.11,21.95,0.22,2.72,0.3,0.3,0,1.23,0.26,3.06,0.36,1.42,0.11,🟢 pretrained,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,0,20,TRUE,9879c9b5f8bea9051dcb0e68dff21493d67e9d4f,TRUE,TRUE,2024-06-09,2023-02-13,FALSE,TRUE,EleutherAI/pythia-410m,https://huggingface.co/EleutherAI/pythia-410m 🟢,tiiuae/falcon-7b,5.1,18.21,0.18,5.96,0.33,0.53,0.01,0,0.24,4.5,0.38,1.39,0.11,🟢 pretrained,FalconForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,1054,TRUE,898df1396f35e447d5fe44e0a3ccaaaa69f30d36,TRUE,TRUE,2024-06-09,2023-04-24,FALSE,TRUE,tiiuae/falcon-7b,https://huggingface.co/tiiuae/falcon-7b @@ -342,7 +347,7 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🟢,openai-community/gpt2-xl,4.98,20.39,0.2,2.58,0.3,0.3,0,1.12,0.26,4.04,0.37,1.46,0.11,🟢 pretrained,GPT2LMHeadModel,Original,bfloat16,TRUE,mit,1,295,TRUE,15ea56dee5df4983c59b2538573817e1667135e2,TRUE,TRUE,2024-06-12,2022-03-02,FALSE,TRUE,openai-community/gpt2-xl,https://huggingface.co/openai-community/gpt2-xl 🔶,togethercomputer/GPT-NeoXT-Chat-Base-20B,4.94,18.3,0.18,6.83,0.33,1.13,0.01,0,0.25,1.76,0.35,1.61,0.11,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,20,693,TRUE,d386708e84d862a65f7d2b4989f64750cb657227,TRUE,TRUE,2024-06-12,2023-03-03,FALSE,TRUE,togethercomputer/GPT-NeoXT-Chat-Base-20B,https://huggingface.co/togethercomputer/GPT-NeoXT-Chat-Base-20B 🔶,togethercomputer/RedPajama-INCITE-Chat-3B-v1,4.75,16.52,0.17,5.16,0.32,0.3,0,0,0.24,5.09,0.37,1.41,0.11,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,apache-2.0,3,147,TRUE,f0e0995eba801096ed04cb87931d96a8316871af,TRUE,TRUE,2024-06-13,2023-05-05,FALSE,TRUE,togethercomputer/RedPajama-INCITE-Chat-3B-v1,https://huggingface.co/togethercomputer/RedPajama-INCITE-Chat-3B-v1 -💬,HuggingFaceTB/SmolLM-360M-Instruct,4.71,19.52,0.2,2.08,0.29,0,0,1.9,0.26,2.9,0.35,1.85,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,18,TRUE,8e951de8c220295ea4f85d078c4e320df7137535,TRUE,TRUE,2024-07-18,2024-07-15,TRUE,FALSE,HuggingFaceTB/SmolLM-360M-Instruct,https://huggingface.co/HuggingFaceTB/SmolLM-360M-Instruct +💬,HuggingFaceTB/SmolLM-360M-Instruct,4.71,19.52,0.2,2.08,0.29,0,0,1.9,0.26,2.9,0.35,1.85,0.12,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,0,20,TRUE,8e951de8c220295ea4f85d078c4e320df7137535,TRUE,TRUE,2024-07-18,2024-07-15,TRUE,FALSE,HuggingFaceTB/SmolLM-360M-Instruct,https://huggingface.co/HuggingFaceTB/SmolLM-360M-Instruct 🟢,TinyLlama/TinyLlama_v1.1,4.7,20.01,0.2,3.21,0.3,0.45,0,0,0.25,3.98,0.37,0.54,0.1,🟢 pretrained,LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,1,31,TRUE,ff3c701f2424c7625fdefb9dd470f45ef18b02d6,TRUE,TRUE,2024-06-12,2024-03-09,FALSE,TRUE,TinyLlama/TinyLlama_v1.1,https://huggingface.co/TinyLlama/TinyLlama_v1.1 🤝,paloalma/TW3-JRGL-v2,4.57,3.1,0.03,4.11,0.31,5.21,0.05,0.78,0.26,12.38,0.43,1.85,0.12,🤝 base merges and moerges,LlamaForCausalLM,Original,bfloat16,FALSE,apache-2.0,72,0,TRUE,aca3f0ba2bfb90038a9e2cd5b486821d4c181b46,TRUE,TRUE,2024-06-26,2024-04-01,TRUE,FALSE,paloalma/TW3-JRGL-v2,https://huggingface.co/paloalma/TW3-JRGL-v2 🔶,WizardLMTeam/WizardLM-13B-V1.0,4.55,18.5,0.19,2.15,0.29,0,0,1.23,0.26,3.55,0.35,1.85,0.12,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,"",13,71,TRUE,964a93aa2e78da377115bb856075a69ebe8aefa4,TRUE,TRUE,2024-06-13,2023-05-13,FALSE,TRUE,WizardLMTeam/WizardLM-13B-V1.0,https://huggingface.co/WizardLMTeam/WizardLM-13B-V1.0 @@ -359,8 +364,8 @@ t,model,average,ifeval,ifeval_raw,bbh,bbh_raw,math_lvl_5,math_lvl_5_raw,gpqa,gpq 🟢,bigscience/bloom-560m,3.46,6.2,0.06,2.89,0.3,0.08,0,1.57,0.26,8.19,0.4,1.83,0.12,🟢 pretrained,BloomForCausalLM,Original,bfloat16,TRUE,bigscience-bloom-rail-1.0,0,329,TRUE,ac2ae5fab2ce3f9f40dc79b5ca9f637430d24971,TRUE,TRUE,2024-06-13,2022-05-19,FALSE,TRUE,bigscience/bloom-560m,https://huggingface.co/bigscience/bloom-560m 🔶,pankajmathur/orca_mini_3b,3.07,7.42,0.07,4.69,0.32,0.53,0.01,0,0.25,4.2,0.33,1.61,0.11,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,cc-by-nc-sa-4.0,3,158,TRUE,31e1a7bc3f7ea2f247b432d60036d975b8d590e9,TRUE,TRUE,2024-06-26,2023-06-22,FALSE,FALSE,pankajmathur/orca_mini_3b,https://huggingface.co/pankajmathur/orca_mini_3b 🟢,LiteAI/Hare-1.1B-base,1.95,0.12,0,1.72,0.29,0,0,1.23,0.26,7.58,0.4,1.04,0.11,🟢 pretrained,MistralForCausalLM,Original,float16,TRUE,apache-2.0,1,7,TRUE,c4faddb2163d8d940b422035e67f4c13cb8c2cb1,TRUE,TRUE,2024-07-19,2024-06-05,FALSE,FALSE,LiteAI/Hare-1.1B-base,https://huggingface.co/LiteAI/Hare-1.1B-base +🟢,awnr/Mistral-7B-v0.1-signtensors-7-over-16,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,0e1f2cb0a81c38fc6c567d9c007883ab62fae266,TRUE,TRUE,2024-06-27,2024-06-26,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-7-over-16,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-7-over-16 +🟢,awnr/Mistral-7B-v0.1-signtensors-1-over-4,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,b288ab9d8adfd2963a44a7935bb47649f55bcbee,TRUE,TRUE,2024-06-28,2024-06-27,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-1-over-4,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-1-over-4 🟢,awnr/Mistral-7B-v0.1-signtensors-3-over-8,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,fa368f705ace05da2fef25c030fe740cf1fef176,TRUE,TRUE,2024-06-27,2024-06-26,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-3-over-8,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-3-over-8 🟢,awnr/Mistral-7B-v0.1-signtensors-1-over-2,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,1,TRUE,9575327242f8539eac59b6d788beccf54a6f9414,TRUE,TRUE,2024-06-28,2024-06-27,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-1-over-2,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-1-over-2 -🟢,awnr/Mistral-7B-v0.1-signtensors-1-over-4,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,b288ab9d8adfd2963a44a7935bb47649f55bcbee,TRUE,TRUE,2024-06-28,2024-06-27,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-1-over-4,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-1-over-4 -🟢,awnr/Mistral-7B-v0.1-signtensors-7-over-16,1.66,0,0,2.35,0.29,0,0,1.23,0.26,4.52,0.36,1.85,0.12,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,0,TRUE,0e1f2cb0a81c38fc6c567d9c007883ab62fae266,TRUE,TRUE,2024-06-27,2024-06-26,FALSE,FALSE,awnr/Mistral-7B-v0.1-signtensors-7-over-16,https://huggingface.co/awnr/Mistral-7B-v0.1-signtensors-7-over-16 🔶,pankajmathur/orca_mini_v6_8b,1.41,1.11,0.01,3.22,0.3,0,0,0,0.24,2.77,0.36,1.38,0.11,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,llama3,8,1,TRUE,e95dc8e4c6b6ca5957b657cc2d905683142eaf3e,TRUE,TRUE,2024-06-26,2024-06-02,TRUE,FALSE,pankajmathur/orca_mini_v6_8b,https://huggingface.co/pankajmathur/orca_mini_v6_8b diff --git a/csv/lmsys.csv b/csv/lmsys.csv index 8cb19c2..c6cec27 100644 --- a/csv/lmsys.csv +++ b/csv/lmsys.csv @@ -1,117 +1,118 @@ rank,model,arena_score,95_pct_ci,votes,organization,license,knowledge_cutoff,url -1,GPT-4o-2024-05-13,1287,+3/-4,62251,OpenAI,Proprietary,2023/10,https://openai.com/index/hello-gpt-4o/ -2,Claude 3.5 Sonnet,1271,+3/-3,31482,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/claude-3-5-sonnet -2,Gemini-Advanced-0514,1267,+4/-4,46549,Google,Proprietary,Online,https://gemini.google.com/advanced -3,Gemini-1.5-Pro-API-0514,1262,+3/-3,55037,Google,Proprietary,2023/11,https://deepmind.google/technologies/gemini/pro -4,Gemini-1.5-Pro-API-0409-Preview,1257,+4/-3,55678,Google,Proprietary,2023/11,https://blog.google/technology/ai/google-gemini-next-generation-model-february-2024/ -4,GPT-4-Turbo-2024-04-09,1257,+3/-3,75215,OpenAI,Proprietary,2023/12,https://platform.openai.com/docs/models/gpt-4-turbo-and-gpt-4 -7,GPT-4-1106-preview,1251,+3/-3,87739,OpenAI,Proprietary,2023/4,https://openai.com/blog/new-models-and-developer-products-announced-at-devday -7,Claude 3 Opus,1248,+2/-2,146594,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -7,GPT-4-0125-preview,1245,+3/-2,81062,OpenAI,Proprietary,2023/12,https://openai.com/blog/new-models-and-developer-products-announced-at-devday -9,Yi-Large-preview,1240,+3/-3,49814,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B -11,Gemini-1.5-Flash-API-0514,1228,+4/-3,46614,Google,Proprietary,2023/11,https://deepmind.google/technologies/gemini/flash/ -11,Deepseek-v2-API-0628,1222,+7/-6,6726,DeepSeek AI,Proprietary,Unknown,https://platform.deepseek.com/api-docs/updates#deepseek-chat -12,Gemma-2-27B-it,1216,+4/-5,18175,Google,Gemma license,2024/6,https://ai.google.dev/gemma -12,Yi-Large,1214,+4/-4,14627,01 AI,Proprietary,Unknown,https://platform.01.ai/docs#models-and-pricing -13,Nemotron-4-340B-Instruct,1209,+4/-4,20683,Nvidia,NVIDIA Open Model,2023/6,https://huggingface.co/nvidia/Nemotron-4-340B-Instruct -13,Bard (Gemini Pro),1208,+5/-4,11831,Google,Proprietary,Online,https://bard.google.com/ -13,GLM-4-0520,1207,+5/-6,10249,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/dev/api#language -15,Llama-3-70b-Instruct,1207,+2/-3,152792,Meta,Llama 3 Community,2023/12,https://llama.meta.com/llama3/ -18,Claude 3 Sonnet,1201,+2/-3,112160,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -18,Reka-Core-20240501,1200,+3/-3,60340,Reka AI,Proprietary,Unknown,https://www.reka.ai/news/reka-core-our-frontier-class-multimodal-language-model -21,Command R+,1190,+3/-3,78846,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r-plus-microsoft-azure/ -21,Gemma-2-9B-it,1187,+4/-5,18294,Google,Gemma license,2024/6,https://ai.google.dev/gemma -21,Qwen2-72B-Instruct,1187,+3/-4,29530,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ -21,GPT-4-0314,1186,+3/-3,55993,OpenAI,Proprietary,2021/9,https://openai.com/research/gpt-4 -21,GLM-4-0116,1183,+8/-7,7591,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/ -21,Qwen-Max-0428,1183,+4/-4,25781,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/api-details -22,DeepSeek-Coder-V2-Instruct,1178,+6/-4,14906,DeepSeek AI,DeepSeek License,2024/6,https://huggingface.co/deepseek-ai/DeepSeek-Coder-V2-Instruct -25,Claude 3 Haiku,1179,+2/-2,102820,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -29,Reka-Flash-Preview-20240611,1165,+4/-4,18039,Reka AI,Proprietary,Unknown,https://docs.reka.ai/http-api.html#generation -29,Qwen1.5-110B-Chat,1162,+3/-4,27511,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ -29,GPT-4-0613,1161,+2/-3,84750,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo -29,Yi-1.5-34B-Chat,1157,+4/-5,25183,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat -29,Reka-Flash-21B-online,1156,+6/-4,16046,Reka AI,Proprietary,Online,https://docs.reka.ai/http-api.html#generation -30,Mistral-Large-2402,1157,+2/-3,63729,Mistral,Proprietary,Unknown,https://mistral.ai/news/mistral-large/ -32,Llama-3-8b-Instruct,1152,+3/-2,100826,Meta,Llama 3 Community,2023/3,https://llama.meta.com/llama3/ -34,Claude-1,1148,+4/-4,21178,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude -35,Command R,1149,+3/-3,54921,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r -35,Mistral Medium,1148,+3/-3,35568,Mistral,Proprietary,Unknown,https://mistral.ai/news/la-plateforme/ -35,Reka-Flash-21B,1147,+4/-4,25803,Reka AI,Proprietary,2023/11,https://www.reka.ai/news/reka-flash-efficient-and-capable-multimodal-language-models -35,Qwen1.5-72B-Chat,1147,+3/-3,40666,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -35,Mixtral-8x22b-Instruct-v0.1,1146,+4/-3,44997,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -42,Claude-2.0,1131,+4/-5,12781,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2 -42,Gemini Pro (Dev API),1131,+5/-4,18793,Google,Proprietary,2023/4,https://ai.google.dev/docs/gemini_api_overview -42,Zephyr-ORPO-141b-A35b-v0.1,1127,+7/-6,4867,HuggingFace,Apache 2.0,2024/4,https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1 -42,Qwen1.5-32B-Chat,1125,+4/-3,22784,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ -42,Mistral-Next,1124,+5/-5,12384,Mistral,Proprietary,Unknown,https://chat.mistral.ai/chat -42,Phi-3-Medium-4k-Instruct,1123,+5/-5,17472,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -44,Starling-LM-7B-beta,1119,+5/-5,16659,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta -45,Claude-2.1,1118,+3/-3,37715,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2-1 -45,GPT-3.5-Turbo-0613,1117,+4/-3,38970,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -47,Gemini Pro,1110,+8/-6,6569,Google,Proprietary,2023/4,https://blog.google/technology/ai/gemini-api-developers-cloud/ -48,Yi-34B-Chat,1111,+5/-5,15946,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -48,Claude-Instant-1,1111,+5/-4,20637,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude -49,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,72489,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -52,Qwen1.5-14B-Chat,1108,+4/-3,18668,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -52,GPT-3.5-Turbo-0314,1106,+7/-8,5663,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -52,WizardLM-70B-v1.0,1106,+5/-6,8393,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 -53,GPT-3.5-Turbo-0125,1105,+2/-3,66678,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5-turbo -53,DBRX-Instruct-Preview,1103,+4/-3,33748,Databricks,DBRX LICENSE,2023/12,https://www.databricks.com/blog/introducing-dbrx-new-state-art-open-llm -53,Phi-3-Small-8k-Instruct,1102,+4/-4,18522,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct -55,Tulu-2-DPO-70B,1099,+5/-6,6666,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b -61,Llama-2-70b-chat,1093,+3/-3,39647,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf -61,OpenChat-3.5-0106,1091,+4/-5,12987,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 -61,Vicuna-33B,1090,+4/-4,22964,LMSYS,Non-commercial,2023/8,https://huggingface.co/lmsys/vicuna-33b-v1.3 -61,Snowflake Arctic Instruct,1090,+4/-4,34221,Snowflake,Apache 2.0,2024/4,https://www.snowflake.com/blog/arctic-open-efficient-foundation-language-models-snowflake/ -61,Starling-LM-7B-alpha,1088,+6/-5,10425,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -61,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+10/-8,3841,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -63,Gemma-1.1-7B-it,1084,+4/-3,25106,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -63,NV-Llama2-70B-SteerLM-Chat,1080,+9/-9,3635,Nvidia,Llama 2 Community,2023/11,https://huggingface.co/nvidia/Llama2-70B-SteerLM-Chat -66,pplx-70b-online,1077,+7/-8,6896,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms -66,DeepSeek-LLM-67B-Chat,1076,+7/-8,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -67,OpenChat-3.5,1076,+6/-6,8120,OpenChat,Apache-2.0,2023/11,https://huggingface.co/openchat/openchat_3.5 -67,OpenHermes-2.5-Mistral-7b,1074,+7/-7,5093,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -68,Mistral-7B-Instruct-v0.2,1072,+4/-4,20074,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -68,Qwen1.5-7B-Chat,1070,+7/-7,4870,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -69,GPT-3.5-Turbo-1106,1068,+5/-5,17027,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -69,Dolphin-2.2.1-Mistral-7B,1062,+11/-15,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -71,Phi-3-Mini-4k-Instruct,1066,+4/-3,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -71,SOLAR-10.7B-Instruct-v1.0,1062,+8/-7,4293,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 -73,Llama-2-13b-chat,1063,+5/-4,19763,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-13b-chat-hf -73,Phi-3-Mini-4k-Instruct-June-24,1062,+7/-8,5456,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -75,WizardLM-13b-v1.2,1058,+6/-7,7194,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 -79,Zephyr-7b-beta,1053,+5/-6,11337,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -79,MPT-30B-chat,1045,+11/-11,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat -79,CodeLlama-70B-instruct,1042,+14/-14,1192,Meta,Llama 2 Community,2024/1,https://huggingface.co/codellama/CodeLlama-70b-hf -81,Zephyr-7b-alpha,1041,+11/-13,1818,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha -82,pplx-7b-online,1044,+7/-7,6340,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms -82,CodeLlama-34B-instruct,1042,+8/-8,7514,Meta,Llama 2 Community,2023/7,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf -82,falcon-180b-chat,1034,+15/-17,1327,TII,Falcon-180B TII License,2023/9,https://huggingface.co/tiiuae/falcon-180B-chat -84,Vicuna-13B,1041,+4/-6,19798,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 -84,Gemma-7B-it,1037,+7/-5,9182,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it -84,Llama-2-7b-chat,1037,+4/-5,14569,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf -84,Phi-3-Mini-128k-Instruct,1037,+4/-5,21617,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -84,Qwen-14B-Chat,1035,+6/-7,5074,Alibaba,Qianwen LICENSE,2023/8,https://huggingface.co/Qwen/Qwen-14B-Chat -84,Guanaco-33B,1032,+11/-11,3002,UW,Non-commercial,2023/5,https://huggingface.co/timdettmers/guanaco-33b-merged -94,Gemma-1.1-2B-it,1021,+6/-6,11385,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it -94,StripedHyena-Nous-7B,1017,+7/-7,5267,Together AI,Apache 2.0,2023/12,https://huggingface.co/togethercomputer/StripedHyena-Nous-7B -94,OLMo-7B-instruct,1015,+7/-8,6502,Allen AI,Apache-2.0,2024/2,https://huggingface.co/allenai/OLMo-7B-Instruct -97,Mistral-7B-Instruct-v0.1,1008,+5/-6,9153,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 -97,Vicuna-7B,1005,+8/-7,7023,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-7b-v1.5 -98,PaLM-Chat-Bison-001,1003,+5/-7,8751,Google,Proprietary,2021/6,https://cloud.google.com/vertex-ai/docs/generative-ai/learn/models#foundation_models -100,Gemma-2B-it,989,+8/-10,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it -102,Qwen1.5-4B-Chat,988,+6/-7,7816,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -104,Koala-13B,964,+9/-7,7042,UC Berkeley,Non-commercial,2023/4,https://bair.berkeley.edu/blog/2023/04/03/koala/ -104,ChatGLM3-6B,955,+10/-9,4764,Tsinghua,Apache-2.0,2023/10,https://huggingface.co/THUDM/chatglm3-6b -106,GPT4All-13B-Snoozy,931,+12/-14,1787,Nomic AI,Non-commercial,2023/3,https://huggingface.co/nomic-ai/gpt4all-13b-snoozy -106,MPT-7B-Chat,927,+10/-10,4020,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat -106,ChatGLM2-6B,924,+11/-14,2709,Tsinghua,Apache-2.0,2023/6,https://huggingface.co/THUDM/chatglm2-6b -106,RWKV-4-Raven-14B,921,+7/-9,4940,RWKV,Apache 2.0,2023/4,https://huggingface.co/BlinkDL/rwkv-4-raven -109,Alpaca-13B,901,+10/-9,5874,Stanford,Non-commercial,2023/3,https://crfm.stanford.edu/2023/03/13/alpaca.html -110,OpenAssistant-Pythia-12B,893,+8/-8,6385,OpenAssistant,Apache 2.0,2023/4,https://huggingface.co/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5 -111,ChatGLM-6B,879,+10/-11,4999,Tsinghua,Non-commercial,2023/3,https://huggingface.co/THUDM/chatglm-6b -112,FastChat-T5-3B,868,+9/-10,4313,LMSYS,Apache 2.0,2023/4,https://huggingface.co/lmsys/fastchat-t5-3b-v1.0 -114,StableLM-Tuned-Alpha-7B,839,+11/-10,3339,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b -114,Dolly-V2-12B,822,+11/-11,3487,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b -115,LLaMA-13B,799,+13/-12,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +1,GPT-4o-2024-05-13,1287,+3/-3,64700,OpenAI,Proprietary,2023/10,https://openai.com/index/hello-gpt-4o/ +1,GPT-4o-mini-2024-07-18,1280,+8/-9,4449,OpenAI,Proprietary,2023/10,https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/ +2,Claude 3.5 Sonnet,1272,+4/-3,34591,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/claude-3-5-sonnet +3,Gemini-Advanced-0514,1267,+3/-3,48001,Google,Proprietary,Online,https://gemini.google.com/advanced +4,Gemini-1.5-Pro-API-0514,1261,+4/-2,57448,Google,Proprietary,2023/11,https://deepmind.google/technologies/gemini/pro +5,Gemini-1.5-Pro-API-0409-Preview,1257,+3/-3,55681,Google,Proprietary,2023/11,https://blog.google/technology/ai/google-gemini-next-generation-model-february-2024/ +5,GPT-4-Turbo-2024-04-09,1257,+2/-3,76597,OpenAI,Proprietary,2023/12,https://platform.openai.com/docs/models/gpt-4-turbo-and-gpt-4 +8,GPT-4-1106-preview,1251,+2/-2,88475,OpenAI,Proprietary,2023/4,https://openai.com/blog/new-models-and-developer-products-announced-at-devday +8,Claude 3 Opus,1248,+2/-2,147947,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +9,GPT-4-0125-preview,1245,+3/-3,81807,OpenAI,Proprietary,2023/12,https://openai.com/blog/new-models-and-developer-products-announced-at-devday +10,Yi-Large-preview,1240,+3/-3,50499,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B +12,Gemini-1.5-Flash-API-0514,1228,+3/-3,48048,Google,Proprietary,2023/11,https://deepmind.google/technologies/gemini/flash/ +12,Deepseek-v2-API-0628,1222,+6/-6,8089,DeepSeek AI,Proprietary,Unknown,https://platform.deepseek.com/api-docs/updates#deepseek-chat +13,Gemma-2-27B-it,1217,+4/-3,19624,Google,Gemma license,2024/6,https://ai.google.dev/gemma +13,Yi-Large,1214,+5/-5,15276,01 AI,Proprietary,Unknown,https://platform.01.ai/docs#models-and-pricing +14,Bard (Gemini Pro),1209,+7/-6,11830,Google,Proprietary,Online,https://bard.google.com/ +14,GLM-4-0520,1207,+7/-5,10253,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/dev/api#language +15,Nemotron-4-340B-Instruct,1209,+4/-4,20685,Nvidia,NVIDIA Open Model,2023/6,https://huggingface.co/nvidia/Nemotron-4-340B-Instruct +15,Llama-3-70b-Instruct,1207,+2/-3,154914,Meta,Llama 3 Community,2023/12,https://llama.meta.com/llama3/ +18,Claude 3 Sonnet,1201,+2/-3,112955,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +18,Reka-Core-20240501,1200,+3/-3,61757,Reka AI,Proprietary,Unknown,https://www.reka.ai/news/reka-core-our-frontier-class-multimodal-language-model +22,Command R+,1190,+3/-3,79583,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r-plus-microsoft-azure/ +22,Gemma-2-9B-it,1188,+3/-4,19774,Google,Gemma license,2024/6,https://ai.google.dev/gemma +22,Qwen2-72B-Instruct,1187,+3/-4,30310,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ +22,GPT-4-0314,1186,+3/-3,55984,OpenAI,Proprietary,2021/9,https://openai.com/research/gpt-4 +22,GLM-4-0116,1183,+6/-6,7589,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/ +23,Qwen-Max-0428,1183,+4/-4,25775,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/api-details +24,DeepSeek-Coder-V2-Instruct,1179,+5/-5,15644,DeepSeek AI,DeepSeek License,2024/6,https://huggingface.co/deepseek-ai/DeepSeek-Coder-V2-Instruct +26,Claude 3 Haiku,1179,+3/-2,104266,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +30,Reka-Flash-Preview-20240611,1165,+4/-3,19489,Reka AI,Proprietary,Unknown,https://docs.reka.ai/http-api.html#generation +30,Qwen1.5-110B-Chat,1162,+3/-3,27497,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ +30,GPT-4-0613,1161,+2/-3,85431,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo +31,Yi-1.5-34B-Chat,1157,+4/-4,25171,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat +31,Mistral-Large-2402,1157,+2/-3,64444,Mistral,Proprietary,Unknown,https://mistral.ai/news/mistral-large/ +31,Reka-Flash-21B-online,1156,+4/-6,16041,Reka AI,Proprietary,Online,https://docs.reka.ai/http-api.html#generation +33,Llama-3-8b-Instruct,1152,+3/-3,102317,Meta,Llama 3 Community,2023/3,https://llama.meta.com/llama3/ +35,Command R,1149,+3/-2,55724,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r +35,Claude-1,1149,+4/-5,21179,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude +35,Mistral Medium,1148,+3/-4,35568,Mistral,Proprietary,Unknown,https://mistral.ai/news/la-plateforme/ +35,Reka-Flash-21B,1147,+3/-5,25801,Reka AI,Proprietary,2023/11,https://www.reka.ai/news/reka-flash-efficient-and-capable-multimodal-language-models +35,Qwen1.5-72B-Chat,1147,+3/-3,40662,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +37,Mixtral-8x22b-Instruct-v0.1,1146,+2/-4,45772,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ +43,Claude-2.0,1131,+6/-5,12783,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2 +43,Gemini Pro (Dev API),1131,+4/-5,18794,Google,Proprietary,2023/4,https://ai.google.dev/docs/gemini_api_overview +43,Zephyr-ORPO-141b-A35b-v0.1,1127,+8/-7,4865,HuggingFace,Apache 2.0,2024/4,https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1 +43,Qwen1.5-32B-Chat,1125,+5/-5,22770,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ +43,Mistral-Next,1124,+6/-5,12383,Mistral,Proprietary,Unknown,https://chat.mistral.ai/chat +43,Phi-3-Medium-4k-Instruct,1122,+4/-4,18222,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +45,Starling-LM-7B-beta,1119,+5/-4,16663,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta +45,Claude-2.1,1118,+4/-3,37713,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2-1 +45,GPT-3.5-Turbo-0613,1117,+4/-3,38965,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +49,Claude-Instant-1,1111,+5/-5,20631,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude +49,Yi-34B-Chat,1111,+5/-5,15947,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +49,Gemini Pro,1111,+8/-7,6568,Google,Proprietary,2023/4,https://blog.google/technology/ai/gemini-api-developers-cloud/ +50,GPT-3.5-Turbo-0314,1106,+8/-9,5663,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +51,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,73266,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +53,Qwen1.5-14B-Chat,1109,+4/-4,18673,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +53,WizardLM-70B-v1.0,1106,+6/-7,8392,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 +53,GPT-3.5-Turbo-0125,1105,+4/-3,67470,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5-turbo +53,DBRX-Instruct-Preview,1103,+4/-3,33738,Databricks,DBRX LICENSE,2023/12,https://www.databricks.com/blog/introducing-dbrx-new-state-art-open-llm +53,Tulu-2-DPO-70B,1099,+8/-8,6669,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b +55,Phi-3-Small-8k-Instruct,1102,+4/-6,18517,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct +61,Llama-2-70b-chat,1093,+3/-4,39635,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf +61,OpenChat-3.5-0106,1091,+5/-5,12985,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 +62,Vicuna-33B,1091,+4/-4,22954,LMSYS,Non-commercial,2023/8,https://huggingface.co/lmsys/vicuna-33b-v1.3 +62,Snowflake Arctic Instruct,1090,+3/-4,34214,Snowflake,Apache 2.0,2024/4,https://www.snowflake.com/blog/arctic-open-efficient-foundation-language-models-snowflake/ +62,Starling-LM-7B-alpha,1088,+7/-5,10424,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +62,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3843,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +63,NV-Llama2-70B-SteerLM-Chat,1080,+9/-12,3636,Nvidia,Llama 2 Community,2023/11,https://huggingface.co/nvidia/Llama2-70B-SteerLM-Chat +64,Gemma-1.1-7B-it,1084,+4/-4,25112,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +67,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +68,pplx-70b-online,1078,+6/-7,6893,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms +68,OpenChat-3.5,1076,+5/-6,8121,OpenChat,Apache-2.0,2023/11,https://huggingface.co/openchat/openchat_3.5 +68,OpenHermes-2.5-Mistral-7b,1074,+6/-9,5090,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +69,Mistral-7B-Instruct-v0.2,1072,+4/-4,20068,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +69,Qwen1.5-7B-Chat,1070,+7/-7,4869,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +70,GPT-3.5-Turbo-1106,1068,+4/-4,17028,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +70,Phi-3-Mini-4k-Instruct,1066,+5/-4,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +70,Dolphin-2.2.1-Mistral-7B,1062,+11/-12,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +70,Phi-3-Mini-4k-Instruct-June-24,1062,+9/-6,6268,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +72,SOLAR-10.7B-Instruct-v1.0,1062,+8/-8,4293,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 +75,Llama-2-13b-chat,1063,+4/-4,19757,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-13b-chat-hf +76,WizardLM-13b-v1.2,1058,+6/-7,7195,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 +80,Zephyr-7b-beta,1053,+5/-6,11334,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +80,CodeLlama-70B-instruct,1042,+16/-20,1191,Meta,Llama 2 Community,2024/1,https://huggingface.co/codellama/CodeLlama-70b-hf +81,MPT-30B-chat,1045,+9/-12,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat +82,pplx-7b-online,1045,+7/-7,6338,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms +83,Zephyr-7b-alpha,1041,+10/-12,1817,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha +84,CodeLlama-34B-instruct,1042,+7/-6,7514,Meta,Llama 2 Community,2023/7,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf +84,falcon-180b-chat,1034,+15/-17,1326,TII,Falcon-180B TII License,2023/9,https://huggingface.co/tiiuae/falcon-180B-chat +85,Vicuna-13B,1042,+4/-5,19798,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 +85,Gemma-7B-it,1037,+6/-7,9177,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it +85,Llama-2-7b-chat,1037,+5/-4,14568,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf +85,Phi-3-Mini-128k-Instruct,1037,+4/-4,21620,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ +85,Qwen-14B-Chat,1035,+8/-10,5071,Alibaba,Qianwen LICENSE,2023/8,https://huggingface.co/Qwen/Qwen-14B-Chat +85,Guanaco-33B,1032,+11/-12,3003,UW,Non-commercial,2023/5,https://huggingface.co/timdettmers/guanaco-33b-merged +93,Gemma-1.1-2B-it,1021,+7/-6,11375,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it +93,StripedHyena-Nous-7B,1017,+9/-9,5266,Together AI,Apache 2.0,2023/12,https://huggingface.co/togethercomputer/StripedHyena-Nous-7B +94,OLMo-7B-instruct,1015,+8/-9,6500,Allen AI,Apache-2.0,2024/2,https://huggingface.co/allenai/OLMo-7B-Instruct +98,Mistral-7B-Instruct-v0.1,1008,+6/-6,9151,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 +98,Vicuna-7B,1005,+6/-8,7023,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-7b-v1.5 +98,PaLM-Chat-Bison-001,1003,+7/-7,8747,Google,Proprietary,2021/6,https://cloud.google.com/vertex-ai/docs/generative-ai/learn/models#foundation_models +101,Gemma-2B-it,989,+8/-8,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +103,Qwen1.5-4B-Chat,988,+6/-8,7811,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +105,Koala-13B,964,+7/-8,7040,UC Berkeley,Non-commercial,2023/4,https://bair.berkeley.edu/blog/2023/04/03/koala/ +105,ChatGLM3-6B,955,+10/-11,4763,Tsinghua,Apache-2.0,2023/10,https://huggingface.co/THUDM/chatglm3-6b +106,GPT4All-13B-Snoozy,931,+15/-15,1787,Nomic AI,Non-commercial,2023/3,https://huggingface.co/nomic-ai/gpt4all-13b-snoozy +107,MPT-7B-Chat,927,+12/-8,4019,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat +107,ChatGLM2-6B,924,+10/-12,2708,Tsinghua,Apache-2.0,2023/6,https://huggingface.co/THUDM/chatglm2-6b +107,RWKV-4-Raven-14B,921,+7/-8,4942,RWKV,Apache 2.0,2023/4,https://huggingface.co/BlinkDL/rwkv-4-raven +111,Alpaca-13B,901,+9/-7,5874,Stanford,Non-commercial,2023/3,https://crfm.stanford.edu/2023/03/13/alpaca.html +111,OpenAssistant-Pythia-12B,893,+8/-8,6385,OpenAssistant,Apache 2.0,2023/4,https://huggingface.co/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5 +112,ChatGLM-6B,879,+10/-9,4999,Tsinghua,Non-commercial,2023/3,https://huggingface.co/THUDM/chatglm-6b +113,FastChat-T5-3B,869,+10/-10,4309,LMSYS,Apache 2.0,2023/4,https://huggingface.co/lmsys/fastchat-t5-3b-v1.0 +115,StableLM-Tuned-Alpha-7B,840,+12/-12,3337,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b +115,Dolly-V2-12B,822,+11/-11,3488,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b +117,LLaMA-13B,799,+11/-14,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 diff --git a/csv/merged.csv b/csv/merged.csv index 53a559a..9cc8fb5 100644 --- a/csv/merged.csv +++ b/csv/merged.csv @@ -1,56 +1,56 @@ key,t,model.x,average,arc,hellaswag,mmlu,truthfulqa,winogrande,gsm8k,type,architecture,weight_type,precision,merged,hub_license,params_b,hub_hearts,available_on_the_hub,model_sha,flagged,moe,date,fullname,url.x,rank,model.y,arena_score,95_pct_ci,votes,organization,license,knowledge_cutoff,url.y -deepseek-llm-67b-chat,💬,deepseek-ai/deepseek-llm-67b-chat,71.79,67.75,86.82,72.42,55.85,84.21,63.68,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2023-12-01T07:45:30Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,66,DeepSeek-LLM-67B-Chat,1076,+7/-8,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -deepseek-llm-67b-chat,🔶,deepseek-ai/deepseek-llm-67b-chat,71.52,67.75,86.8,72.19,55.83,84.21,62.32,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2024-01-19T19:12:01Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,66,DeepSeek-LLM-67B-Chat,1076,+7/-8,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -dolly-v2-12b,🔶,databricks/dolly-v2-12b,39.46,42.41,72.53,25.92,33.83,60.85,1.21,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,mit,12,1943,TRUE,19308160448536e378e3db21a73a751579ee7fdd,TRUE,TRUE,2023-09-09T10:52:17Z,databricks/dolly-v2-12b,https://huggingface.co/databricks/dolly-v2-12b,114,Dolly-V2-12B,822,+11/-11,3487,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b -dolphin-2.2.1-mistral-7b,🔶,cognitivecomputations/dolphin-2.2.1-mistral-7b,65.01,63.23,83.8,63.16,53.14,78.61,48.14,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,187,TRUE,2022924c0bb13588308d429e0b7f51568c07629c,TRUE,TRUE,2023-12-30T19:55:50Z,cognitivecomputations/dolphin-2.2.1-mistral-7b,https://huggingface.co/cognitivecomputations/dolphin-2.2.1-mistral-7b,69,Dolphin-2.2.1-Mistral-7B,1062,+11/-15,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,64.93,63.31,83.76,63.17,53.11,78.14,48.07,🔶 fine-tuned on domain-specific datasets,Unknown,Original,bfloat16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-12-02T05:25:26Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,69,Dolphin-2.2.1-Mistral-7B,1062,+11/-15,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,60.54,63.48,83.86,63.28,53.17,78.37,21.08,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-11-15T20:44:49Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,69,Dolphin-2.2.1-Mistral-7B,1062,+11/-15,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -gemma-1.1-7b-it,💬,google/gemma-1.1-7b-it,60.09,60.07,76.14,60.92,50.74,69.69,42.99,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,float16,TRUE,gemma,8,251,TRUE,689f62a7dfc06893ea915ca75f1cd26825c76146,TRUE,TRUE,2024-04-11T19:11:38Z,google/gemma-1.1-7b-it,https://huggingface.co/google/gemma-1.1-7b-it,63,Gemma-1.1-7B-it,1084,+4/-3,25106,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -gemma-1.1-7b-it,💬,OpenModels4all/gemma-1.1-7b-it,59.78,59.98,76.21,60.39,50.4,69.93,41.77,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,8,3,TRUE,484670e31c44eededf8c64064eb0207e7af4a2b3,TRUE,TRUE,2024-04-09T09:05:33Z,OpenModels4all/gemma-1.1-7b-it,https://huggingface.co/OpenModels4all/gemma-1.1-7b-it,63,Gemma-1.1-7B-it,1084,+4/-3,25106,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -gemma-2b-it,🔶,google/gemma-2b-it,42.75,43.94,62.7,37.65,45.82,60.93,5.46,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,2,566,TRUE,9642e777f24fde593d204a9b2471dce33334e64a,TRUE,TRUE,2024-02-22T13:13:54Z,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it,100,Gemma-2B-it,989,+8/-10,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it -gemma-7b-it,🔶,google/gemma-7b-it,53.56,51.45,71.96,53.52,47.29,67.96,29.19,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,8,1099,TRUE,dec4b13d574762bd36f0a1b75541439bd852b2e8,TRUE,TRUE,2024-02-22T13:13:37Z,google/gemma-7b-it,https://huggingface.co/google/gemma-7b-it,84,Gemma-7B-it,1037,+7/-5,9182,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it -llama-13b,🟢,huggingface/llama-13b,51.36,56.23,80.93,47.67,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,0,FALSE,4022c52fcc7473ce7364bb5ac166195903ea1efb,TRUE,TRUE,2023-10-16T12:48:18Z,huggingface/llama-13b,https://huggingface.co/huggingface/llama-13b,115,LLaMA-13B,799,+13/-12,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 -llama-13b,🟢,huggyllama/llama-13b,51.33,56.14,80.92,47.61,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,137,TRUE,bf57045473f207bb1de1ed035ace226f4d9f9bba,TRUE,TRUE,2023-09-09T10:52:17Z,huggyllama/llama-13b,https://huggingface.co/huggyllama/llama-13b,115,LLaMA-13B,799,+13/-12,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 -mistral-7b-instruct-v0.1,💬,mistralai/Mistral-7B-Instruct-v0.1,54.96,54.52,75.63,55.38,56.28,73.72,14.25,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,1456,TRUE,7961f5aa9b736bf8e364b2e6f201190f97a27931,TRUE,TRUE,2023-10-16T12:48:18Z,mistralai/Mistral-7B-Instruct-v0.1,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1,97,Mistral-7B-Instruct-v0.1,1008,+5/-6,9153,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 -mistral-7b-instruct-v0.2,💬,mistralai/Mistral-7B-Instruct-v0.2,65.71,63.14,84.88,60.78,68.26,77.19,40.03,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2382,TRUE,c72e5d1908b1e2929ec8fc4c8820e9706af1f80f,TRUE,TRUE,2023-12-11T20:10:06Z,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2,68,Mistral-7B-Instruct-v0.2,1072,+4/-4,20074,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -mistral-7b-instruct-v0.2,💬,dfurman/Mistral-7B-Instruct-v0.2,61.79,60.15,82.79,60.07,56.06,76.87,34.8,"💬 chat models (RLHF, DPO, IFT, ...)",?,Adapter,float16,TRUE,apache-2.0,7,5,TRUE,322faff8bb0c72b772762de7635f5aea9864a24a,TRUE,TRUE,2024-01-02T17:44:20Z,dfurman/Mistral-7B-Instruct-v0.2,https://huggingface.co/dfurman/Mistral-7B-Instruct-v0.2,68,Mistral-7B-Instruct-v0.2,1072,+4/-4,20074,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -mixtral-8x22b-instruct-v0.1,💬,mistralai/Mixtral-8x22B-Instruct-v0.1,79.15,72.7,89.08,77.77,68.14,85.16,82.03,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,613,TRUE,eb69dca9c68bbdcffd5f522f632d5c04ab6c65b3,TRUE,FALSE,2024-04-17T15:30:22Z,mistralai/Mixtral-8x22B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1,35,Mixtral-8x22b-Instruct-v0.1,1146,+4/-3,44997,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -mixtral-8x7b-instruct-v0.1,🔶,mistralai/Mixtral-8x7B-Instruct-v0.1,72.7,70.14,87.55,71.4,64.98,81.06,61.11,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,3920,TRUE,125c431e2ff41a156b9f9076f744d2f35dd6e67a,TRUE,FALSE,2024-01-01T02:10:03Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,49,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,72489,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -mixtral-8x7b-instruct-v0.1,💬,mistralai/Mixtral-8x7B-Instruct-v0.1,72.62,70.22,87.63,71.16,64.58,81.37,60.73,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,3920,TRUE,3de0408ae8b591d9ac516a2384925dd98ebc66f4,TRUE,FALSE,2023-12-11T12:54:17Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,49,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,72489,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -mpt-30b-chat,🔶,mosaicml/mpt-30b-chat,55.38,58.7,82.54,51.16,52.42,75.3,12.13,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,30,199,TRUE,54f33278a04aa4e612bca482b82f801ab658e890,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-30b-chat,https://huggingface.co/mosaicml/mpt-30b-chat,79,MPT-30B-chat,1045,+11/-11,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat -mpt-7b-chat,🔶,mosaicml/mpt-7b-chat,45.39,46.5,75.51,37.62,40.16,68.43,4.09,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,513,TRUE,64e5c9c9fb53a8e89690c2dee75a5add37f7113e,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-7b-chat,https://huggingface.co/mosaicml/mpt-7b-chat,106,MPT-7B-Chat,927,+10/-10,4020,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat -nous-hermes-2-mixtral-8x7b-dpo,🔶,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.35,71.08,87.29,72.17,54.83,83.11,71.65,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,383,TRUE,566cdea53950f86eb51dae62812c29e79405cffe,TRUE,FALSE,2024-01-22T08:41:28Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,61,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+10/-8,3841,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -nous-hermes-2-mixtral-8x7b-dpo,?,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.12,71.42,87.21,72.28,54.53,82.64,70.66,"",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,383,TRUE,6ba531f1aec62375bf94ad9c7bb064953c4e9868,TRUE,FALSE,2024-06-09T15:01:07Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,61,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+10/-8,3841,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -openchat-3.5-0106,💬,openchat/openchat-3.5-0106,69.3,66.04,82.93,65.04,51.9,81.77,68.16,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,341,TRUE,9619fb7d2a8e25fa6b0633c0f57f7f4aa79b45c4,TRUE,TRUE,2024-01-10T09:45:30Z,openchat/openchat-3.5-0106,https://huggingface.co/openchat/openchat-3.5-0106,61,OpenChat-3.5-0106,1091,+4/-5,12987,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 -openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.52,64.93,84.18,63.64,52.24,78.06,26.08,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-17T19:50:31Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,67,OpenHermes-2.5-Mistral-7b,1074,+7/-7,5093,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.45,64.93,84.3,63.82,52.31,77.9,25.47,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-14T15:14:43Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,67,OpenHermes-2.5-Mistral-7b,1074,+7/-7,5093,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -phi-3-medium-4k-instruct,🟢,unsloth/Phi-3-medium-4k-instruct,73.57,67.06,85.69,77.85,57.75,72.85,80.21,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,13,23,TRUE,1099cff4ded0cc74fb38a90951c4e21865cddd73,TRUE,TRUE,2024-05-28T06:35:31Z,unsloth/Phi-3-medium-4k-instruct,https://huggingface.co/unsloth/Phi-3-medium-4k-instruct,42,Phi-3-Medium-4k-Instruct,1123,+5/-5,17472,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -phi-3-medium-4k-instruct,🔶,microsoft/Phi-3-medium-4k-instruct,73.45,67.32,85.76,77.83,57.71,72.69,79.38,🔶 fine-tuned on domain-specific datasets,Phi3ForCausalLM,Original,bfloat16,TRUE,mit,13,136,TRUE,d27c49ed6abea9167240288dceb4ab6bca855293,TRUE,FALSE,2024-05-27T15:40:50Z,microsoft/Phi-3-medium-4k-instruct,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct,42,Phi-3-Medium-4k-Instruct,1123,+5/-5,17472,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -phi-3-mini-128k-instruct,💬,microsoft/Phi-3-mini-128k-instruct,68.07,63.14,80.09,68.7,54.12,72.85,69.52,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,1355,TRUE,ebee18c488086b396dde649f2aa6548b9b8d2404,TRUE,FALSE,2024-04-25T13:14:03Z,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct,84,Phi-3-Mini-128k-Instruct,1037,+4/-5,21617,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -phi-3-mini-4k-instruct,💬,microsoft/Phi-3-mini-4k-instruct,69.91,62.97,80.6,69.08,59.88,72.38,74.53,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,724,TRUE,b86bcaf57ea4dfdec5dbe12a377028b2fab0d480,TRUE,FALSE,2024-04-26T08:51:19Z,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct,71,Phi-3-Mini-4k-Instruct,1066,+4/-3,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -phi-3-mini-4k-instruct,🟢,unsloth/Phi-3-mini-4k-instruct,69.86,62.97,80.61,69.08,59.88,72.69,73.92,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,3,27,TRUE,4caf5ac193b82d28dea55dcbb22aa51d2a3be453,TRUE,TRUE,2024-05-11T07:51:45Z,unsloth/Phi-3-mini-4k-instruct,https://huggingface.co/unsloth/Phi-3-mini-4k-instruct,71,Phi-3-Mini-4k-Instruct,1066,+4/-3,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -qwen1.5-110b-chat,💬,Qwen/Qwen1.5-110B-Chat,68.01,72.01,84.67,78.04,65.86,77.35,30.1,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,110,117,TRUE,5e04700b8091f10a98f1fe0b20c48c10d195ef5f,TRUE,FALSE,2024-04-29T12:55:18Z,Qwen/Qwen1.5-110B-Chat,https://huggingface.co/Qwen/Qwen1.5-110B-Chat,29,Qwen1.5-110B-Chat,1162,+3/-4,27511,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ -qwen1.5-14b-chat,🔶,Qwen/Qwen1.5-14B-Chat,62.37,58.79,82.33,68.52,60.38,73.32,30.86,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,float16,TRUE,other,14,99,TRUE,17e11c306ed235e970c9bb8e5f7233527140cdcf,TRUE,FALSE,2024-03-01T12:30:06Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,52,Qwen1.5-14B-Chat,1108,+4/-3,18668,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-14b-chat,💬,Qwen/Qwen1.5-14B-Chat,62.27,58.7,82.27,68.57,60.36,73.09,30.63,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,14,99,TRUE,9492b22871f43e975435455f5c616c77fe7a50ec,TRUE,FALSE,2024-05-16T07:47:25Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,52,Qwen1.5-14B-Chat,1108,+4/-3,18668,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-32b-chat,💬,Qwen/Qwen1.5-32B-Chat,62.95,66.04,85.49,74.99,66.95,77.19,7.05,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,102,TRUE,0b1785d88bbe93aa90a8a19da8af78eccbf010a6,TRUE,TRUE,2024-04-05T21:01:12Z,Qwen/Qwen1.5-32B-Chat,https://huggingface.co/Qwen/Qwen1.5-32B-Chat,42,Qwen1.5-32B-Chat,1125,+4/-3,22784,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ -qwen1.5-4b-chat,💬,Qwen/Qwen1.5-4B-Chat,46.79,43.26,69.73,55.55,44.79,64.96,2.43,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,3,34,TRUE,15bf46b13b1e6b6dd18ff7fa3242af406cc7e791,TRUE,FALSE,2024-02-12T17:13:33Z,Qwen/Qwen1.5-4B-Chat,https://huggingface.co/Qwen/Qwen1.5-4B-Chat,102,Qwen1.5-4B-Chat,988,+6/-7,7816,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.98,68.26,86.47,77.46,63.84,78.93,20.92,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,214,TRUE,bc11a298a0c6a5cd737064db62c6ad20ec6331be,TRUE,FALSE,2024-02-17T04:34:39Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,35,Qwen1.5-72B-Chat,1147,+3/-3,40666,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.96,68.52,86.42,77.44,63.9,79.08,20.39,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,72,214,TRUE,1a6ccc1215278f962c794b1848c710c29ef4053d,TRUE,FALSE,2024-03-07T14:52:34Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,35,Qwen1.5-72B-Chat,1147,+3/-3,40666,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.15,55.89,78.56,61.65,53.54,67.72,13.57,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-12T17:13:18Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,68,Qwen1.5-7B-Chat,1070,+7/-7,4870,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.13,55.89,78.56,61.7,53.65,67.8,13.19,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-18T04:43:41Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,68,Qwen1.5-7B-Chat,1070,+7/-7,4870,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -solar-10.7b-instruct-v1.0,?,upstage/SOLAR-10.7B-Instruct-v1.0,74.2,71.08,88.16,66.21,71.43,83.58,64.75,"",LlamaForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,10,591,TRUE,d3167df97a44b8632538b32ee8cd887893ea1435,TRUE,FALSE,2024-06-09T15:01:03Z,upstage/SOLAR-10.7B-Instruct-v1.0,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0,71,SOLAR-10.7B-Instruct-v1.0,1062,+8/-7,4293,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 -stablelm-tuned-alpha-7b,🔶,stabilityai/stablelm-tuned-alpha-7b,34.04,31.91,53.59,24.41,40.37,53.12,0.83,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,359,TRUE,25071b093c15c0d1cb2b2876c6deb621b764fcf5,TRUE,TRUE,2023-09-09T10:52:17Z,stabilityai/stablelm-tuned-alpha-7b,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b,114,StableLM-Tuned-Alpha-7B,839,+11/-10,3339,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b -starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.13,63.82,84.9,64.67,46.39,80.58,62.4,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,551,TRUE,f721e85293598f2ef774e483ae95343e39811577,FALSE,TRUE,2023-11-30T20:12:15Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,61,Starling-LM-7B-alpha,1088,+6/-5,10425,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.05,63.65,84.87,64.7,46.32,80.43,62.32,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,551,TRUE,76e60ca9807f55acd8eff3ec7ae022c5fbdf1e0e,FALSE,TRUE,2023-11-28T06:48:55Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,61,Starling-LM-7B-alpha,1088,+6/-5,10425,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -starling-lm-7b-beta,💬,Nexusflow/Starling-LM-7B-beta,69.88,67.24,83.47,65.14,55.47,81.29,66.64,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,326,TRUE,ee26b7c2cf9db00e1d9a92c9989d5b2a0b891dbd,TRUE,TRUE,2024-03-23T21:12:48Z,Nexusflow/Starling-LM-7B-beta,https://huggingface.co/Nexusflow/Starling-LM-7B-beta,44,Starling-LM-7B-beta,1119,+5/-5,16659,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta -tulu-2-dpo-70b,💬,allenai/tulu-2-dpo-70b,73.77,72.1,88.99,69.84,65.78,83.27,62.62,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,68,146,TRUE,0ab5c875f0070d5aee8d36bc55f41de440a13f02,TRUE,TRUE,2024-02-01T13:38:05Z,allenai/tulu-2-dpo-70b,https://huggingface.co/allenai/tulu-2-dpo-70b,55,Tulu-2-DPO-70B,1099,+5/-6,6666,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b -vicuna-13b,🔶,eachadea/vicuna-13b,52.3,51.71,79.94,50.84,52.68,71.03,7.58,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",12,0,FALSE,ac4218770a58baaaaf25201076fe082abb6ffd13,TRUE,TRUE,2023-10-16T12:46:18Z,eachadea/vicuna-13b,https://huggingface.co/eachadea/vicuna-13b,84,Vicuna-13B,1041,+4/-6,19798,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 -wizardlm-13b-v1.2,🔶,WizardLM/WizardLM-13B-V1.2,54.76,59.04,82.21,54.64,47.27,71.9,13.5,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,"",13,0,FALSE,6760d0c07ffdc2405295ed7a29437cf4dc414bac,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-13B-V1.2,https://huggingface.co/WizardLM/WizardLM-13B-V1.2,75,WizardLM-13b-v1.2,1058,+6/-7,7194,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 -wizardlm-70b-v1.0,💬,WizardLM/WizardLM-70B-V1.0,61.25,65.44,84.41,64.05,54.81,80.82,17.97,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,4bit,TRUE,"",70,0,FALSE,6dae38060d70b82dcfe787a612d04aaf0adf0738,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-70B-V1.0,https://huggingface.co/WizardLM/WizardLM-70B-V1.0,52,WizardLM-70B-v1.0,1106,+5/-6,8393,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 -yi-1.5-34b-chat,?,01-ai/Yi-1.5-34B-Chat,74.82,70.48,85.97,77.08,62.16,81.61,71.65,"",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,180,TRUE,fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e,TRUE,TRUE,2024-06-09T15:02:51Z,01-ai/Yi-1.5-34B-Chat,https://huggingface.co/01-ai/Yi-1.5-34B-Chat,29,Yi-1.5-34B-Chat,1157,+4/-5,25183,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat -yi-34b-chat,💬,01-ai/Yi-34B-Chat,65.32,65.44,84.16,74.9,55.37,80.11,31.92,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-12-04T08:52:11Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,48,Yi-34B-Chat,1111,+5/-5,15946,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -yi-34b-chat,💬,01-ai/Yi-34B-Chat,63.17,65.1,84.08,74.87,55.41,79.79,19.79,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-11-23T10:23:14Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,48,Yi-34B-Chat,1111,+5/-5,15946,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -zephyr-7b-alpha,🔶,HuggingFaceH4/zephyr-7b-alpha,59.5,61.01,84.04,61.39,57.9,78.61,14.03,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1085,TRUE,2cd2cd16a6ab22585d643cf264fac73b18e7852a,TRUE,TRUE,2023-10-16T12:48:18Z,HuggingFaceH4/zephyr-7b-alpha,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha,81,Zephyr-7b-alpha,1041,+11/-13,1818,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.95,62.03,84.36,61.07,57.45,77.74,29.04,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:49Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,79,Zephyr-7b-beta,1053,+5/-6,11337,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.59,62.46,84.35,60.7,57.83,77.11,27.07,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,8bit,TRUE,mit,7,1493,TRUE,0f17b36adfbe7d86ea1c591a9efeeae17b313f48,TRUE,TRUE,2023-12-04T06:04:15Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,79,Zephyr-7b-beta,1053,+5/-6,11337,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,59.08,62.03,84.53,61.06,57.44,78.06,11.37,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:38Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,79,Zephyr-7b-beta,1053,+5/-6,11337,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +deepseek-llm-67b-chat,💬,deepseek-ai/deepseek-llm-67b-chat,71.79,67.75,86.82,72.42,55.85,84.21,63.68,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2023-12-01T07:45:30Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,67,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +deepseek-llm-67b-chat,🔶,deepseek-ai/deepseek-llm-67b-chat,71.52,67.75,86.8,72.19,55.83,84.21,62.32,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2024-01-19T19:12:01Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,67,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +dolly-v2-12b,🔶,databricks/dolly-v2-12b,39.46,42.41,72.53,25.92,33.83,60.85,1.21,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,mit,12,1943,TRUE,19308160448536e378e3db21a73a751579ee7fdd,TRUE,TRUE,2023-09-09T10:52:17Z,databricks/dolly-v2-12b,https://huggingface.co/databricks/dolly-v2-12b,115,Dolly-V2-12B,822,+11/-11,3488,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b +dolphin-2.2.1-mistral-7b,🔶,cognitivecomputations/dolphin-2.2.1-mistral-7b,65.01,63.23,83.8,63.16,53.14,78.61,48.14,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,187,TRUE,2022924c0bb13588308d429e0b7f51568c07629c,TRUE,TRUE,2023-12-30T19:55:50Z,cognitivecomputations/dolphin-2.2.1-mistral-7b,https://huggingface.co/cognitivecomputations/dolphin-2.2.1-mistral-7b,70,Dolphin-2.2.1-Mistral-7B,1062,+11/-12,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,64.93,63.31,83.76,63.17,53.11,78.14,48.07,🔶 fine-tuned on domain-specific datasets,Unknown,Original,bfloat16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-12-02T05:25:26Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,70,Dolphin-2.2.1-Mistral-7B,1062,+11/-12,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,60.54,63.48,83.86,63.28,53.17,78.37,21.08,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-11-15T20:44:49Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,70,Dolphin-2.2.1-Mistral-7B,1062,+11/-12,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +gemma-1.1-7b-it,💬,google/gemma-1.1-7b-it,60.09,60.07,76.14,60.92,50.74,69.69,42.99,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,float16,TRUE,gemma,8,251,TRUE,689f62a7dfc06893ea915ca75f1cd26825c76146,TRUE,TRUE,2024-04-11T19:11:38Z,google/gemma-1.1-7b-it,https://huggingface.co/google/gemma-1.1-7b-it,64,Gemma-1.1-7B-it,1084,+4/-4,25112,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +gemma-1.1-7b-it,💬,OpenModels4all/gemma-1.1-7b-it,59.78,59.98,76.21,60.39,50.4,69.93,41.77,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,8,3,TRUE,484670e31c44eededf8c64064eb0207e7af4a2b3,TRUE,TRUE,2024-04-09T09:05:33Z,OpenModels4all/gemma-1.1-7b-it,https://huggingface.co/OpenModels4all/gemma-1.1-7b-it,64,Gemma-1.1-7B-it,1084,+4/-4,25112,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +gemma-2b-it,🔶,google/gemma-2b-it,42.75,43.94,62.7,37.65,45.82,60.93,5.46,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,2,566,TRUE,9642e777f24fde593d204a9b2471dce33334e64a,TRUE,TRUE,2024-02-22T13:13:54Z,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it,101,Gemma-2B-it,989,+8/-8,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +gemma-7b-it,🔶,google/gemma-7b-it,53.56,51.45,71.96,53.52,47.29,67.96,29.19,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,8,1099,TRUE,dec4b13d574762bd36f0a1b75541439bd852b2e8,TRUE,TRUE,2024-02-22T13:13:37Z,google/gemma-7b-it,https://huggingface.co/google/gemma-7b-it,85,Gemma-7B-it,1037,+6/-7,9177,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it +llama-13b,🟢,huggingface/llama-13b,51.36,56.23,80.93,47.67,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,0,FALSE,4022c52fcc7473ce7364bb5ac166195903ea1efb,TRUE,TRUE,2023-10-16T12:48:18Z,huggingface/llama-13b,https://huggingface.co/huggingface/llama-13b,117,LLaMA-13B,799,+11/-14,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +llama-13b,🟢,huggyllama/llama-13b,51.33,56.14,80.92,47.61,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,137,TRUE,bf57045473f207bb1de1ed035ace226f4d9f9bba,TRUE,TRUE,2023-09-09T10:52:17Z,huggyllama/llama-13b,https://huggingface.co/huggyllama/llama-13b,117,LLaMA-13B,799,+11/-14,2444,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +mistral-7b-instruct-v0.1,💬,mistralai/Mistral-7B-Instruct-v0.1,54.96,54.52,75.63,55.38,56.28,73.72,14.25,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,1456,TRUE,7961f5aa9b736bf8e364b2e6f201190f97a27931,TRUE,TRUE,2023-10-16T12:48:18Z,mistralai/Mistral-7B-Instruct-v0.1,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1,98,Mistral-7B-Instruct-v0.1,1008,+6/-6,9151,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 +mistral-7b-instruct-v0.2,💬,mistralai/Mistral-7B-Instruct-v0.2,65.71,63.14,84.88,60.78,68.26,77.19,40.03,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2382,TRUE,c72e5d1908b1e2929ec8fc4c8820e9706af1f80f,TRUE,TRUE,2023-12-11T20:10:06Z,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2,69,Mistral-7B-Instruct-v0.2,1072,+4/-4,20068,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +mistral-7b-instruct-v0.2,💬,dfurman/Mistral-7B-Instruct-v0.2,61.79,60.15,82.79,60.07,56.06,76.87,34.8,"💬 chat models (RLHF, DPO, IFT, ...)",?,Adapter,float16,TRUE,apache-2.0,7,5,TRUE,322faff8bb0c72b772762de7635f5aea9864a24a,TRUE,TRUE,2024-01-02T17:44:20Z,dfurman/Mistral-7B-Instruct-v0.2,https://huggingface.co/dfurman/Mistral-7B-Instruct-v0.2,69,Mistral-7B-Instruct-v0.2,1072,+4/-4,20068,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +mixtral-8x22b-instruct-v0.1,💬,mistralai/Mixtral-8x22B-Instruct-v0.1,79.15,72.7,89.08,77.77,68.14,85.16,82.03,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,613,TRUE,eb69dca9c68bbdcffd5f522f632d5c04ab6c65b3,TRUE,FALSE,2024-04-17T15:30:22Z,mistralai/Mixtral-8x22B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1,37,Mixtral-8x22b-Instruct-v0.1,1146,+2/-4,45772,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ +mixtral-8x7b-instruct-v0.1,🔶,mistralai/Mixtral-8x7B-Instruct-v0.1,72.7,70.14,87.55,71.4,64.98,81.06,61.11,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,3920,TRUE,125c431e2ff41a156b9f9076f744d2f35dd6e67a,TRUE,FALSE,2024-01-01T02:10:03Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,51,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,73266,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mixtral-8x7b-instruct-v0.1,💬,mistralai/Mixtral-8x7B-Instruct-v0.1,72.62,70.22,87.63,71.16,64.58,81.37,60.73,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,3920,TRUE,3de0408ae8b591d9ac516a2384925dd98ebc66f4,TRUE,FALSE,2023-12-11T12:54:17Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,51,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,73266,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mpt-30b-chat,🔶,mosaicml/mpt-30b-chat,55.38,58.7,82.54,51.16,52.42,75.3,12.13,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,30,199,TRUE,54f33278a04aa4e612bca482b82f801ab658e890,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-30b-chat,https://huggingface.co/mosaicml/mpt-30b-chat,81,MPT-30B-chat,1045,+9/-12,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat +mpt-7b-chat,🔶,mosaicml/mpt-7b-chat,45.39,46.5,75.51,37.62,40.16,68.43,4.09,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,513,TRUE,64e5c9c9fb53a8e89690c2dee75a5add37f7113e,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-7b-chat,https://huggingface.co/mosaicml/mpt-7b-chat,107,MPT-7B-Chat,927,+12/-8,4019,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat +nous-hermes-2-mixtral-8x7b-dpo,🔶,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.35,71.08,87.29,72.17,54.83,83.11,71.65,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,383,TRUE,566cdea53950f86eb51dae62812c29e79405cffe,TRUE,FALSE,2024-01-22T08:41:28Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,62,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3843,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +nous-hermes-2-mixtral-8x7b-dpo,?,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.12,71.42,87.21,72.28,54.53,82.64,70.66,"",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,383,TRUE,6ba531f1aec62375bf94ad9c7bb064953c4e9868,TRUE,FALSE,2024-06-09T15:01:07Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,62,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3843,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +openchat-3.5-0106,💬,openchat/openchat-3.5-0106,69.3,66.04,82.93,65.04,51.9,81.77,68.16,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,341,TRUE,9619fb7d2a8e25fa6b0633c0f57f7f4aa79b45c4,TRUE,TRUE,2024-01-10T09:45:30Z,openchat/openchat-3.5-0106,https://huggingface.co/openchat/openchat-3.5-0106,61,OpenChat-3.5-0106,1091,+5/-5,12985,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 +openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.52,64.93,84.18,63.64,52.24,78.06,26.08,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-17T19:50:31Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,68,OpenHermes-2.5-Mistral-7b,1074,+6/-9,5090,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.45,64.93,84.3,63.82,52.31,77.9,25.47,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-14T15:14:43Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,68,OpenHermes-2.5-Mistral-7b,1074,+6/-9,5090,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +phi-3-medium-4k-instruct,🟢,unsloth/Phi-3-medium-4k-instruct,73.57,67.06,85.69,77.85,57.75,72.85,80.21,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,13,23,TRUE,1099cff4ded0cc74fb38a90951c4e21865cddd73,TRUE,TRUE,2024-05-28T06:35:31Z,unsloth/Phi-3-medium-4k-instruct,https://huggingface.co/unsloth/Phi-3-medium-4k-instruct,43,Phi-3-Medium-4k-Instruct,1122,+4/-4,18222,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +phi-3-medium-4k-instruct,🔶,microsoft/Phi-3-medium-4k-instruct,73.45,67.32,85.76,77.83,57.71,72.69,79.38,🔶 fine-tuned on domain-specific datasets,Phi3ForCausalLM,Original,bfloat16,TRUE,mit,13,136,TRUE,d27c49ed6abea9167240288dceb4ab6bca855293,TRUE,FALSE,2024-05-27T15:40:50Z,microsoft/Phi-3-medium-4k-instruct,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct,43,Phi-3-Medium-4k-Instruct,1122,+4/-4,18222,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +phi-3-mini-128k-instruct,💬,microsoft/Phi-3-mini-128k-instruct,68.07,63.14,80.09,68.7,54.12,72.85,69.52,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,1355,TRUE,ebee18c488086b396dde649f2aa6548b9b8d2404,TRUE,FALSE,2024-04-25T13:14:03Z,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct,85,Phi-3-Mini-128k-Instruct,1037,+4/-4,21620,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ +phi-3-mini-4k-instruct,💬,microsoft/Phi-3-mini-4k-instruct,69.91,62.97,80.6,69.08,59.88,72.38,74.53,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,724,TRUE,b86bcaf57ea4dfdec5dbe12a377028b2fab0d480,TRUE,FALSE,2024-04-26T08:51:19Z,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct,70,Phi-3-Mini-4k-Instruct,1066,+5/-4,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-4k-instruct,🟢,unsloth/Phi-3-mini-4k-instruct,69.86,62.97,80.61,69.08,59.88,72.69,73.92,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,3,27,TRUE,4caf5ac193b82d28dea55dcbb22aa51d2a3be453,TRUE,TRUE,2024-05-11T07:51:45Z,unsloth/Phi-3-mini-4k-instruct,https://huggingface.co/unsloth/Phi-3-mini-4k-instruct,70,Phi-3-Mini-4k-Instruct,1066,+5/-4,21159,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +qwen1.5-110b-chat,💬,Qwen/Qwen1.5-110B-Chat,68.01,72.01,84.67,78.04,65.86,77.35,30.1,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,110,117,TRUE,5e04700b8091f10a98f1fe0b20c48c10d195ef5f,TRUE,FALSE,2024-04-29T12:55:18Z,Qwen/Qwen1.5-110B-Chat,https://huggingface.co/Qwen/Qwen1.5-110B-Chat,30,Qwen1.5-110B-Chat,1162,+3/-3,27497,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ +qwen1.5-14b-chat,🔶,Qwen/Qwen1.5-14B-Chat,62.37,58.79,82.33,68.52,60.38,73.32,30.86,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,float16,TRUE,other,14,99,TRUE,17e11c306ed235e970c9bb8e5f7233527140cdcf,TRUE,FALSE,2024-03-01T12:30:06Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,53,Qwen1.5-14B-Chat,1109,+4/-4,18673,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-14b-chat,💬,Qwen/Qwen1.5-14B-Chat,62.27,58.7,82.27,68.57,60.36,73.09,30.63,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,14,99,TRUE,9492b22871f43e975435455f5c616c77fe7a50ec,TRUE,FALSE,2024-05-16T07:47:25Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,53,Qwen1.5-14B-Chat,1109,+4/-4,18673,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-32b-chat,💬,Qwen/Qwen1.5-32B-Chat,62.95,66.04,85.49,74.99,66.95,77.19,7.05,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,102,TRUE,0b1785d88bbe93aa90a8a19da8af78eccbf010a6,TRUE,TRUE,2024-04-05T21:01:12Z,Qwen/Qwen1.5-32B-Chat,https://huggingface.co/Qwen/Qwen1.5-32B-Chat,43,Qwen1.5-32B-Chat,1125,+5/-5,22770,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ +qwen1.5-4b-chat,💬,Qwen/Qwen1.5-4B-Chat,46.79,43.26,69.73,55.55,44.79,64.96,2.43,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,3,34,TRUE,15bf46b13b1e6b6dd18ff7fa3242af406cc7e791,TRUE,FALSE,2024-02-12T17:13:33Z,Qwen/Qwen1.5-4B-Chat,https://huggingface.co/Qwen/Qwen1.5-4B-Chat,103,Qwen1.5-4B-Chat,988,+6/-8,7811,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.98,68.26,86.47,77.46,63.84,78.93,20.92,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,214,TRUE,bc11a298a0c6a5cd737064db62c6ad20ec6331be,TRUE,FALSE,2024-02-17T04:34:39Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,35,Qwen1.5-72B-Chat,1147,+3/-3,40662,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.96,68.52,86.42,77.44,63.9,79.08,20.39,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,72,214,TRUE,1a6ccc1215278f962c794b1848c710c29ef4053d,TRUE,FALSE,2024-03-07T14:52:34Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,35,Qwen1.5-72B-Chat,1147,+3/-3,40662,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.15,55.89,78.56,61.65,53.54,67.72,13.57,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-12T17:13:18Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,69,Qwen1.5-7B-Chat,1070,+7/-7,4869,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.13,55.89,78.56,61.7,53.65,67.8,13.19,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-18T04:43:41Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,69,Qwen1.5-7B-Chat,1070,+7/-7,4869,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +solar-10.7b-instruct-v1.0,?,upstage/SOLAR-10.7B-Instruct-v1.0,74.2,71.08,88.16,66.21,71.43,83.58,64.75,"",LlamaForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,10,591,TRUE,d3167df97a44b8632538b32ee8cd887893ea1435,TRUE,FALSE,2024-06-09T15:01:03Z,upstage/SOLAR-10.7B-Instruct-v1.0,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0,72,SOLAR-10.7B-Instruct-v1.0,1062,+8/-8,4293,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 +stablelm-tuned-alpha-7b,🔶,stabilityai/stablelm-tuned-alpha-7b,34.04,31.91,53.59,24.41,40.37,53.12,0.83,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,359,TRUE,25071b093c15c0d1cb2b2876c6deb621b764fcf5,TRUE,TRUE,2023-09-09T10:52:17Z,stabilityai/stablelm-tuned-alpha-7b,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b,115,StableLM-Tuned-Alpha-7B,840,+12/-12,3337,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b +starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.13,63.82,84.9,64.67,46.39,80.58,62.4,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,551,TRUE,f721e85293598f2ef774e483ae95343e39811577,FALSE,TRUE,2023-11-30T20:12:15Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,62,Starling-LM-7B-alpha,1088,+7/-5,10424,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.05,63.65,84.87,64.7,46.32,80.43,62.32,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,551,TRUE,76e60ca9807f55acd8eff3ec7ae022c5fbdf1e0e,FALSE,TRUE,2023-11-28T06:48:55Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,62,Starling-LM-7B-alpha,1088,+7/-5,10424,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +starling-lm-7b-beta,💬,Nexusflow/Starling-LM-7B-beta,69.88,67.24,83.47,65.14,55.47,81.29,66.64,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,326,TRUE,ee26b7c2cf9db00e1d9a92c9989d5b2a0b891dbd,TRUE,TRUE,2024-03-23T21:12:48Z,Nexusflow/Starling-LM-7B-beta,https://huggingface.co/Nexusflow/Starling-LM-7B-beta,45,Starling-LM-7B-beta,1119,+5/-4,16663,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta +tulu-2-dpo-70b,💬,allenai/tulu-2-dpo-70b,73.77,72.1,88.99,69.84,65.78,83.27,62.62,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,68,146,TRUE,0ab5c875f0070d5aee8d36bc55f41de440a13f02,TRUE,TRUE,2024-02-01T13:38:05Z,allenai/tulu-2-dpo-70b,https://huggingface.co/allenai/tulu-2-dpo-70b,53,Tulu-2-DPO-70B,1099,+8/-8,6669,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b +vicuna-13b,🔶,eachadea/vicuna-13b,52.3,51.71,79.94,50.84,52.68,71.03,7.58,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",12,0,FALSE,ac4218770a58baaaaf25201076fe082abb6ffd13,TRUE,TRUE,2023-10-16T12:46:18Z,eachadea/vicuna-13b,https://huggingface.co/eachadea/vicuna-13b,85,Vicuna-13B,1042,+4/-5,19798,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 +wizardlm-13b-v1.2,🔶,WizardLM/WizardLM-13B-V1.2,54.76,59.04,82.21,54.64,47.27,71.9,13.5,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,"",13,0,FALSE,6760d0c07ffdc2405295ed7a29437cf4dc414bac,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-13B-V1.2,https://huggingface.co/WizardLM/WizardLM-13B-V1.2,76,WizardLM-13b-v1.2,1058,+6/-7,7195,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 +wizardlm-70b-v1.0,💬,WizardLM/WizardLM-70B-V1.0,61.25,65.44,84.41,64.05,54.81,80.82,17.97,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,4bit,TRUE,"",70,0,FALSE,6dae38060d70b82dcfe787a612d04aaf0adf0738,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-70B-V1.0,https://huggingface.co/WizardLM/WizardLM-70B-V1.0,53,WizardLM-70B-v1.0,1106,+6/-7,8392,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 +yi-1.5-34b-chat,?,01-ai/Yi-1.5-34B-Chat,74.82,70.48,85.97,77.08,62.16,81.61,71.65,"",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,180,TRUE,fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e,TRUE,TRUE,2024-06-09T15:02:51Z,01-ai/Yi-1.5-34B-Chat,https://huggingface.co/01-ai/Yi-1.5-34B-Chat,31,Yi-1.5-34B-Chat,1157,+4/-4,25171,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat +yi-34b-chat,💬,01-ai/Yi-34B-Chat,65.32,65.44,84.16,74.9,55.37,80.11,31.92,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-12-04T08:52:11Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,49,Yi-34B-Chat,1111,+5/-5,15947,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +yi-34b-chat,💬,01-ai/Yi-34B-Chat,63.17,65.1,84.08,74.87,55.41,79.79,19.79,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-11-23T10:23:14Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,49,Yi-34B-Chat,1111,+5/-5,15947,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +zephyr-7b-alpha,🔶,HuggingFaceH4/zephyr-7b-alpha,59.5,61.01,84.04,61.39,57.9,78.61,14.03,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1085,TRUE,2cd2cd16a6ab22585d643cf264fac73b18e7852a,TRUE,TRUE,2023-10-16T12:48:18Z,HuggingFaceH4/zephyr-7b-alpha,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha,83,Zephyr-7b-alpha,1041,+10/-12,1817,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.95,62.03,84.36,61.07,57.45,77.74,29.04,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:49Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,80,Zephyr-7b-beta,1053,+5/-6,11334,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.59,62.46,84.35,60.7,57.83,77.11,27.07,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,8bit,TRUE,mit,7,1493,TRUE,0f17b36adfbe7d86ea1c591a9efeeae17b313f48,TRUE,TRUE,2023-12-04T06:04:15Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,80,Zephyr-7b-beta,1053,+5/-6,11334,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,59.08,62.03,84.53,61.06,57.44,78.06,11.37,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:38Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,80,Zephyr-7b-beta,1053,+5/-6,11334,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta