diff --git a/csv/lmsys.csv b/csv/lmsys.csv index 2b72744..0921e13 100644 --- a/csv/lmsys.csv +++ b/csv/lmsys.csv @@ -1,156 +1,158 @@ rank,rank_stylectrl,model,arena_score,95_pct_ci,votes,organization,license,knowledge_cutoff,url -1,1,ChatGPT-4o-latest (2024-09-03),1340,+4/-3,33743,OpenAI,Proprietary,2023/10,https://help.openai.com/en/articles/9624314-model-release-notes -1,1,o1-preview,1335,+4/-4,21071,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/o1 -3,6,o1-mini,1308,+4/-4,23128,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/o1 -3,4,Gemini-1.5-Pro-002,1303,+4/-4,15736,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-pro-002 -4,4,Gemini-1.5-Pro-Exp-0827,1299,+4/-3,32385,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-pro-exp-0827 -6,9,Grok-2-08-13,1290,+3/-3,40873,xAI,Proprietary,2024/3,https://x.ai/blog/grok-2 -6,3,Claude 3.5 Sonnet (20241022),1286,+6/-6,7284,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/3-5-models-and-computer-use -6,11,Yi-Lightning,1285,+4/-4,20973,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B%E4%B8%8E%E8%AE%A1%E8%B4%B9 -6,4,GPT-4o-2024-05-13,1285,+3/-3,102960,OpenAI,Proprietary,2023/10,https://openai.com/index/hello-gpt-4o/ -10,15,GLM-4-Plus,1275,+4/-4,19922,Zhipu AI,Proprietary,Unknown,https://bigmodel.cn/dev/howuse/glm-4 -10,18,GPT-4o-mini-2024-07-18,1273,+4/-3,42661,OpenAI,Proprietary,2023/10,https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/ -10,19,Gemini-1.5-Flash-002,1272,+5/-6,12379,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-flash-002 -10,26,Llama-3.1-Nemotron-70b-Instruct,1271,+5/-7,6228,Nvidia,Llama 3.1,2023/12,https://huggingface.co/nvidia/Llama-3.1-Nemotron-70B-Instruct -10,14,Gemini-1.5-Flash-Exp-0827,1269,+4/-4,25503,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash-exp-0827 -11,6,Claude 3.5 Sonnet (20240620),1268,+3/-3,81086,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/claude-3-5-sonnet -11,25,Grok-2-Mini-08-13,1267,+4/-3,34105,xAI,Proprietary,2024/3,https://x.ai/blog/grok-2 -11,8,Meta-Llama-3.1-405b-Instruct-fp8,1267,+4/-3,43099,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -11,7,Gemini Advanced App (2024-05-14),1266,+3/-3,52235,Google,Proprietary,Online,https://gemini.google.com/advanced -11,7,Meta-Llama-3.1-405b-Instruct-bf16,1266,+5/-6,14607,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -12,14,Yi-Lightning-lite,1265,+3/-5,17271,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B%E4%B8%8E%E8%AE%A1%E8%B4%B9 -12,9,GPT-4o-2024-08-06,1264,+3/-4,34765,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/gpt-4o -12,19,Qwen-Max-0919,1263,+5/-5,15384,Alibaba,Qwen,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/model-introduction -19,14,Gemini-1.5-Pro-001,1260,+3/-2,82665,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-pro -19,25,Qwen2.5-72b-Instruct,1258,+4/-5,17390,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ -22,14,GPT-4-Turbo-2024-04-09,1256,+2/-2,99055,OpenAI,Proprietary,2023/12,https://platform.openai.com/docs/models/gpt-4-turbo-and-gpt-4 -22,25,Deepseek-v2.5,1256,+4/-4,17601,DeepSeek,DeepSeek,Unknown,https://huggingface.co/deepseek-ai/DeepSeek-V2.5 -24,19,Mistral-Large-2407,1251,+3/-3,39456,Mistral,Mistral Research,2024/7,https://mistral.ai/news/mistral-large-2407/ -25,25,Athene-70b,1250,+4/-4,20711,NexusFlow,CC-BY-NC-4.0,2024/7,https://huggingface.co/Nexusflow/Athene-70B -26,15,GPT-4-1106-preview,1250,+2/-3,103422,OpenAI,Proprietary,2023/4,https://openai.com/blog/new-models-and-developer-products-announced-at-devday -27,14,Claude 3 Opus,1248,+2/-3,177919,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -27,31,Meta-Llama-3.1-70b-Instruct,1247,+3/-3,38692,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -28,19,GPT-4-0125-preview,1245,+3/-2,96746,OpenAI,Proprietary,2023/12,https://openai.com/blog/new-models-and-developer-products-announced-at-devday -32,31,Yi-Large-preview,1240,+4/-4,51730,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B -34,31,Reka-Core-20240722,1230,+6/-6,13335,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models -34,31,Qwen-Plus-0828,1227,+5/-5,14745,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/model-studio/getting-started/models -34,33,Gemini-1.5-Flash-001,1227,+3/-3,65822,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash -34,31,Jamba-1.5-Large,1221,+6/-6,9182,AI21 Labs,Jamba Open,2024/3,https://www.ai21.com/jamba -34,24,Llama-3.1-Nemotron-51b-Instruct,1218,+12/-12,1816,Nvidia,Llama 3.1,2023/12,https://huggingface.co/nvidia/Llama-3_1-Nemotron-51B-Instruct -35,33,Deepseek-v2-API-0628,1219,+4/-4,19612,DeepSeek AI,DeepSeek,Unknown,https://platform.deepseek.com/api-docs/updates#deepseek-chat -37,31,Gemma-2-27b-it,1219,+3/-3,49844,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-27b-it -37,33,Gemma-2-9b-it-SimPO,1215,+6/-5,10622,Princeton,MIT,2024/7,https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO -37,35,Command R+ (08-2024),1215,+4/-6,10599,Cohere,CC-BY-NC-4.0,2024/8,https://docs.cohere.com/docs/command-r-plus#model-details -37,36,Deepseek-Coder-v2-0724,1214,+5/-5,11772,DeepSeek,Proprietary,Unknown,https://platform.deepseek.com/api-docs/updates/#version-2024-07-24 -37,39,Yi-Large,1212,+5/-4,16671,01 AI,Proprietary,Unknown,https://platform.01.ai/docs#models-and-pricing -39,50,Gemini-1.5-Flash-8B-001,1211,+4/-6,13402,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-flash-8b -40,36,Nemotron-4-340B-Instruct,1209,+4/-4,20649,Nvidia,NVIDIA Open Model,2023/6,https://huggingface.co/nvidia/Nemotron-4-340B-Instruct -40,43,GLM-4-0520,1206,+6/-5,10229,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/dev/api#language -42,41,Llama-3-70b-Instruct,1206,+2/-2,163932,Meta,Llama 3 Community,2023/12,https://llama.meta.com/llama3/ -43,54,Gemini-1.5-Flash-8b-Exp-0827,1205,+3/-4,25483,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash-8b-exp-0827 -48,38,Claude 3 Sonnet,1201,+2/-2,113087,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -48,49,Reka-Flash-20240722,1201,+3/-4,13775,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models -48,51,Reka-Core-20240501,1199,+3/-2,62603,Reka AI,Proprietary,Unknown,https://www.reka.ai/news/reka-core-our-frontier-class-multimodal-language-model -53,49,Command R+ (04-2024),1190,+3/-3,80899,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r-plus-microsoft-azure/ -53,52,Gemma-2-9b-it,1190,+3/-3,36551,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it -53,49,Qwen2-72B-Instruct,1187,+4/-4,38990,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ -53,33,GPT-4-0314,1186,+2/-3,55981,OpenAI,Proprietary,2021/9,https://openai.com/research/gpt-4 -53,60,GLM-4-0116,1183,+5/-7,7580,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/ -54,54,Qwen-Max-0428,1183,+3/-5,25723,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/api-details -57,51,Command R (08-2024),1179,+4/-6,10940,Cohere,CC-BY-NC-4.0,2024/8,https://docs.cohere.com/docs/command-r-plus#model-details -57,52,Claude 3 Haiku,1179,+2/-2,121352,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family -57,49,DeepSeek-Coder-V2-Instruct,1178,+4/-5,15804,DeepSeek AI,DeepSeek License,2024/6,https://huggingface.co/deepseek-ai/DeepSeek-Coder-V2-Instruct -57,62,Jamba-1.5-Mini,1176,+6/-6,9299,AI21 Labs,Jamba Open,2024/3,https://www.ai21.com/jamba -59,82,Meta-Llama-3.1-8b-Instruct,1173,+3/-3,36916,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ -64,63,Reka-Flash-Preview-20240611,1165,+4/-4,20469,Reka AI,Proprietary,Unknown,https://docs.reka.ai/http-api.html#generation -64,49,GPT-4-0613,1163,+2/-3,91680,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo -64,62,Qwen1.5-110B-Chat,1161,+4/-4,27486,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ -64,78,Yi-1.5-34B-Chat,1157,+4/-3,25145,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat -65,63,Reka-Flash-21B-online,1156,+5/-5,16031,Reka AI,Proprietary,Online,https://docs.reka.ai/http-api.html#generation -66,62,Mistral-Large-2402,1157,+3/-3,64946,Mistral,Proprietary,Unknown,https://mistral.ai/news/mistral-large/ -67,73,Llama-3-8b-Instruct,1152,+3/-3,109378,Meta,Llama 3 Community,2023/3,https://llama.meta.com/llama3/ -67,88,InternLM2.5-20b-chat,1150,+5/-7,10710,InternLM,Other,2024/8,https://huggingface.co/internlm/internlm2_5-20b-chat -69,62,Claude-1,1149,+4/-4,21160,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude -69,66,Command R (04-2024),1149,+3/-3,56405,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r -69,73,Mistral Medium,1148,+4/-3,35551,Mistral,Proprietary,Unknown,https://mistral.ai/news/la-plateforme/ -69,72,Reka-Flash-21B,1148,+4/-5,25807,Reka AI,Proprietary,2023/11,https://www.reka.ai/news/reka-flash-efficient-and-capable-multimodal-language-models -69,65,Mixtral-8x22b-Instruct-v0.1,1147,+3/-3,53840,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -70,66,Qwen1.5-72B-Chat,1147,+3/-3,40647,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -78,88,Gemma-2-2b-it,1139,+4/-4,28101,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it -78,66,Claude-2.0,1132,+5/-5,12762,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2 -78,66,Gemini-1.0-Pro-001,1131,+5/-3,18789,Google,Proprietary,2023/4,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.0-pro -78,76,Zephyr-ORPO-141b-A35b-v0.1,1127,+8/-7,4857,HuggingFace,Apache 2.0,2024/4,https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1 -79,82,Qwen1.5-32B-Chat,1125,+3/-4,22763,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ -79,64,Mistral-Next,1124,+5/-4,12381,Mistral,Proprietary,Unknown,https://chat.mistral.ai/chat -81,88,Phi-3-Medium-4k-Instruct,1123,+3/-5,26158,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -81,98,Starling-LM-7B-beta,1119,+4/-5,16673,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta -82,77,Claude-2.1,1118,+3/-3,37693,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2-1 -84,74,GPT-3.5-Turbo-0613,1117,+3/-4,38949,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -85,94,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -85,74,Gemini Pro,1111,+7/-7,6561,Google,Proprietary,2023/4,https://blog.google/technology/ai/gemini-api-developers-cloud/ -86,88,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,76142,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -86,82,Claude-Instant-1,1111,+4/-5,20625,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude -86,66,GPT-3.5-Turbo-0314,1106,+8/-9,5647,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -88,91,Qwen1.5-14B-Chat,1109,+5/-4,18674,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -89,90,WizardLM-70B-v1.0,1106,+7/-6,8384,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 -89,74,GPT-3.5-Turbo-0125,1106,+3/-3,68902,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5-turbo -89,95,Meta-Llama-3.2-3b-Instruct,1103,+8/-7,8459,Meta,Llama 3.2,2023/12,https://ai.meta.com/blog/llama-3-2-connect-2024-vision-edge-mobile-devices/ -89,88,DBRX-Instruct-Preview,1103,+4/-3,33730,Databricks,DBRX LICENSE,2023/12,https://www.databricks.com/blog/introducing-dbrx-new-state-art-open-llm -91,94,Phi-3-Small-8k-Instruct,1102,+4/-5,18500,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct -91,96,Tulu-2-DPO-70B,1099,+6/-8,6668,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b -98,105,Llama-2-70b-chat,1093,+3/-3,39630,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf -98,94,OpenChat-3.5-0106,1091,+5/-5,12975,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 -99,98,Vicuna-33B,1091,+4/-3,22942,LMSYS,Non-commercial,2023/8,https://huggingface.co/lmsys/vicuna-33b-v1.3 -99,93,Snowflake Arctic Instruct,1090,+4/-4,34178,Snowflake,Apache 2.0,2024/4,https://www.snowflake.com/blog/arctic-open-efficient-foundation-language-models-snowflake/ -99,103,Starling-LM-7B-alpha,1088,+5/-5,10416,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -99,108,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+9/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -100,105,NV-Llama2-70B-SteerLM-Chat,1080,+11/-8,3640,Nvidia,Llama 2 Community,2023/11,https://huggingface.co/nvidia/Llama2-70B-SteerLM-Chat -101,94,Gemma-1.1-7b-it,1084,+5/-5,25082,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -104,97,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -104,97,OpenHermes-2.5-Mistral-7b,1075,+8/-9,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -105,107,pplx-70b-online,1078,+5/-7,6893,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms -105,95,OpenChat-3.5,1076,+6/-6,8115,OpenChat,Apache-2.0,2023/11,https://huggingface.co/openchat/openchat_3.5 -105,110,Qwen1.5-7B-Chat,1070,+10/-7,4864,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -106,110,Phi-3-Mini-4k-Instruct-June-24,1071,+6/-6,12882,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -106,108,Dolphin-2.2.1-Mistral-7B,1062,+14/-13,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -107,110,Mistral-7B-Instruct-v0.2,1072,+4/-4,20063,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -107,88,GPT-3.5-Turbo-1106,1068,+4/-4,17031,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 -108,115,Phi-3-Mini-4k-Instruct,1066,+5/-4,21126,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -109,110,SOLAR-10.7B-Instruct-v1.0,1062,+9/-9,4286,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 -112,115,Llama-2-13b-chat,1063,+3/-5,19725,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-13b-chat-hf -114,110,WizardLM-13b-v1.2,1059,+6/-9,7183,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 -117,118,Zephyr-7b-beta,1053,+6/-5,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -117,121,Meta-Llama-3.2-1b-Instruct,1053,+6/-6,8567,Meta,Llama 3.2,2023/12,https://ai.meta.com/blog/llama-3-2-connect-2024-vision-edge-mobile-devices/ -118,110,MPT-30B-chat,1046,+8/-12,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat -118,118,CodeLlama-70B-instruct,1042,+14/-16,1191,Meta,Llama 2 Community,2024/1,https://huggingface.co/codellama/CodeLlama-70b-hf -119,124,pplx-7b-online,1045,+6/-6,6334,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms -119,118,CodeLlama-34B-instruct,1043,+7/-7,7507,Meta,Llama 2 Community,2023/7,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf -119,115,Zephyr-7b-alpha,1041,+11/-11,1814,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha -121,110,falcon-180b-chat,1034,+15/-18,1327,TII,Falcon-180B TII License,2023/9,https://huggingface.co/tiiuae/falcon-180B-chat -123,113,Vicuna-13B,1042,+4/-4,19790,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 -123,120,Gemma-7b-it,1037,+6/-6,9177,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it -123,121,Phi-3-Mini-128k-Instruct,1037,+4/-3,21632,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -123,135,Llama-2-7b-chat,1037,+6/-4,14554,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf -123,111,Qwen-14B-Chat,1035,+8/-6,5070,Alibaba,Qianwen LICENSE,2023/8,https://huggingface.co/Qwen/Qwen-14B-Chat -123,124,Guanaco-33B,1032,+9/-12,2998,UW,Non-commercial,2023/5,https://huggingface.co/timdettmers/guanaco-33b-merged -132,129,StripedHyena-Nous-7B,1017,+9/-9,5271,Together AI,Apache 2.0,2023/12,https://huggingface.co/togethercomputer/StripedHyena-Nous-7B -133,124,Gemma-1.1-2b-it,1021,+5/-5,11348,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it -133,142,OLMo-7B-instruct,1015,+6/-5,6499,Allen AI,Apache-2.0,2024/2,https://huggingface.co/allenai/OLMo-7B-Instruct -135,133,Mistral-7B-Instruct-v0.1,1008,+7/-6,9146,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 -136,135,Vicuna-7B,1005,+7/-7,7019,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-7b-v1.5 -136,124,PaLM-Chat-Bison-001,1003,+7/-8,8741,Google,Proprietary,2021/6,https://cloud.google.com/vertex-ai/docs/generative-ai/learn/models#foundation_models -139,139,Gemma-2b-it,990,+9/-8,4918,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it -141,137,Qwen1.5-4B-Chat,988,+7/-6,7814,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -143,142,Koala-13B,964,+9/-8,7035,UC Berkeley,Non-commercial,2023/4,https://bair.berkeley.edu/blog/2023/04/03/koala/ -143,142,ChatGLM3-6B,955,+8/-10,4763,Tsinghua,Apache-2.0,2023/10,https://huggingface.co/THUDM/chatglm3-6b -144,143,GPT4All-13B-Snoozy,932,+15/-16,1786,Nomic AI,Non-commercial,2023/3,https://huggingface.co/nomic-ai/gpt4all-13b-snoozy -145,143,MPT-7B-Chat,928,+10/-10,4013,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat -145,148,ChatGLM2-6B,924,+10/-12,2707,Tsinghua,Apache-2.0,2023/6,https://huggingface.co/THUDM/chatglm2-6b -145,147,RWKV-4-Raven-14B,922,+8/-8,4935,RWKV,Apache 2.0,2023/4,https://huggingface.co/BlinkDL/rwkv-4-raven -149,143,Alpaca-13B,902,+10/-10,5872,Stanford,Non-commercial,2023/3,https://crfm.stanford.edu/2023/03/13/alpaca.html -149,149,OpenAssistant-Pythia-12B,893,+7/-10,6382,OpenAssistant,Apache 2.0,2023/4,https://huggingface.co/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5 -150,151,ChatGLM-6B,879,+10/-8,4996,Tsinghua,Non-commercial,2023/3,https://huggingface.co/THUDM/chatglm-6b -151,151,FastChat-T5-3B,868,+9/-11,4303,LMSYS,Apache 2.0,2023/4,https://huggingface.co/lmsys/fastchat-t5-3b-v1.0 -153,154,StableLM-Tuned-Alpha-7B,840,+10/-10,3336,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b -153,151,Dolly-V2-12B,822,+12/-10,3486,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b -155,152,LLaMA-13B,799,+12/-12,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +1,1,ChatGPT-4o-latest (2024-09-03),1340,+3/-4,37712,OpenAI,Proprietary,2023/10,https://help.openai.com/en/articles/9624314-model-release-notes +1,1,o1-preview,1334,+4/-5,23562,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/o1 +3,6,o1-mini,1308,+4/-4,26062,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/o1 +3,4,Gemini-1.5-Pro-002,1301,+5/-3,19523,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-pro-002 +4,4,Gemini-1.5-Pro-Exp-0827,1299,+3/-3,32380,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-pro-exp-0827 +6,9,Grok-2-08-13,1290,+4/-4,43774,xAI,Proprietary,2024/3,https://x.ai/blog/grok-2 +6,11,Yi-Lightning,1287,+4/-3,24473,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B%E4%B8%8E%E8%AE%A1%E8%B4%B9 +6,4,GPT-4o-2024-05-13,1285,+2/-2,105541,OpenAI,Proprietary,2023/10,https://openai.com/index/hello-gpt-4o/ +6,3,Claude 3.5 Sonnet (20241022),1283,+5/-4,19005,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/3-5-models-and-computer-use +9,16,GLM-4-Plus,1275,+4/-4,22574,Zhipu AI,Proprietary,Unknown,https://bigmodel.cn/dev/howuse/glm-4 +10,18,GPT-4o-mini-2024-07-18,1273,+3/-3,45274,OpenAI,Proprietary,2023/10,https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/ +10,18,Gemini-1.5-Flash-002,1272,+5/-5,15030,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-flash-002 +10,27,Llama-3.1-Nemotron-70B-Instruct,1271,+6/-6,6572,Nvidia,Llama 3.1,2023/12,https://huggingface.co/nvidia/Llama-3.1-Nemotron-70B-Instruct +10,14,Gemini-1.5-Flash-Exp-0827,1269,+3/-4,25491,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash-exp-0827 +11,6,Claude 3.5 Sonnet (20240620),1268,+2/-3,83825,Anthropic,Proprietary,2024/4,https://www.anthropic.com/news/claude-3-5-sonnet +11,7,Meta-Llama-3.1-405B-Instruct-fp8,1267,+3/-3,45768,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +11,8,Meta-Llama-3.1-405B-Instruct-bf16,1266,+5/-4,14608,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +11,14,Yi-Lightning-lite,1264,+6/-4,17293,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B%E4%B8%8E%E8%AE%A1%E8%B4%B9 +12,25,Grok-2-Mini-08-13,1267,+3/-4,36342,xAI,Proprietary,2024/3,https://x.ai/blog/grok-2 +12,7,Gemini Advanced App (2024-05-14),1266,+3/-3,52230,Google,Proprietary,Online,https://gemini.google.com/advanced +12,8,GPT-4o-2024-08-06,1264,+4/-3,37444,OpenAI,Proprietary,2023/10,https://platform.openai.com/docs/models/gpt-4o +12,18,Qwen-Max-0919,1264,+5/-4,17658,Alibaba,Qwen,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/model-introduction +19,25,Qwen2.5-72B-Instruct,1259,+4/-4,20113,Alibaba,Qwen,2024/9,https://qwenlm.github.io/blog/qwen2.5/ +20,14,Gemini-1.5-Pro-001,1260,+2/-3,82660,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-pro +20,24,Deepseek-v2.5,1257,+4/-5,20034,DeepSeek,DeepSeek,Unknown,https://huggingface.co/deepseek-ai/DeepSeek-V2.5 +23,14,GPT-4-Turbo-2024-04-09,1257,+2/-2,100404,OpenAI,Proprietary,2023/12,https://platform.openai.com/docs/models/gpt-4-turbo-and-gpt-4 +24,19,Mistral-Large-2407,1251,+3/-4,42110,Mistral,Mistral Research,2024/7,https://mistral.ai/news/mistral-large-2407/ +24,25,Athene-70B,1250,+5/-3,20709,NexusFlow,CC-BY-NC-4.0,2024/7,https://huggingface.co/Nexusflow/Athene-70B +27,16,GPT-4-1106-preview,1250,+2/-3,103894,OpenAI,Proprietary,2023/4,https://openai.com/blog/new-models-and-developer-products-announced-at-devday +27,14,Claude 3 Opus,1248,+2/-2,180601,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +27,31,Meta-Llama-3.1-70B-Instruct,1247,+3/-3,41484,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +28,19,GPT-4-0125-preview,1245,+2/-3,97214,OpenAI,Proprietary,2023/12,https://openai.com/blog/new-models-and-developer-products-announced-at-devday +33,32,Yi-Large-preview,1240,+2/-3,51722,01 AI,Proprietary,Unknown,https://platform.lingyiwanwu.com/docs#%E6%A8%A1%E5%9E%8B +33,31,Reka-Core-20240904,1235,+7/-6,8013,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models +34,31,Reka-Core-20240722,1230,+4/-5,13331,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models +34,31,Qwen-Plus-0828,1227,+4/-5,14751,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/model-studio/getting-started/models +34,33,Gemini-1.5-Flash-001,1227,+3/-3,65808,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash +35,32,Jamba-1.5-Large,1221,+6/-6,9188,AI21 Labs,Jamba Open,2024/3,https://www.ai21.com/jamba +36,33,Deepseek-v2-API-0628,1219,+4/-4,19616,DeepSeek AI,DeepSeek,Unknown,https://platform.deepseek.com/api-docs/updates#deepseek-chat +38,32,Gemma-2-27B-it,1219,+3/-3,52532,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-27b-it +38,33,Gemma-2-9B-it-SimPO,1215,+5/-6,10618,Princeton,MIT,2024/7,https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO +38,34,Command R+ (08-2024),1215,+4/-5,10602,Cohere,CC-BY-NC-4.0,2024/8,https://docs.cohere.com/docs/command-r-plus#model-details +38,34,Deepseek-Coder-v2-0724,1214,+6/-5,11774,DeepSeek,Proprietary,Unknown,https://platform.deepseek.com/api-docs/updates/#version-2024-07-24 +38,39,Yi-Large,1212,+4/-4,16666,01 AI,Proprietary,Unknown,https://platform.01.ai/docs#models-and-pricing +38,52,Gemini-1.5-Flash-8B-001,1212,+5/-4,16178,Google,Proprietary,Unknown,https://aistudio.google.com/app/prompts/new_chat?instructions=lmsys&model=gemini-1.5-flash-8b +38,31,Llama-3.1-Nemotron-51B-Instruct,1208,+11/-10,3153,Nvidia,Llama 3.1,2023/12,https://huggingface.co/nvidia/Llama-3_1-Nemotron-51B-Instruct +41,35,Nemotron-4-340B-Instruct,1209,+5/-4,20645,Nvidia,NVIDIA Open Model,2023/6,https://huggingface.co/nvidia/Nemotron-4-340B-Instruct +41,43,GLM-4-0520,1207,+5/-5,10229,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/dev/api#language +41,39,Reka-Flash-20240904,1206,+8/-5,8204,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models +42,56,Gemini-1.5-Flash-8B-Exp-0827,1205,+5/-4,25491,Google,Proprietary,2023/11,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.5-flash-8b-exp-0827 +45,41,Llama-3-70B-Instruct,1206,+2/-2,163936,Meta,Llama 3 Community,2023/12,https://llama.meta.com/llama3/ +46,51,Reka-Flash-20240722,1201,+5/-6,13774,Reka AI,Proprietary,Unknown,https://docs.reka.ai/available-models +48,35,Claude 3 Sonnet,1201,+2/-2,113076,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +48,54,Reka-Core-20240501,1200,+3/-3,62623,Reka AI,Proprietary,Unknown,https://www.reka.ai/news/reka-core-our-frontier-class-multimodal-language-model +55,51,Command R+ (04-2024),1190,+2/-3,80907,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r-plus-microsoft-azure/ +55,54,Gemma-2-9B-it,1190,+3/-3,37949,Google,Gemma license,2024/6,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-9b-it +55,51,Qwen2-72B-Instruct,1187,+3/-3,38985,Alibaba,Qianwen LICENSE,2024/6,https://qwenlm.github.io/blog/qwen2/ +55,33,GPT-4-0314,1186,+4/-4,55978,OpenAI,Proprietary,2021/9,https://openai.com/research/gpt-4 +55,62,GLM-4-0116,1183,+6/-6,7582,Zhipu AI,Proprietary,Unknown,https://open.bigmodel.cn/ +56,56,Qwen-Max-0428,1183,+3/-3,25725,Alibaba,Proprietary,Unknown,https://help.aliyun.com/zh/dashscope/developer-reference/api-details +57,53,Command R (08-2024),1180,+5/-5,10931,Cohere,CC-BY-NC-4.0,2024/8,https://docs.cohere.com/docs/command-r-plus#model-details +59,54,Claude 3 Haiku,1179,+3/-2,122440,Anthropic,Proprietary,2023/8,https://www.anthropic.com/news/claude-3-family +59,51,DeepSeek-Coder-V2-Instruct,1178,+4/-5,15798,DeepSeek AI,DeepSeek License,2024/6,https://huggingface.co/deepseek-ai/DeepSeek-Coder-V2-Instruct +59,64,Jamba-1.5-Mini,1176,+6/-5,9298,AI21 Labs,Jamba Open,2024/3,https://www.ai21.com/jamba +60,84,Meta-Llama-3.1-8B-Instruct,1175,+3/-3,39806,Meta,Llama 3.1 Community,2023/12,https://ai.meta.com/blog/meta-llama-3-1/ +66,67,Reka-Flash-Preview-20240611,1165,+3/-4,20467,Reka AI,Proprietary,Unknown,https://docs.reka.ai/http-api.html#generation +66,50,GPT-4-0613,1163,+2/-2,91664,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-4-and-gpt-4-turbo +66,64,Qwen1.5-110B-Chat,1161,+4/-4,27474,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ +68,64,Mistral-Large-2402,1157,+3/-2,64939,Mistral,Proprietary,Unknown,https://mistral.ai/news/mistral-large/ +68,80,Yi-1.5-34B-Chat,1157,+3/-3,25143,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat +68,64,Reka-Flash-21B-online,1156,+4/-4,16037,Reka AI,Proprietary,Online,https://docs.reka.ai/http-api.html#generation +69,90,InternLM2.5-20B-chat,1150,+6/-5,10716,InternLM,Other,2024/8,https://huggingface.co/internlm/internlm2_5-20b-chat +71,74,Llama-3-8B-Instruct,1152,+2/-3,109373,Meta,Llama 3 Community,2023/3,https://llama.meta.com/llama3/ +71,64,Claude-1,1149,+4/-4,21157,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude +72,69,Command R (04-2024),1149,+2/-3,56405,Cohere,CC-BY-NC-4.0,2024/3,https://txt.cohere.com/command-r +72,71,Mistral Medium,1148,+3/-4,35552,Mistral,Proprietary,Unknown,https://mistral.ai/news/la-plateforme/ +72,72,Reka-Flash-21B,1148,+3/-4,25811,Reka AI,Proprietary,2023/11,https://www.reka.ai/news/reka-flash-efficient-and-capable-multimodal-language-models +72,68,Mixtral-8x22b-Instruct-v0.1,1147,+3/-3,53841,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ +72,68,Qwen1.5-72B-Chat,1147,+3/-3,40646,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +80,90,Gemma-2-2b-it,1139,+4/-3,29470,Google,Gemma license,2024/7,https://aistudio.google.com/app/prompts/new_chat?model=gemma-2-2b-it +80,69,Claude-2.0,1132,+5/-6,12765,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2 +81,68,Gemini-1.0-Pro-001,1131,+4/-5,18785,Google,Proprietary,2023/4,https://aistudio.google.com/app/prompts/new_chat?model=gemini-1.0-pro +81,79,Zephyr-ORPO-141b-A35b-v0.1,1127,+8/-9,4857,HuggingFace,Apache 2.0,2024/4,https://huggingface.co/HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1 +81,84,Qwen1.5-32B-Chat,1125,+5/-3,22760,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ +81,64,Mistral-Next,1124,+6/-7,12381,Mistral,Proprietary,Unknown,https://chat.mistral.ai/chat +82,90,Phi-3-Medium-4k-Instruct,1123,+3/-3,26149,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +83,99,Starling-LM-7B-beta,1119,+4/-4,16670,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta +84,77,Claude-2.1,1118,+3/-4,37694,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/claude-2-1 +84,77,GPT-3.5-Turbo-0613,1117,+4/-3,38957,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +86,79,Gemini Pro,1111,+7/-8,6561,Google,Proprietary,2023/4,https://blog.google/technology/ai/gemini-api-developers-cloud/ +87,96,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +87,84,Claude-Instant-1,1111,+4/-4,20623,Anthropic,Proprietary,Unknown,https://www.anthropic.com/index/introducing-claude +87,69,GPT-3.5-Turbo-0314,1106,+8/-8,5647,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +89,91,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76141,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +91,93,Qwen1.5-14B-Chat,1109,+5/-4,18669,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +91,92,WizardLM-70B-v1.0,1106,+7/-6,8382,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 +91,77,GPT-3.5-Turbo-0125,1106,+3/-3,68889,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5-turbo +91,98,Meta-Llama-3.2-3B-Instruct,1103,+5/-6,8467,Meta,Llama 3.2,2023/12,https://ai.meta.com/blog/llama-3-2-connect-2024-vision-edge-mobile-devices/ +92,90,DBRX-Instruct-Preview,1103,+4/-3,33725,Databricks,DBRX LICENSE,2023/12,https://www.databricks.com/blog/introducing-dbrx-new-state-art-open-llm +93,97,Phi-3-Small-8k-Instruct,1102,+3/-4,18497,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-small-8k-instruct +94,99,Tulu-2-DPO-70B,1099,+6/-7,6666,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b +101,107,Llama-2-70B-chat,1093,+3/-3,39621,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf +101,95,OpenChat-3.5-0106,1091,+5/-4,12973,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 +101,100,Vicuna-33B,1091,+4/-4,22945,LMSYS,Non-commercial,2023/8,https://huggingface.co/lmsys/vicuna-33b-v1.3 +101,95,Snowflake Arctic Instruct,1090,+3/-3,34192,Snowflake,Apache 2.0,2024/4,https://www.snowflake.com/blog/arctic-open-efficient-foundation-language-models-snowflake/ +101,103,Starling-LM-7B-alpha,1088,+6/-5,10415,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +102,110,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +103,97,Gemma-1.1-7B-it,1084,+4/-4,25090,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +103,108,NV-Llama2-70B-SteerLM-Chat,1080,+8/-9,3638,Nvidia,Llama 2 Community,2023/11,https://huggingface.co/nvidia/Llama2-70B-SteerLM-Chat +106,110,pplx-70B-online,1078,+8/-7,6893,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms +106,99,DeepSeek-LLM-67B-Chat,1077,+7/-7,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +107,97,OpenChat-3.5,1076,+5/-7,8112,OpenChat,Apache-2.0,2023/11,https://huggingface.co/openchat/openchat_3.5 +107,98,OpenHermes-2.5-Mistral-7B,1074,+8/-7,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +108,112,Mistral-7B-Instruct-v0.2,1072,+5/-4,20065,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +108,112,Phi-3-Mini-4K-Instruct-June-24,1071,+6/-4,12881,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +108,112,Qwen1.5-7B-Chat,1070,+8/-9,4865,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +108,110,Dolphin-2.2.1-Mistral-7B,1062,+16/-13,1713,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +109,92,GPT-3.5-Turbo-1106,1068,+6/-6,17029,OpenAI,Proprietary,2021/9,https://platform.openai.com/docs/models/gpt-3-5 +110,112,SOLAR-10.7B-Instruct-v1.0,1062,+9/-8,4287,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 +112,117,Phi-3-Mini-4k-Instruct,1066,+4/-6,21119,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +114,120,Llama-2-13b-chat,1063,+5/-4,19727,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-13b-chat-hf +115,112,WizardLM-13b-v1.2,1058,+8/-7,7185,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 +119,124,Meta-Llama-3.2-1B-Instruct,1054,+6/-6,8578,Meta,Llama 3.2,2023/12,https://ai.meta.com/blog/llama-3-2-connect-2024-vision-edge-mobile-devices/ +120,120,Zephyr-7B-beta,1053,+6/-7,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +120,112,MPT-30B-chat,1045,+9/-10,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat +120,117,CodeLlama-70B-instruct,1042,+17/-14,1189,Meta,Llama 2 Community,2024/1,https://huggingface.co/codellama/CodeLlama-70b-hf +121,125,pplx-7B-online,1044,+9/-8,6335,Perplexity AI,Proprietary,Online,https://blog.perplexity.ai/blog/introducing-pplx-online-llms +121,117,Zephyr-7B-alpha,1041,+11/-12,1813,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha +122,122,CodeLlama-34B-instruct,1043,+7/-6,7508,Meta,Llama 2 Community,2023/7,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf +122,111,falcon-180b-chat,1034,+15/-13,1326,TII,Falcon-180B TII License,2023/9,https://huggingface.co/tiiuae/falcon-180B-chat +124,115,Vicuna-13B,1042,+4/-5,19788,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 +125,123,Gemma-7B-it,1037,+5/-6,9175,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it +125,122,Phi-3-Mini-128k-Instruct,1037,+4/-4,21621,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ +125,136,Llama-2-7B-chat,1037,+5/-5,14556,Meta,Llama 2 Community,2023/7,https://huggingface.co/meta-llama/Llama-2-7b-chat-hf +125,113,Qwen-14B-Chat,1035,+8/-8,5068,Alibaba,Qianwen LICENSE,2023/8,https://huggingface.co/Qwen/Qwen-14B-Chat +125,125,Guanaco-33B,1032,+10/-9,2998,UW,Non-commercial,2023/5,https://huggingface.co/timdettmers/guanaco-33b-merged +135,126,Gemma-1.1-2b-it,1021,+6/-7,11347,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-2b-it +135,128,StripedHyena-Nous-7B,1018,+7/-8,5271,Together AI,Apache 2.0,2023/12,https://huggingface.co/togethercomputer/StripedHyena-Nous-7B +136,143,OLMo-7B-instruct,1015,+7/-7,6499,Allen AI,Apache-2.0,2024/2,https://huggingface.co/allenai/OLMo-7B-Instruct +137,135,Mistral-7B-Instruct-v0.1,1008,+6/-6,9143,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 +138,137,Vicuna-7B,1005,+8/-9,7017,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-7b-v1.5 +138,126,PaLM-Chat-Bison-001,1003,+7/-6,8742,Google,Proprietary,2021/6,https://cloud.google.com/vertex-ai/docs/generative-ai/learn/models#foundation_models +141,141,Gemma-2B-it,990,+8/-9,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +143,139,Qwen1.5-4B-Chat,988,+6/-6,7812,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +145,144,Koala-13B,964,+8/-7,7033,UC Berkeley,Non-commercial,2023/4,https://bair.berkeley.edu/blog/2023/04/03/koala/ +145,145,ChatGLM3-6B,955,+8/-8,4762,Tsinghua,Apache-2.0,2023/10,https://huggingface.co/THUDM/chatglm3-6b +147,145,GPT4All-13B-Snoozy,932,+14/-16,1786,Nomic AI,Non-commercial,2023/3,https://huggingface.co/nomic-ai/gpt4all-13b-snoozy +147,145,MPT-7B-Chat,928,+9/-10,4013,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat +147,150,ChatGLM2-6B,924,+11/-10,2707,Tsinghua,Apache-2.0,2023/6,https://huggingface.co/THUDM/chatglm2-6b +147,150,RWKV-4-Raven-14B,922,+9/-8,4934,RWKV,Apache 2.0,2023/4,https://huggingface.co/BlinkDL/rwkv-4-raven +151,145,Alpaca-13B,902,+8/-7,5872,Stanford,Non-commercial,2023/3,https://crfm.stanford.edu/2023/03/13/alpaca.html +151,150,OpenAssistant-Pythia-12B,893,+9/-10,6382,OpenAssistant,Apache 2.0,2023/4,https://huggingface.co/OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5 +152,153,ChatGLM-6B,879,+10/-8,4995,Tsinghua,Non-commercial,2023/3,https://huggingface.co/THUDM/chatglm-6b +153,153,FastChat-T5-3B,868,+8/-10,4302,LMSYS,Apache 2.0,2023/4,https://huggingface.co/lmsys/fastchat-t5-3b-v1.0 +155,155,StableLM-Tuned-Alpha-7B,840,+12/-11,3336,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b +155,153,Dolly-V2-12B,822,+10/-9,3486,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b +157,154,LLaMA-13B,799,+13/-13,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 diff --git a/csv/merged.csv b/csv/merged.csv index bd975fb..b2dcd96 100644 --- a/csv/merged.csv +++ b/csv/merged.csv @@ -1,56 +1,56 @@ key,t,model.x,average,arc,hellaswag,mmlu,truthfulqa,winogrande,gsm8k,type,architecture,weight_type,precision,merged,hub_license,params_b,hub_hearts,available_on_the_hub,model_sha,flagged,moe,date,fullname,url.x,rank,rank_stylectrl,model.y,arena_score,95_pct_ci,votes,organization,license,knowledge_cutoff,url.y -deepseek-llm-67b-chat,💬,deepseek-ai/deepseek-llm-67b-chat,71.79,67.75,86.82,72.42,55.85,84.21,63.68,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2023-12-01T07:45:30Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,104,97,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -deepseek-llm-67b-chat,🔶,deepseek-ai/deepseek-llm-67b-chat,71.52,67.75,86.8,72.19,55.83,84.21,62.32,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2024-01-19T19:12:01Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,104,97,DeepSeek-LLM-67B-Chat,1077,+8/-8,4984,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat -dolly-v2-12b,🔶,databricks/dolly-v2-12b,39.46,42.41,72.53,25.92,33.83,60.85,1.21,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,mit,12,1943,TRUE,19308160448536e378e3db21a73a751579ee7fdd,TRUE,TRUE,2023-09-09T10:52:17Z,databricks/dolly-v2-12b,https://huggingface.co/databricks/dolly-v2-12b,153,151,Dolly-V2-12B,822,+12/-10,3486,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b -dolphin-2.2.1-mistral-7b,🔶,cognitivecomputations/dolphin-2.2.1-mistral-7b,65.01,63.23,83.8,63.16,53.14,78.61,48.14,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,187,TRUE,2022924c0bb13588308d429e0b7f51568c07629c,TRUE,TRUE,2023-12-30T19:55:50Z,cognitivecomputations/dolphin-2.2.1-mistral-7b,https://huggingface.co/cognitivecomputations/dolphin-2.2.1-mistral-7b,106,108,Dolphin-2.2.1-Mistral-7B,1062,+14/-13,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,64.93,63.31,83.76,63.17,53.11,78.14,48.07,🔶 fine-tuned on domain-specific datasets,Unknown,Original,bfloat16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-12-02T05:25:26Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,106,108,Dolphin-2.2.1-Mistral-7B,1062,+14/-13,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,60.54,63.48,83.86,63.28,53.17,78.37,21.08,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-11-15T20:44:49Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,106,108,Dolphin-2.2.1-Mistral-7B,1062,+14/-13,1714,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b -gemma-1.1-7b-it,💬,google/gemma-1.1-7b-it,60.09,60.07,76.14,60.92,50.74,69.69,42.99,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,float16,TRUE,gemma,8,251,TRUE,689f62a7dfc06893ea915ca75f1cd26825c76146,TRUE,TRUE,2024-04-11T19:11:38Z,google/gemma-1.1-7b-it,https://huggingface.co/google/gemma-1.1-7b-it,101,94,Gemma-1.1-7b-it,1084,+5/-5,25082,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -gemma-1.1-7b-it,💬,OpenModels4all/gemma-1.1-7b-it,59.78,59.98,76.21,60.39,50.4,69.93,41.77,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,8,3,TRUE,484670e31c44eededf8c64064eb0207e7af4a2b3,TRUE,TRUE,2024-04-09T09:05:33Z,OpenModels4all/gemma-1.1-7b-it,https://huggingface.co/OpenModels4all/gemma-1.1-7b-it,101,94,Gemma-1.1-7b-it,1084,+5/-5,25082,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it -gemma-2b-it,🔶,google/gemma-2b-it,42.75,43.94,62.7,37.65,45.82,60.93,5.46,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,2,566,TRUE,9642e777f24fde593d204a9b2471dce33334e64a,TRUE,TRUE,2024-02-22T13:13:54Z,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it,139,139,Gemma-2b-it,990,+9/-8,4918,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it -gemma-7b-it,🔶,google/gemma-7b-it,53.56,51.45,71.96,53.52,47.29,67.96,29.19,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,8,1099,TRUE,dec4b13d574762bd36f0a1b75541439bd852b2e8,TRUE,TRUE,2024-02-22T13:13:37Z,google/gemma-7b-it,https://huggingface.co/google/gemma-7b-it,123,120,Gemma-7b-it,1037,+6/-6,9177,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it -llama-13b,🟢,huggingface/llama-13b,51.36,56.23,80.93,47.67,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,0,FALSE,4022c52fcc7473ce7364bb5ac166195903ea1efb,TRUE,TRUE,2023-10-16T12:48:18Z,huggingface/llama-13b,https://huggingface.co/huggingface/llama-13b,155,152,LLaMA-13B,799,+12/-12,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 -llama-13b,🟢,huggyllama/llama-13b,51.33,56.14,80.92,47.61,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,137,TRUE,bf57045473f207bb1de1ed035ace226f4d9f9bba,TRUE,TRUE,2023-09-09T10:52:17Z,huggyllama/llama-13b,https://huggingface.co/huggyllama/llama-13b,155,152,LLaMA-13B,799,+12/-12,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 -mistral-7b-instruct-v0.1,💬,mistralai/Mistral-7B-Instruct-v0.1,54.96,54.52,75.63,55.38,56.28,73.72,14.25,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,1456,TRUE,7961f5aa9b736bf8e364b2e6f201190f97a27931,TRUE,TRUE,2023-10-16T12:48:18Z,mistralai/Mistral-7B-Instruct-v0.1,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1,135,133,Mistral-7B-Instruct-v0.1,1008,+7/-6,9146,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 -mistral-7b-instruct-v0.2,💬,mistralai/Mistral-7B-Instruct-v0.2,65.71,63.14,84.88,60.78,68.26,77.19,40.03,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2382,TRUE,c72e5d1908b1e2929ec8fc4c8820e9706af1f80f,TRUE,TRUE,2023-12-11T20:10:06Z,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2,107,110,Mistral-7B-Instruct-v0.2,1072,+4/-4,20063,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -mistral-7b-instruct-v0.2,💬,dfurman/Mistral-7B-Instruct-v0.2,61.79,60.15,82.79,60.07,56.06,76.87,34.8,"💬 chat models (RLHF, DPO, IFT, ...)",?,Adapter,float16,TRUE,apache-2.0,7,5,TRUE,322faff8bb0c72b772762de7635f5aea9864a24a,TRUE,TRUE,2024-01-02T17:44:20Z,dfurman/Mistral-7B-Instruct-v0.2,https://huggingface.co/dfurman/Mistral-7B-Instruct-v0.2,107,110,Mistral-7B-Instruct-v0.2,1072,+4/-4,20063,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 -mixtral-8x22b-instruct-v0.1,💬,mistralai/Mixtral-8x22B-Instruct-v0.1,79.15,72.7,89.08,77.77,68.14,85.16,82.03,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,613,TRUE,eb69dca9c68bbdcffd5f522f632d5c04ab6c65b3,TRUE,FALSE,2024-04-17T15:30:22Z,mistralai/Mixtral-8x22B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1,69,65,Mixtral-8x22b-Instruct-v0.1,1147,+3/-3,53840,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ -mixtral-8x7b-instruct-v0.1,🔶,mistralai/Mixtral-8x7B-Instruct-v0.1,72.7,70.14,87.55,71.4,64.98,81.06,61.11,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,3920,TRUE,125c431e2ff41a156b9f9076f744d2f35dd6e67a,TRUE,FALSE,2024-01-01T02:10:03Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,86,88,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,76142,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -mixtral-8x7b-instruct-v0.1,💬,mistralai/Mixtral-8x7B-Instruct-v0.1,72.62,70.22,87.63,71.16,64.58,81.37,60.73,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,3920,TRUE,3de0408ae8b591d9ac516a2384925dd98ebc66f4,TRUE,FALSE,2023-12-11T12:54:17Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,86,88,Mixtral-8x7b-Instruct-v0.1,1114,+0/-0,76142,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ -mpt-30b-chat,🔶,mosaicml/mpt-30b-chat,55.38,58.7,82.54,51.16,52.42,75.3,12.13,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,30,199,TRUE,54f33278a04aa4e612bca482b82f801ab658e890,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-30b-chat,https://huggingface.co/mosaicml/mpt-30b-chat,118,110,MPT-30B-chat,1046,+8/-12,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat -mpt-7b-chat,🔶,mosaicml/mpt-7b-chat,45.39,46.5,75.51,37.62,40.16,68.43,4.09,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,513,TRUE,64e5c9c9fb53a8e89690c2dee75a5add37f7113e,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-7b-chat,https://huggingface.co/mosaicml/mpt-7b-chat,145,143,MPT-7B-Chat,928,+10/-10,4013,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat -nous-hermes-2-mixtral-8x7b-dpo,🔶,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.35,71.08,87.29,72.17,54.83,83.11,71.65,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,383,TRUE,566cdea53950f86eb51dae62812c29e79405cffe,TRUE,FALSE,2024-01-22T08:41:28Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,99,108,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+9/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -nous-hermes-2-mixtral-8x7b-dpo,?,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.12,71.42,87.21,72.28,54.53,82.64,70.66,"",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,383,TRUE,6ba531f1aec62375bf94ad9c7bb064953c4e9868,TRUE,FALSE,2024-06-09T15:01:07Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,99,108,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+9/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO -openchat-3.5-0106,💬,openchat/openchat-3.5-0106,69.3,66.04,82.93,65.04,51.9,81.77,68.16,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,341,TRUE,9619fb7d2a8e25fa6b0633c0f57f7f4aa79b45c4,TRUE,TRUE,2024-01-10T09:45:30Z,openchat/openchat-3.5-0106,https://huggingface.co/openchat/openchat-3.5-0106,98,94,OpenChat-3.5-0106,1091,+5/-5,12975,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 -openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.52,64.93,84.18,63.64,52.24,78.06,26.08,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-17T19:50:31Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,104,97,OpenHermes-2.5-Mistral-7b,1075,+8/-9,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.45,64.93,84.3,63.82,52.31,77.9,25.47,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-14T15:14:43Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,104,97,OpenHermes-2.5-Mistral-7b,1075,+8/-9,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B -phi-3-medium-4k-instruct,🟢,unsloth/Phi-3-medium-4k-instruct,73.57,67.06,85.69,77.85,57.75,72.85,80.21,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,13,23,TRUE,1099cff4ded0cc74fb38a90951c4e21865cddd73,TRUE,TRUE,2024-05-28T06:35:31Z,unsloth/Phi-3-medium-4k-instruct,https://huggingface.co/unsloth/Phi-3-medium-4k-instruct,81,88,Phi-3-Medium-4k-Instruct,1123,+3/-5,26158,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -phi-3-medium-4k-instruct,🔶,microsoft/Phi-3-medium-4k-instruct,73.45,67.32,85.76,77.83,57.71,72.69,79.38,🔶 fine-tuned on domain-specific datasets,Phi3ForCausalLM,Original,bfloat16,TRUE,mit,13,136,TRUE,d27c49ed6abea9167240288dceb4ab6bca855293,TRUE,FALSE,2024-05-27T15:40:50Z,microsoft/Phi-3-medium-4k-instruct,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct,81,88,Phi-3-Medium-4k-Instruct,1123,+3/-5,26158,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct -phi-3-mini-128k-instruct,💬,microsoft/Phi-3-mini-128k-instruct,68.07,63.14,80.09,68.7,54.12,72.85,69.52,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,1355,TRUE,ebee18c488086b396dde649f2aa6548b9b8d2404,TRUE,FALSE,2024-04-25T13:14:03Z,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct,123,121,Phi-3-Mini-128k-Instruct,1037,+4/-3,21632,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ -phi-3-mini-4k-instruct,💬,microsoft/Phi-3-mini-4k-instruct,69.91,62.97,80.6,69.08,59.88,72.38,74.53,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,724,TRUE,b86bcaf57ea4dfdec5dbe12a377028b2fab0d480,TRUE,FALSE,2024-04-26T08:51:19Z,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct,108,115,Phi-3-Mini-4k-Instruct,1066,+5/-4,21126,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -phi-3-mini-4k-instruct,🟢,unsloth/Phi-3-mini-4k-instruct,69.86,62.97,80.61,69.08,59.88,72.69,73.92,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,3,27,TRUE,4caf5ac193b82d28dea55dcbb22aa51d2a3be453,TRUE,TRUE,2024-05-11T07:51:45Z,unsloth/Phi-3-mini-4k-instruct,https://huggingface.co/unsloth/Phi-3-mini-4k-instruct,108,115,Phi-3-Mini-4k-Instruct,1066,+5/-4,21126,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct -qwen1.5-110b-chat,💬,Qwen/Qwen1.5-110B-Chat,68.01,72.01,84.67,78.04,65.86,77.35,30.1,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,110,117,TRUE,5e04700b8091f10a98f1fe0b20c48c10d195ef5f,TRUE,FALSE,2024-04-29T12:55:18Z,Qwen/Qwen1.5-110B-Chat,https://huggingface.co/Qwen/Qwen1.5-110B-Chat,64,62,Qwen1.5-110B-Chat,1161,+4/-4,27486,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ -qwen1.5-14b-chat,🔶,Qwen/Qwen1.5-14B-Chat,62.37,58.79,82.33,68.52,60.38,73.32,30.86,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,float16,TRUE,other,14,99,TRUE,17e11c306ed235e970c9bb8e5f7233527140cdcf,TRUE,FALSE,2024-03-01T12:30:06Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,88,91,Qwen1.5-14B-Chat,1109,+5/-4,18674,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-14b-chat,💬,Qwen/Qwen1.5-14B-Chat,62.27,58.7,82.27,68.57,60.36,73.09,30.63,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,14,99,TRUE,9492b22871f43e975435455f5c616c77fe7a50ec,TRUE,FALSE,2024-05-16T07:47:25Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,88,91,Qwen1.5-14B-Chat,1109,+5/-4,18674,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-32b-chat,💬,Qwen/Qwen1.5-32B-Chat,62.95,66.04,85.49,74.99,66.95,77.19,7.05,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,102,TRUE,0b1785d88bbe93aa90a8a19da8af78eccbf010a6,TRUE,TRUE,2024-04-05T21:01:12Z,Qwen/Qwen1.5-32B-Chat,https://huggingface.co/Qwen/Qwen1.5-32B-Chat,79,82,Qwen1.5-32B-Chat,1125,+3/-4,22763,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ -qwen1.5-4b-chat,💬,Qwen/Qwen1.5-4B-Chat,46.79,43.26,69.73,55.55,44.79,64.96,2.43,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,3,34,TRUE,15bf46b13b1e6b6dd18ff7fa3242af406cc7e791,TRUE,FALSE,2024-02-12T17:13:33Z,Qwen/Qwen1.5-4B-Chat,https://huggingface.co/Qwen/Qwen1.5-4B-Chat,141,137,Qwen1.5-4B-Chat,988,+7/-6,7814,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.98,68.26,86.47,77.46,63.84,78.93,20.92,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,214,TRUE,bc11a298a0c6a5cd737064db62c6ad20ec6331be,TRUE,FALSE,2024-02-17T04:34:39Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,70,66,Qwen1.5-72B-Chat,1147,+3/-3,40647,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.96,68.52,86.42,77.44,63.9,79.08,20.39,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,72,214,TRUE,1a6ccc1215278f962c794b1848c710c29ef4053d,TRUE,FALSE,2024-03-07T14:52:34Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,70,66,Qwen1.5-72B-Chat,1147,+3/-3,40647,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.15,55.89,78.56,61.65,53.54,67.72,13.57,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-12T17:13:18Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,105,110,Qwen1.5-7B-Chat,1070,+10/-7,4864,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.13,55.89,78.56,61.7,53.65,67.8,13.19,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-18T04:43:41Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,105,110,Qwen1.5-7B-Chat,1070,+10/-7,4864,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ -solar-10.7b-instruct-v1.0,?,upstage/SOLAR-10.7B-Instruct-v1.0,74.2,71.08,88.16,66.21,71.43,83.58,64.75,"",LlamaForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,10,591,TRUE,d3167df97a44b8632538b32ee8cd887893ea1435,TRUE,FALSE,2024-06-09T15:01:03Z,upstage/SOLAR-10.7B-Instruct-v1.0,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0,109,110,SOLAR-10.7B-Instruct-v1.0,1062,+9/-9,4286,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 -stablelm-tuned-alpha-7b,🔶,stabilityai/stablelm-tuned-alpha-7b,34.04,31.91,53.59,24.41,40.37,53.12,0.83,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,359,TRUE,25071b093c15c0d1cb2b2876c6deb621b764fcf5,TRUE,TRUE,2023-09-09T10:52:17Z,stabilityai/stablelm-tuned-alpha-7b,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b,153,154,StableLM-Tuned-Alpha-7B,840,+10/-10,3336,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b -starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.13,63.82,84.9,64.67,46.39,80.58,62.4,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,551,TRUE,f721e85293598f2ef774e483ae95343e39811577,FALSE,TRUE,2023-11-30T20:12:15Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,99,103,Starling-LM-7B-alpha,1088,+5/-5,10416,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.05,63.65,84.87,64.7,46.32,80.43,62.32,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,551,TRUE,76e60ca9807f55acd8eff3ec7ae022c5fbdf1e0e,FALSE,TRUE,2023-11-28T06:48:55Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,99,103,Starling-LM-7B-alpha,1088,+5/-5,10416,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha -starling-lm-7b-beta,💬,Nexusflow/Starling-LM-7B-beta,69.88,67.24,83.47,65.14,55.47,81.29,66.64,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,326,TRUE,ee26b7c2cf9db00e1d9a92c9989d5b2a0b891dbd,TRUE,TRUE,2024-03-23T21:12:48Z,Nexusflow/Starling-LM-7B-beta,https://huggingface.co/Nexusflow/Starling-LM-7B-beta,81,98,Starling-LM-7B-beta,1119,+4/-5,16673,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta -tulu-2-dpo-70b,💬,allenai/tulu-2-dpo-70b,73.77,72.1,88.99,69.84,65.78,83.27,62.62,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,68,146,TRUE,0ab5c875f0070d5aee8d36bc55f41de440a13f02,TRUE,TRUE,2024-02-01T13:38:05Z,allenai/tulu-2-dpo-70b,https://huggingface.co/allenai/tulu-2-dpo-70b,91,96,Tulu-2-DPO-70B,1099,+6/-8,6668,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b -vicuna-13b,🔶,eachadea/vicuna-13b,52.3,51.71,79.94,50.84,52.68,71.03,7.58,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",12,0,FALSE,ac4218770a58baaaaf25201076fe082abb6ffd13,TRUE,TRUE,2023-10-16T12:46:18Z,eachadea/vicuna-13b,https://huggingface.co/eachadea/vicuna-13b,123,113,Vicuna-13B,1042,+4/-4,19790,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 -wizardlm-13b-v1.2,🔶,WizardLM/WizardLM-13B-V1.2,54.76,59.04,82.21,54.64,47.27,71.9,13.5,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,"",13,0,FALSE,6760d0c07ffdc2405295ed7a29437cf4dc414bac,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-13B-V1.2,https://huggingface.co/WizardLM/WizardLM-13B-V1.2,114,110,WizardLM-13b-v1.2,1059,+6/-9,7183,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 -wizardlm-70b-v1.0,💬,WizardLM/WizardLM-70B-V1.0,61.25,65.44,84.41,64.05,54.81,80.82,17.97,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,4bit,TRUE,"",70,0,FALSE,6dae38060d70b82dcfe787a612d04aaf0adf0738,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-70B-V1.0,https://huggingface.co/WizardLM/WizardLM-70B-V1.0,89,90,WizardLM-70B-v1.0,1106,+7/-6,8384,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 -yi-1.5-34b-chat,?,01-ai/Yi-1.5-34B-Chat,74.82,70.48,85.97,77.08,62.16,81.61,71.65,"",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,180,TRUE,fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e,TRUE,TRUE,2024-06-09T15:02:51Z,01-ai/Yi-1.5-34B-Chat,https://huggingface.co/01-ai/Yi-1.5-34B-Chat,64,78,Yi-1.5-34B-Chat,1157,+4/-3,25145,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat -yi-34b-chat,💬,01-ai/Yi-34B-Chat,65.32,65.44,84.16,74.9,55.37,80.11,31.92,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-12-04T08:52:11Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,85,94,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -yi-34b-chat,💬,01-ai/Yi-34B-Chat,63.17,65.1,84.08,74.87,55.41,79.79,19.79,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-11-23T10:23:14Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,85,94,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat -zephyr-7b-alpha,🔶,HuggingFaceH4/zephyr-7b-alpha,59.5,61.01,84.04,61.39,57.9,78.61,14.03,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1085,TRUE,2cd2cd16a6ab22585d643cf264fac73b18e7852a,TRUE,TRUE,2023-10-16T12:48:18Z,HuggingFaceH4/zephyr-7b-alpha,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha,119,115,Zephyr-7b-alpha,1041,+11/-11,1814,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.95,62.03,84.36,61.07,57.45,77.74,29.04,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:49Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,117,118,Zephyr-7b-beta,1053,+6/-5,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.59,62.46,84.35,60.7,57.83,77.11,27.07,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,8bit,TRUE,mit,7,1493,TRUE,0f17b36adfbe7d86ea1c591a9efeeae17b313f48,TRUE,TRUE,2023-12-04T06:04:15Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,117,118,Zephyr-7b-beta,1053,+6/-5,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta -zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,59.08,62.03,84.53,61.06,57.44,78.06,11.37,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:38Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,117,118,Zephyr-7b-beta,1053,+6/-5,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +deepseek-llm-67b-chat,💬,deepseek-ai/deepseek-llm-67b-chat,71.79,67.75,86.82,72.42,55.85,84.21,63.68,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2023-12-01T07:45:30Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,106,99,DeepSeek-LLM-67B-Chat,1077,+7/-7,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +deepseek-llm-67b-chat,🔶,deepseek-ai/deepseek-llm-67b-chat,71.52,67.75,86.8,72.19,55.83,84.21,62.32,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,bfloat16,TRUE,other,67,168,TRUE,79648bef7658bb824e4630740f6e1484c1b0620b,TRUE,TRUE,2024-01-19T19:12:01Z,deepseek-ai/deepseek-llm-67b-chat,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat,106,99,DeepSeek-LLM-67B-Chat,1077,+7/-7,4983,DeepSeek AI,DeepSeek License,2023/11,https://huggingface.co/deepseek-ai/deepseek-llm-67b-chat +dolly-v2-12b,🔶,databricks/dolly-v2-12b,39.46,42.41,72.53,25.92,33.83,60.85,1.21,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,mit,12,1943,TRUE,19308160448536e378e3db21a73a751579ee7fdd,TRUE,TRUE,2023-09-09T10:52:17Z,databricks/dolly-v2-12b,https://huggingface.co/databricks/dolly-v2-12b,155,153,Dolly-V2-12B,822,+10/-9,3486,Databricks,MIT,2023/4,https://huggingface.co/databricks/dolly-v2-12b +dolphin-2.2.1-mistral-7b,🔶,cognitivecomputations/dolphin-2.2.1-mistral-7b,65.01,63.23,83.8,63.16,53.14,78.61,48.14,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,187,TRUE,2022924c0bb13588308d429e0b7f51568c07629c,TRUE,TRUE,2023-12-30T19:55:50Z,cognitivecomputations/dolphin-2.2.1-mistral-7b,https://huggingface.co/cognitivecomputations/dolphin-2.2.1-mistral-7b,108,110,Dolphin-2.2.1-Mistral-7B,1062,+16/-13,1713,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,64.93,63.31,83.76,63.17,53.11,78.14,48.07,🔶 fine-tuned on domain-specific datasets,Unknown,Original,bfloat16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-12-02T05:25:26Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,108,110,Dolphin-2.2.1-Mistral-7B,1062,+16/-13,1713,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +dolphin-2.2.1-mistral-7b,🔶,ehartford/dolphin-2.2.1-mistral-7b,60.54,63.48,83.86,63.28,53.17,78.37,21.08,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",7,0,FALSE,001b48e9aebffb395c698af47b6b48364cc3cbe8,TRUE,TRUE,2023-11-15T20:44:49Z,ehartford/dolphin-2.2.1-mistral-7b,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b,108,110,Dolphin-2.2.1-Mistral-7B,1062,+16/-13,1713,Cognitive Computations,Apache-2.0,2023/10,https://huggingface.co/ehartford/dolphin-2.2.1-mistral-7b +gemma-1.1-7b-it,💬,google/gemma-1.1-7b-it,60.09,60.07,76.14,60.92,50.74,69.69,42.99,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,float16,TRUE,gemma,8,251,TRUE,689f62a7dfc06893ea915ca75f1cd26825c76146,TRUE,TRUE,2024-04-11T19:11:38Z,google/gemma-1.1-7b-it,https://huggingface.co/google/gemma-1.1-7b-it,103,97,Gemma-1.1-7B-it,1084,+4/-4,25090,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +gemma-1.1-7b-it,💬,OpenModels4all/gemma-1.1-7b-it,59.78,59.98,76.21,60.39,50.4,69.93,41.77,"💬 chat models (RLHF, DPO, IFT, ...)",GemmaForCausalLM,Original,bfloat16,TRUE,gemma,8,3,TRUE,484670e31c44eededf8c64064eb0207e7af4a2b3,TRUE,TRUE,2024-04-09T09:05:33Z,OpenModels4all/gemma-1.1-7b-it,https://huggingface.co/OpenModels4all/gemma-1.1-7b-it,103,97,Gemma-1.1-7B-it,1084,+4/-4,25090,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-1.1-7b-it +gemma-2b-it,🔶,google/gemma-2b-it,42.75,43.94,62.7,37.65,45.82,60.93,5.46,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,2,566,TRUE,9642e777f24fde593d204a9b2471dce33334e64a,TRUE,TRUE,2024-02-22T13:13:54Z,google/gemma-2b-it,https://huggingface.co/google/gemma-2b-it,141,141,Gemma-2B-it,990,+8/-9,4919,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-2b-it +gemma-7b-it,🔶,google/gemma-7b-it,53.56,51.45,71.96,53.52,47.29,67.96,29.19,🔶 fine-tuned on domain-specific datasets,GemmaForCausalLM,Original,float16,TRUE,gemma,8,1099,TRUE,dec4b13d574762bd36f0a1b75541439bd852b2e8,TRUE,TRUE,2024-02-22T13:13:37Z,google/gemma-7b-it,https://huggingface.co/google/gemma-7b-it,125,123,Gemma-7B-it,1037,+5/-6,9175,Google,Gemma license,2024/2,https://huggingface.co/google/gemma-7b-it +llama-13b,🟢,huggingface/llama-13b,51.36,56.23,80.93,47.67,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,0,FALSE,4022c52fcc7473ce7364bb5ac166195903ea1efb,TRUE,TRUE,2023-10-16T12:48:18Z,huggingface/llama-13b,https://huggingface.co/huggingface/llama-13b,157,154,LLaMA-13B,799,+13/-13,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +llama-13b,🟢,huggyllama/llama-13b,51.33,56.14,80.92,47.61,39.48,76.24,7.58,🟢 pretrained,LlamaForCausalLM,Original,float16,TRUE,other,13,137,TRUE,bf57045473f207bb1de1ed035ace226f4d9f9bba,TRUE,TRUE,2023-09-09T10:52:17Z,huggyllama/llama-13b,https://huggingface.co/huggyllama/llama-13b,157,154,LLaMA-13B,799,+13/-13,2445,Meta,Non-commercial,2023/2,https://arxiv.org/abs/2302.13971 +mistral-7b-instruct-v0.1,💬,mistralai/Mistral-7B-Instruct-v0.1,54.96,54.52,75.63,55.38,56.28,73.72,14.25,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,1456,TRUE,7961f5aa9b736bf8e364b2e6f201190f97a27931,TRUE,TRUE,2023-10-16T12:48:18Z,mistralai/Mistral-7B-Instruct-v0.1,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1,137,135,Mistral-7B-Instruct-v0.1,1008,+6/-6,9143,Mistral,Apache 2.0,2023/9,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1 +mistral-7b-instruct-v0.2,💬,mistralai/Mistral-7B-Instruct-v0.2,65.71,63.14,84.88,60.78,68.26,77.19,40.03,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,2382,TRUE,c72e5d1908b1e2929ec8fc4c8820e9706af1f80f,TRUE,TRUE,2023-12-11T20:10:06Z,mistralai/Mistral-7B-Instruct-v0.2,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2,108,112,Mistral-7B-Instruct-v0.2,1072,+5/-4,20065,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +mistral-7b-instruct-v0.2,💬,dfurman/Mistral-7B-Instruct-v0.2,61.79,60.15,82.79,60.07,56.06,76.87,34.8,"💬 chat models (RLHF, DPO, IFT, ...)",?,Adapter,float16,TRUE,apache-2.0,7,5,TRUE,322faff8bb0c72b772762de7635f5aea9864a24a,TRUE,TRUE,2024-01-02T17:44:20Z,dfurman/Mistral-7B-Instruct-v0.2,https://huggingface.co/dfurman/Mistral-7B-Instruct-v0.2,108,112,Mistral-7B-Instruct-v0.2,1072,+5/-4,20065,Mistral,Apache-2.0,2023/12,https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2 +mixtral-8x22b-instruct-v0.1,💬,mistralai/Mixtral-8x22B-Instruct-v0.1,79.15,72.7,89.08,77.77,68.14,85.16,82.03,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,140,613,TRUE,eb69dca9c68bbdcffd5f522f632d5c04ab6c65b3,TRUE,FALSE,2024-04-17T15:30:22Z,mistralai/Mixtral-8x22B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1,72,68,Mixtral-8x22b-Instruct-v0.1,1147,+3/-3,53841,Mistral,Apache 2.0,2024/4,https://mistral.ai/news/mixtral-8x22b/ +mixtral-8x7b-instruct-v0.1,🔶,mistralai/Mixtral-8x7B-Instruct-v0.1,72.7,70.14,87.55,71.4,64.98,81.06,61.11,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,3920,TRUE,125c431e2ff41a156b9f9076f744d2f35dd6e67a,TRUE,FALSE,2024-01-01T02:10:03Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,89,91,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76141,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mixtral-8x7b-instruct-v0.1,💬,mistralai/Mixtral-8x7B-Instruct-v0.1,72.62,70.22,87.63,71.16,64.58,81.37,60.73,"💬 chat models (RLHF, DPO, IFT, ...)",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,3920,TRUE,3de0408ae8b591d9ac516a2384925dd98ebc66f4,TRUE,FALSE,2023-12-11T12:54:17Z,mistralai/Mixtral-8x7B-Instruct-v0.1,https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1,89,91,Mixtral-8x7B-Instruct-v0.1,1114,+0/-0,76141,Mistral,Apache 2.0,2023/12,https://mistral.ai/news/mixtral-of-experts/ +mpt-30b-chat,🔶,mosaicml/mpt-30b-chat,55.38,58.7,82.54,51.16,52.42,75.3,12.13,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,30,199,TRUE,54f33278a04aa4e612bca482b82f801ab658e890,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-30b-chat,https://huggingface.co/mosaicml/mpt-30b-chat,120,112,MPT-30B-chat,1045,+9/-10,2649,MosaicML,CC-BY-NC-SA-4.0,2023/6,https://huggingface.co/mosaicml/mpt-30b-chat +mpt-7b-chat,🔶,mosaicml/mpt-7b-chat,45.39,46.5,75.51,37.62,40.16,68.43,4.09,🔶 fine-tuned on domain-specific datasets,MPTForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,513,TRUE,64e5c9c9fb53a8e89690c2dee75a5add37f7113e,TRUE,TRUE,2023-09-09T10:52:17Z,mosaicml/mpt-7b-chat,https://huggingface.co/mosaicml/mpt-7b-chat,147,145,MPT-7B-Chat,928,+9/-10,4013,MosaicML,CC-BY-NC-SA-4.0,2023/5,https://huggingface.co/mosaicml/mpt-7b-chat +nous-hermes-2-mixtral-8x7b-dpo,🔶,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.35,71.08,87.29,72.17,54.83,83.11,71.65,🔶 fine-tuned on domain-specific datasets,MixtralForCausalLM,Original,float16,TRUE,apache-2.0,46,383,TRUE,566cdea53950f86eb51dae62812c29e79405cffe,TRUE,FALSE,2024-01-22T08:41:28Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,102,110,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +nous-hermes-2-mixtral-8x7b-dpo,?,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,73.12,71.42,87.21,72.28,54.53,82.64,70.66,"",MixtralForCausalLM,Original,bfloat16,TRUE,apache-2.0,46,383,TRUE,6ba531f1aec62375bf94ad9c7bb064953c4e9868,TRUE,FALSE,2024-06-09T15:01:07Z,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,102,110,Nous-Hermes-2-Mixtral-8x7B-DPO,1084,+8/-8,3836,NousResearch,Apache-2.0,2024/1,https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO +openchat-3.5-0106,💬,openchat/openchat-3.5-0106,69.3,66.04,82.93,65.04,51.9,81.77,68.16,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,341,TRUE,9619fb7d2a8e25fa6b0633c0f57f7f4aa79b45c4,TRUE,TRUE,2024-01-10T09:45:30Z,openchat/openchat-3.5-0106,https://huggingface.co/openchat/openchat-3.5-0106,101,95,OpenChat-3.5-0106,1091,+5/-4,12973,OpenChat,Apache-2.0,2024/1,https://huggingface.co/openchat/openchat-3.5-0106 +openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.52,64.93,84.18,63.64,52.24,78.06,26.08,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-17T19:50:31Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,107,98,OpenHermes-2.5-Mistral-7B,1074,+8/-7,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +openhermes-2.5-mistral-7b,🔶,teknium/OpenHermes-2.5-Mistral-7B,61.45,64.93,84.3,63.82,52.31,77.9,25.47,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,787,TRUE,2a54cad766bc90828354db5c4199795aecfd0df1,TRUE,TRUE,2023-11-14T15:14:43Z,teknium/OpenHermes-2.5-Mistral-7B,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B,107,98,OpenHermes-2.5-Mistral-7B,1074,+8/-7,5092,NousResearch,Apache-2.0,2023/11,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B +phi-3-medium-4k-instruct,🟢,unsloth/Phi-3-medium-4k-instruct,73.57,67.06,85.69,77.85,57.75,72.85,80.21,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,13,23,TRUE,1099cff4ded0cc74fb38a90951c4e21865cddd73,TRUE,TRUE,2024-05-28T06:35:31Z,unsloth/Phi-3-medium-4k-instruct,https://huggingface.co/unsloth/Phi-3-medium-4k-instruct,82,90,Phi-3-Medium-4k-Instruct,1123,+3/-3,26149,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +phi-3-medium-4k-instruct,🔶,microsoft/Phi-3-medium-4k-instruct,73.45,67.32,85.76,77.83,57.71,72.69,79.38,🔶 fine-tuned on domain-specific datasets,Phi3ForCausalLM,Original,bfloat16,TRUE,mit,13,136,TRUE,d27c49ed6abea9167240288dceb4ab6bca855293,TRUE,FALSE,2024-05-27T15:40:50Z,microsoft/Phi-3-medium-4k-instruct,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct,82,90,Phi-3-Medium-4k-Instruct,1123,+3/-3,26149,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-medium-4k-instruct +phi-3-mini-128k-instruct,💬,microsoft/Phi-3-mini-128k-instruct,68.07,63.14,80.09,68.7,54.12,72.85,69.52,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,1355,TRUE,ebee18c488086b396dde649f2aa6548b9b8d2404,TRUE,FALSE,2024-04-25T13:14:03Z,microsoft/Phi-3-mini-128k-instruct,https://huggingface.co/microsoft/Phi-3-mini-128k-instruct,125,122,Phi-3-Mini-128k-Instruct,1037,+4/-4,21621,Microsoft,MIT,2023/10,https://azure.microsoft.com/en-us/blog/introducing-phi-3-redefining-whats-possible-with-slms/ +phi-3-mini-4k-instruct,💬,microsoft/Phi-3-mini-4k-instruct,69.91,62.97,80.6,69.08,59.88,72.38,74.53,"💬 chat models (RLHF, DPO, IFT, ...)",Unknown,Original,float16,TRUE,mit,3,724,TRUE,b86bcaf57ea4dfdec5dbe12a377028b2fab0d480,TRUE,FALSE,2024-04-26T08:51:19Z,microsoft/Phi-3-mini-4k-instruct,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct,112,117,Phi-3-Mini-4k-Instruct,1066,+4/-6,21119,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +phi-3-mini-4k-instruct,🟢,unsloth/Phi-3-mini-4k-instruct,69.86,62.97,80.61,69.08,59.88,72.69,73.92,🟢 pretrained,MistralForCausalLM,Original,bfloat16,TRUE,mit,3,27,TRUE,4caf5ac193b82d28dea55dcbb22aa51d2a3be453,TRUE,TRUE,2024-05-11T07:51:45Z,unsloth/Phi-3-mini-4k-instruct,https://huggingface.co/unsloth/Phi-3-mini-4k-instruct,112,117,Phi-3-Mini-4k-Instruct,1066,+4/-6,21119,Microsoft,MIT,2023/10,https://huggingface.co/microsoft/Phi-3-mini-4k-instruct +qwen1.5-110b-chat,💬,Qwen/Qwen1.5-110B-Chat,68.01,72.01,84.67,78.04,65.86,77.35,30.1,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,110,117,TRUE,5e04700b8091f10a98f1fe0b20c48c10d195ef5f,TRUE,FALSE,2024-04-29T12:55:18Z,Qwen/Qwen1.5-110B-Chat,https://huggingface.co/Qwen/Qwen1.5-110B-Chat,66,64,Qwen1.5-110B-Chat,1161,+4/-4,27474,Alibaba,Qianwen LICENSE,2024/4,https://qwenlm.github.io/blog/qwen1.5-110b/ +qwen1.5-14b-chat,🔶,Qwen/Qwen1.5-14B-Chat,62.37,58.79,82.33,68.52,60.38,73.32,30.86,🔶 fine-tuned on domain-specific datasets,Qwen2ForCausalLM,Original,float16,TRUE,other,14,99,TRUE,17e11c306ed235e970c9bb8e5f7233527140cdcf,TRUE,FALSE,2024-03-01T12:30:06Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,91,93,Qwen1.5-14B-Chat,1109,+5/-4,18669,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-14b-chat,💬,Qwen/Qwen1.5-14B-Chat,62.27,58.7,82.27,68.57,60.36,73.09,30.63,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,14,99,TRUE,9492b22871f43e975435455f5c616c77fe7a50ec,TRUE,FALSE,2024-05-16T07:47:25Z,Qwen/Qwen1.5-14B-Chat,https://huggingface.co/Qwen/Qwen1.5-14B-Chat,91,93,Qwen1.5-14B-Chat,1109,+5/-4,18669,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-32b-chat,💬,Qwen/Qwen1.5-32B-Chat,62.95,66.04,85.49,74.99,66.95,77.19,7.05,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,32,102,TRUE,0b1785d88bbe93aa90a8a19da8af78eccbf010a6,TRUE,TRUE,2024-04-05T21:01:12Z,Qwen/Qwen1.5-32B-Chat,https://huggingface.co/Qwen/Qwen1.5-32B-Chat,81,84,Qwen1.5-32B-Chat,1125,+5/-3,22760,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5-32b/ +qwen1.5-4b-chat,💬,Qwen/Qwen1.5-4B-Chat,46.79,43.26,69.73,55.55,44.79,64.96,2.43,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,3,34,TRUE,15bf46b13b1e6b6dd18ff7fa3242af406cc7e791,TRUE,FALSE,2024-02-12T17:13:33Z,Qwen/Qwen1.5-4B-Chat,https://huggingface.co/Qwen/Qwen1.5-4B-Chat,143,139,Qwen1.5-4B-Chat,988,+6/-6,7812,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.98,68.26,86.47,77.46,63.84,78.93,20.92,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,72,214,TRUE,bc11a298a0c6a5cd737064db62c6ad20ec6331be,TRUE,FALSE,2024-02-17T04:34:39Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,72,68,Qwen1.5-72B-Chat,1147,+3/-3,40646,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-72b-chat,💬,Qwen/Qwen1.5-72B-Chat,65.96,68.52,86.42,77.44,63.9,79.08,20.39,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,72,214,TRUE,1a6ccc1215278f962c794b1848c710c29ef4053d,TRUE,FALSE,2024-03-07T14:52:34Z,Qwen/Qwen1.5-72B-Chat,https://huggingface.co/Qwen/Qwen1.5-72B-Chat,72,68,Qwen1.5-72B-Chat,1147,+3/-3,40646,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.15,55.89,78.56,61.65,53.54,67.72,13.57,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,float16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-12T17:13:18Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,108,112,Qwen1.5-7B-Chat,1070,+8/-9,4865,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +qwen1.5-7b-chat,💬,Qwen/Qwen1.5-7B-Chat,55.13,55.89,78.56,61.7,53.65,67.8,13.19,"💬 chat models (RLHF, DPO, IFT, ...)",Qwen2ForCausalLM,Original,bfloat16,TRUE,other,7,153,TRUE,0addb6bfd79e59bce8f61ed60cdafd906c04d447,TRUE,FALSE,2024-02-18T04:43:41Z,Qwen/Qwen1.5-7B-Chat,https://huggingface.co/Qwen/Qwen1.5-7B-Chat,108,112,Qwen1.5-7B-Chat,1070,+8/-9,4865,Alibaba,Qianwen LICENSE,2024/2,https://qwenlm.github.io/blog/qwen1.5/ +solar-10.7b-instruct-v1.0,?,upstage/SOLAR-10.7B-Instruct-v1.0,74.2,71.08,88.16,66.21,71.43,83.58,64.75,"",LlamaForCausalLM,Original,float16,TRUE,cc-by-nc-4.0,10,591,TRUE,d3167df97a44b8632538b32ee8cd887893ea1435,TRUE,FALSE,2024-06-09T15:01:03Z,upstage/SOLAR-10.7B-Instruct-v1.0,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0,110,112,SOLAR-10.7B-Instruct-v1.0,1062,+9/-8,4287,Upstage AI,CC-BY-NC-4.0,2023/11,https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0 +stablelm-tuned-alpha-7b,🔶,stabilityai/stablelm-tuned-alpha-7b,34.04,31.91,53.59,24.41,40.37,53.12,0.83,🔶 fine-tuned on domain-specific datasets,GPTNeoXForCausalLM,Original,float16,TRUE,cc-by-nc-sa-4.0,7,359,TRUE,25071b093c15c0d1cb2b2876c6deb621b764fcf5,TRUE,TRUE,2023-09-09T10:52:17Z,stabilityai/stablelm-tuned-alpha-7b,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b,155,155,StableLM-Tuned-Alpha-7B,840,+12/-11,3336,Stability AI,CC-BY-NC-SA-4.0,2023/4,https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b +starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.13,63.82,84.9,64.67,46.39,80.58,62.4,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,apache-2.0,7,551,TRUE,f721e85293598f2ef774e483ae95343e39811577,FALSE,TRUE,2023-11-30T20:12:15Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,101,103,Starling-LM-7B-alpha,1088,+6/-5,10415,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +starling-lm-7b-alpha,🔶,berkeley-nest/Starling-LM-7B-alpha,67.05,63.65,84.87,64.7,46.32,80.43,62.32,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,551,TRUE,76e60ca9807f55acd8eff3ec7ae022c5fbdf1e0e,FALSE,TRUE,2023-11-28T06:48:55Z,berkeley-nest/Starling-LM-7B-alpha,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha,101,103,Starling-LM-7B-alpha,1088,+6/-5,10415,UC Berkeley,CC-BY-NC-4.0,2023/11,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha +starling-lm-7b-beta,💬,Nexusflow/Starling-LM-7B-beta,69.88,67.24,83.47,65.14,55.47,81.29,66.64,"💬 chat models (RLHF, DPO, IFT, ...)",MistralForCausalLM,Original,bfloat16,TRUE,apache-2.0,7,326,TRUE,ee26b7c2cf9db00e1d9a92c9989d5b2a0b891dbd,TRUE,TRUE,2024-03-23T21:12:48Z,Nexusflow/Starling-LM-7B-beta,https://huggingface.co/Nexusflow/Starling-LM-7B-beta,83,99,Starling-LM-7B-beta,1119,+4/-4,16670,Nexusflow,Apache-2.0,2024/3,https://huggingface.co/Nexusflow/Starling-LM-7B-beta +tulu-2-dpo-70b,💬,allenai/tulu-2-dpo-70b,73.77,72.1,88.99,69.84,65.78,83.27,62.62,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,other,68,146,TRUE,0ab5c875f0070d5aee8d36bc55f41de440a13f02,TRUE,TRUE,2024-02-01T13:38:05Z,allenai/tulu-2-dpo-70b,https://huggingface.co/allenai/tulu-2-dpo-70b,94,99,Tulu-2-DPO-70B,1099,+6/-7,6666,AllenAI/UW,AI2 ImpACT Low-risk,2023/11,https://huggingface.co/allenai/tulu-2-dpo-70b +vicuna-13b,🔶,eachadea/vicuna-13b,52.3,51.71,79.94,50.84,52.68,71.03,7.58,🔶 fine-tuned on domain-specific datasets,Unknown,Original,float16,TRUE,"",12,0,FALSE,ac4218770a58baaaaf25201076fe082abb6ffd13,TRUE,TRUE,2023-10-16T12:46:18Z,eachadea/vicuna-13b,https://huggingface.co/eachadea/vicuna-13b,124,115,Vicuna-13B,1042,+4/-5,19788,LMSYS,Llama 2 Community,2023/7,https://huggingface.co/lmsys/vicuna-13b-v1.5 +wizardlm-13b-v1.2,🔶,WizardLM/WizardLM-13B-V1.2,54.76,59.04,82.21,54.64,47.27,71.9,13.5,🔶 fine-tuned on domain-specific datasets,LlamaForCausalLM,Original,float16,TRUE,"",13,0,FALSE,6760d0c07ffdc2405295ed7a29437cf4dc414bac,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-13B-V1.2,https://huggingface.co/WizardLM/WizardLM-13B-V1.2,115,112,WizardLM-13b-v1.2,1058,+8/-7,7185,Microsoft,Llama 2 Community,2023/7,https://huggingface.co/WizardLM/WizardLM-13B-V1.2 +wizardlm-70b-v1.0,💬,WizardLM/WizardLM-70B-V1.0,61.25,65.44,84.41,64.05,54.81,80.82,17.97,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,4bit,TRUE,"",70,0,FALSE,6dae38060d70b82dcfe787a612d04aaf0adf0738,TRUE,TRUE,2023-09-09T10:52:17Z,WizardLM/WizardLM-70B-V1.0,https://huggingface.co/WizardLM/WizardLM-70B-V1.0,91,92,WizardLM-70B-v1.0,1106,+7/-6,8382,Microsoft,Llama 2 Community,2023/8,https://huggingface.co/WizardLM/WizardLM-70B-V1.0 +yi-1.5-34b-chat,?,01-ai/Yi-1.5-34B-Chat,74.82,70.48,85.97,77.08,62.16,81.61,71.65,"",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,180,TRUE,fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e,TRUE,TRUE,2024-06-09T15:02:51Z,01-ai/Yi-1.5-34B-Chat,https://huggingface.co/01-ai/Yi-1.5-34B-Chat,68,80,Yi-1.5-34B-Chat,1157,+3/-3,25143,01 AI,Apache-2.0,2024/5,https://huggingface.co/01-ai/Yi-1.5-34B-Chat +yi-34b-chat,💬,01-ai/Yi-34B-Chat,65.32,65.44,84.16,74.9,55.37,80.11,31.92,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,bfloat16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-12-04T08:52:11Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,87,96,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +yi-34b-chat,💬,01-ai/Yi-34B-Chat,63.17,65.1,84.08,74.87,55.41,79.79,19.79,"💬 chat models (RLHF, DPO, IFT, ...)",LlamaForCausalLM,Original,float16,TRUE,apache-2.0,34,332,TRUE,a99ec35331cbfc9da596af7d4538fe2efecff03c,TRUE,FALSE,2023-11-23T10:23:14Z,01-ai/Yi-34B-Chat,https://huggingface.co/01-ai/Yi-34B-Chat,87,96,Yi-34B-Chat,1111,+5/-5,15928,01 AI,Yi License,2023/6,https://huggingface.co/01-ai/Yi-34B-Chat +zephyr-7b-alpha,🔶,HuggingFaceH4/zephyr-7b-alpha,59.5,61.01,84.04,61.39,57.9,78.61,14.03,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1085,TRUE,2cd2cd16a6ab22585d643cf264fac73b18e7852a,TRUE,TRUE,2023-10-16T12:48:18Z,HuggingFaceH4/zephyr-7b-alpha,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha,121,117,Zephyr-7B-alpha,1041,+11/-12,1813,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.95,62.03,84.36,61.07,57.45,77.74,29.04,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,bfloat16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:49Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,120,120,Zephyr-7B-beta,1053,+6/-7,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,61.59,62.46,84.35,60.7,57.83,77.11,27.07,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,8bit,TRUE,mit,7,1493,TRUE,0f17b36adfbe7d86ea1c591a9efeeae17b313f48,TRUE,TRUE,2023-12-04T06:04:15Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,120,120,Zephyr-7B-beta,1053,+6/-7,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta +zephyr-7b-beta,🔶,HuggingFaceH4/zephyr-7b-beta,59.08,62.03,84.53,61.06,57.44,78.06,11.37,🔶 fine-tuned on domain-specific datasets,MistralForCausalLM,Original,float16,TRUE,mit,7,1493,TRUE,8af01af3d4f9dc9b962447180d6d0f8c5315da86,TRUE,TRUE,2023-11-16T02:50:38Z,HuggingFaceH4/zephyr-7b-beta,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta,120,120,Zephyr-7B-beta,1053,+6/-7,11327,HuggingFace,MIT,2023/10,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta