From 5f3b1b953f039876f79790696ccd888c730d24b0 Mon Sep 17 00:00:00 2001 From: Yagil Burowski Date: Mon, 5 Feb 2024 11:16:14 -0500 Subject: [PATCH 1/2] Qwen/Qwen1.5 --- models/qwen-1.5.json | 59 ++++++++++++++++++++++++++++++++++++++++++++ schema.json | 6 ++--- 2 files changed, 62 insertions(+), 3 deletions(-) create mode 100644 models/qwen-1.5.json diff --git a/models/qwen-1.5.json b/models/qwen-1.5.json new file mode 100644 index 0000000..1f4648e --- /dev/null +++ b/models/qwen-1.5.json @@ -0,0 +1,59 @@ +{ + "_descriptorVersion": "0.0.1", + "datePublished": "2024-02-03T11:59:54", + "name": "Qwen 1.5", + "description": "Qwen1.5 is the large language model series developed by Qwen Team, Alibaba Group. It is a transformer-based decoder-only language model pretrained on large-scale multilingual data covering a wide range of domains and it is aligned with human preferences.", + "author": { + "name": "Qwen Team, Alibaba Group", + "url": "https://huggingface.co/Qwen", + "blurb": "Qwen (abbr. for Tongyi Qianwen 通义千问) refers to the large language model family built by Alibaba Cloud" + }, + "numParameters": "7B", + "resources": { + "canonicalUrl": "https://github.com/QwenLM/Qwen1.5", + "paperUrl": "https://qwenlm.github.io/blog/qwen1.5/", + "downloadUrl": "https://huggingface.co/Qwen/Qwen1.5-7B-Chat-GGUF" + }, + "trainedFor": "chat", + "arch": "qwen2", + "files": { + "highlighted": { + "most_capable": { + "name": "qwen1_5-7b-chat-q5_k_m.gguf" + }, + "economical": { + "name": "qwen2-beta-0_5b-chat-q8_0.gguf" + } + }, + "all": [ + { + "name": "qwen1_5-7b-chat-q5_k_m.gguf", + "url": "https://huggingface.co/Qwen/Qwen1.5-7B-Chat-GGUF/resolve/main/qwen1_5-7b-chat-q5_k_m.gguf", + "sizeBytes": 5530664096, + "quantization": "Q5_K_M", + "format": "gguf", + "sha256checksum": "758799c9db5ab1cf2ab56f6bd0b529463d9dd0067f8cb594b853cc4053270aa1", + "publisher": { + "name": "Qwen", + "socialUrl": "https://huggingface.co/Qwen" + }, + "respository": "Qwen/Qwen1.5-7B-Chat-GGUF", + 
"repositoryUrl": "https://huggingface.co/Qwen/Qwen1.5-7B-Chat-GGUF" + }, + { + "name": "qwen2-beta-0_5b-chat-q8_0.gguf", + "url": "https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat-GGUF/resolve/main/phi-2.Q6_K.gguf", + "sizeBytes": 664602400, + "quantization": "Q8_0", + "format": "gguf", + "sha256checksum": "8373c4479c0bf038b8000eb2f560906c5f81ad78a3662af2748e6a90c3d9727b", + "publisher": { + "name": "Qwen", + "socialUrl": "https://huggingface.co/Qwen" + }, + "respository": "Qwen/Qwen1.5-0.5B-Chat-GGUF", + "repositoryUrl": "https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat-GGUF" + } + ] + } + } diff --git a/schema.json b/schema.json index f486e4a..12cf4e7 100644 --- a/schema.json +++ b/schema.json @@ -51,7 +51,7 @@ }, "numParameters": { "type": "string", - "enum": ["3B", "6.7B", "7B", "13B", "15B", "30B", "65B", "unknown"] + "enum": ["1.5B", "3B", "4B", "6.7B", "7B", "13B", "15B", "30B", "65B", "unknown"] }, "trainedFor": { "type": "string", @@ -59,7 +59,7 @@ }, "arch": { "type": "string", - "enum": ["llama", "pythia", "gpt-neo-x", "gpt-j", "mpt", "replit", "starcoder", "falcon", "mistral", "stablelm", "phi2"] + "enum": ["llama", "pythia", "gpt-neo-x", "gpt-j", "mpt", "replit", "starcoder", "falcon", "mistral", "stablelm", "phi2", "qwen2"] }, "description": { "type": "string" @@ -118,7 +118,7 @@ }, "quantization": { "type": "string", - "enum": ["q4_0", "q4_1", "q5_0", "q5_1", "q8_0", "Q2_K", "Q3_K_S", "Q3_K_M", "Q4_K_S", "Q4_K_M", "Q5_K_S", "Q5_K_M", "Q6_K", "unknown"] + "enum": ["q4_0", "q4_1", "q5_0", "q5_1", "q8_0", "Q8_0", "Q2_K", "Q3_K_S", "Q3_K_M", "Q4_K_S", "Q4_K_M", "Q5_K_S", "Q5_K_M", "Q6_K", "unknown"] }, "format": { "type": "string" From 354285d7aa0acbaa71bad40278fefe269eed0288 Mon Sep 17 00:00:00 2001 From: Yagil Burowski Date: Mon, 5 Feb 2024 11:19:07 -0500 Subject: [PATCH 2/2] 7B only --- models/qwen-1.5.json | 17 ----------------- 1 file changed, 17 deletions(-) diff --git a/models/qwen-1.5.json b/models/qwen-1.5.json index 1f4648e..555a8c6 100644 --- 
a/models/qwen-1.5.json +++ b/models/qwen-1.5.json @@ -20,9 +20,6 @@ "highlighted": { "most_capable": { "name": "qwen1_5-7b-chat-q5_k_m.gguf" - }, - "economical": { - "name": "qwen2-beta-0_5b-chat-q8_0.gguf" } }, "all": [ @@ -39,20 +36,6 @@ }, "respository": "Qwen/Qwen1.5-7B-Chat-GGUF", "repositoryUrl": "https://huggingface.co/Qwen/Qwen1.5-7B-Chat-GGUF" - }, - { - "name": "qwen2-beta-0_5b-chat-q8_0.gguf", - "url": "https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat-GGUF/resolve/main/phi-2.Q6_K.gguf", - "sizeBytes": 664602400, - "quantization": "Q8_0", - "format": "gguf", - "sha256checksum": "8373c4479c0bf038b8000eb2f560906c5f81ad78a3662af2748e6a90c3d9727b", - "publisher": { - "name": "Qwen", - "socialUrl": "https://huggingface.co/Qwen" - }, - "respository": "Qwen/Qwen1.5-0.5B-Chat-GGUF", - "repositoryUrl": "https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat-GGUF" } ] }