@@ -79,6 +79,20 @@ export enum ModelFamily {
7979 DEEPSEEK = "DeepSeek" ,
8080}
8181
82+ const qwen3_common_configs = { // Fields shared by the Qwen3 entries in DEFAULT_MODEL_BASES; each entry supplies its own `name` and spreads this object.
83+ display_name : "Qwen" ,
84+ provider : "Alibaba" ,
85+ family : ModelFamily . QWEN ,
86+ // The sampling values below are the recommended settings for non-thinking mode.
87+ // For thinking mode, see webllm.ts, which applies temperature=0.6 and top_p=0.95.
88+ recommended_config : { // Object spread is shallow, so every entry that spreads this constant references this same nested object.
89+ temperature : 0.7 ,
90+ presence_penalty : 0 ,
91+ frequency_penalty : 0 ,
92+ top_p : 0.8 ,
93+ } ,
94+ } ;
95+
8296const DEFAULT_MODEL_BASES : ModelRecord [ ] = [
8397 // Phi-3.5 Vision
8498 {
@@ -410,6 +424,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
410424 top_p : 1 ,
411425 } ,
412426 } ,
427+ // Mistral
413428 {
414429 name : "Mistral-7B-Instruct-v0.3-q4f16_1-MLC" ,
415430 display_name : "Mistral" ,
@@ -464,6 +479,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
464479 top_p : 0.95 ,
465480 } ,
466481 } ,
482+ // WizardMath
467483 {
468484 name : "WizardMath-7B-V1.1-q4f16_1-MLC" ,
469485 display_name : "WizardMath" ,
@@ -571,20 +587,50 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
571587 top_p : 1 ,
572588 } ,
573589 } ,
590+ // Qwen3
574591 {
575- name : "Qwen2.5-0.5B-Instruct-q4f16_1-MLC" ,
576- display_name : "Qwen" ,
577- provider : "Alibaba" ,
578- family : ModelFamily . QWEN ,
579- recommended_config : {
580- temperature : 0.7 ,
581- presence_penalty : 0 ,
582- frequency_penalty : 0 ,
583- top_p : 0.8 ,
584- } ,
592+ name : "Qwen3-0.6B-q4f16_1-MLC" ,
593+ ...qwen3_common_configs ,
585594 } ,
586595 {
587- name : "Qwen2.5-0.5B-Instruct-q4f32_1-MLC" ,
596+ name : "Qwen3-0.6B-q4f32_1-MLC" ,
597+ ...qwen3_common_configs ,
598+ } ,
599+ {
600+ name : "Qwen3-0.6B-q0f16-MLC" ,
601+ ...qwen3_common_configs ,
602+ } ,
603+ {
604+ name : "Qwen3-0.6B-q0f32-MLC" ,
605+ ...qwen3_common_configs ,
606+ } ,
607+ {
608+ name : "Qwen3-1.7B-q4f16_1-MLC" ,
609+ ...qwen3_common_configs ,
610+ } ,
611+ {
612+ name : "Qwen3-1.7B-q4f32_1-MLC" ,
613+ ...qwen3_common_configs ,
614+ } ,
615+ {
616+ name : "Qwen3-4B-q4f16_1-MLC" ,
617+ ...qwen3_common_configs ,
618+ } ,
619+ {
620+ name : "Qwen3-4B-q4f32_1-MLC" ,
621+ ...qwen3_common_configs ,
622+ } ,
623+ {
624+ name : "Qwen3-8B-q4f16_1-MLC" ,
625+ ...qwen3_common_configs ,
626+ } ,
627+ {
628+ name : "Qwen3-8B-q4f32_1-MLC" ,
629+ ...qwen3_common_configs ,
630+ } ,
631+ // Qwen2.5
632+ {
633+ name : "Qwen2.5-0.5B-Instruct-q4f16_1-MLC" ,
588634 display_name : "Qwen" ,
589635 provider : "Alibaba" ,
590636 family : ModelFamily . QWEN ,
@@ -596,7 +642,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
596642 } ,
597643 } ,
598644 {
599- name : "Qwen2.5-0.5B-Instruct-q4f16_1 -MLC" ,
645+ name : "Qwen2.5-0.5B-Instruct-q4f32_1 -MLC" ,
600646 display_name : "Qwen" ,
601647 provider : "Alibaba" ,
602648 family : ModelFamily . QWEN ,
@@ -873,6 +919,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
873919 top_p : 0.8 ,
874920 } ,
875921 } ,
922+ // Gemma 2
876923 {
877924 name : "gemma-2-2b-it-q4f16_1-MLC" ,
878925 display_name : "Gemma" ,
@@ -969,6 +1016,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
9691016 top_p : 0.9 ,
9701017 } ,
9711018 } ,
1019+ // StableLM
9721020 {
9731021 name : "stablelm-2-zephyr-1_6b-q4f16_1-MLC" ,
9741022 display_name : "StableLM" ,
@@ -1017,6 +1065,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
10171065 top_p : 0.95 ,
10181066 } ,
10191067 } ,
1068+ // RedPajama
10201069 {
10211070 name : "RedPajama-INCITE-Chat-3B-v1-q4f16_1-MLC" ,
10221071 display_name : "RedPajama" ,
@@ -1057,6 +1106,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
10571106 top_p : 0.95 ,
10581107 } ,
10591108 } ,
1109+ // TinyLlama
10601110 {
10611111 name : "TinyLlama-1.1B-Chat-v1.0-q4f16_1-MLC" ,
10621112 display_name : "TinyLlama" ,
@@ -1105,6 +1155,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
11051155 top_p : 1 ,
11061156 } ,
11071157 } ,
1158+ // Older models
11081159 {
11091160 name : "Llama-3.1-70B-Instruct-q3f16_1-MLC" ,
11101161 display_name : "Llama" ,
0 commit comments