@@ -79,6 +79,20 @@ export enum ModelFamily {
79
79
DEEPSEEK = "DeepSeek" ,
80
80
}
81
81
82
// Shared fields for the Qwen3 records: each Qwen3 entry in DEFAULT_MODEL_BASES supplies its own `name` and then spreads this object.
+ const qwen3_common_configs = {
83
+ display_name : "Qwen" ,
84
+ provider : "Alibaba" ,
85
+ family : ModelFamily . QWEN ,
86
+ // The recommended_config below holds the sampling defaults for non-thinking mode.
87
+ // Thinking mode uses temperature=0.6 and top_p=0.95 instead; those values are applied in webllm.ts, not here.
88
+ recommended_config : {
89
+ temperature : 0.7 ,
90
+ presence_penalty : 0 ,
91
+ frequency_penalty : 0 ,
92
+ top_p : 0.8 ,
93
+ } ,
94
+ } ;
95
+
82
96
const DEFAULT_MODEL_BASES : ModelRecord [ ] = [
83
97
// Phi-3.5 Vision
84
98
{
@@ -410,6 +424,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
410
424
top_p : 1 ,
411
425
} ,
412
426
} ,
427
+ // Mistral
413
428
{
414
429
name : "Mistral-7B-Instruct-v0.3-q4f16_1-MLC" ,
415
430
display_name : "Mistral" ,
@@ -464,6 +479,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
464
479
top_p : 0.95 ,
465
480
} ,
466
481
} ,
482
+ // WizardMath
467
483
{
468
484
name : "WizardMath-7B-V1.1-q4f16_1-MLC" ,
469
485
display_name : "WizardMath" ,
@@ -571,20 +587,50 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
571
587
top_p : 1 ,
572
588
} ,
573
589
} ,
590
+ // Qwen3
574
591
{
575
- name : "Qwen2.5-0.5B-Instruct-q4f16_1-MLC" ,
576
- display_name : "Qwen" ,
577
- provider : "Alibaba" ,
578
- family : ModelFamily . QWEN ,
579
- recommended_config : {
580
- temperature : 0.7 ,
581
- presence_penalty : 0 ,
582
- frequency_penalty : 0 ,
583
- top_p : 0.8 ,
584
- } ,
592
+ name : "Qwen3-0.6B-q4f16_1-MLC" ,
593
+ ...qwen3_common_configs ,
585
594
} ,
586
595
{
587
- name : "Qwen2.5-0.5B-Instruct-q4f32_1-MLC" ,
596
+ name : "Qwen3-0.6B-q4f32_1-MLC" ,
597
+ ...qwen3_common_configs ,
598
+ } ,
599
+ {
600
+ name : "Qwen3-0.6B-q0f16-MLC" ,
601
+ ...qwen3_common_configs ,
602
+ } ,
603
+ {
604
+ name : "Qwen3-0.6B-q0f32-MLC" ,
605
+ ...qwen3_common_configs ,
606
+ } ,
607
+ {
608
+ name : "Qwen3-1.7B-q4f16_1-MLC" ,
609
+ ...qwen3_common_configs ,
610
+ } ,
611
+ {
612
+ name : "Qwen3-1.7B-q4f32_1-MLC" ,
613
+ ...qwen3_common_configs ,
614
+ } ,
615
+ {
616
+ name : "Qwen3-4B-q4f16_1-MLC" ,
617
+ ...qwen3_common_configs ,
618
+ } ,
619
+ {
620
+ name : "Qwen3-4B-q4f32_1-MLC" ,
621
+ ...qwen3_common_configs ,
622
+ } ,
623
+ {
624
+ name : "Qwen3-8B-q4f16_1-MLC" ,
625
+ ...qwen3_common_configs ,
626
+ } ,
627
+ {
628
+ name : "Qwen3-8B-q4f32_1-MLC" ,
629
+ ...qwen3_common_configs ,
630
+ } ,
631
+ // Qwen2.5
632
+ {
633
+ name : "Qwen2.5-0.5B-Instruct-q4f16_1-MLC" ,
588
634
display_name : "Qwen" ,
589
635
provider : "Alibaba" ,
590
636
family : ModelFamily . QWEN ,
@@ -596,7 +642,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
596
642
} ,
597
643
} ,
598
644
{
599
- name : "Qwen2.5-0.5B-Instruct-q4f16_1 -MLC" ,
645
+ name : "Qwen2.5-0.5B-Instruct-q4f32_1-MLC" ,
600
646
display_name : "Qwen" ,
601
647
provider : "Alibaba" ,
602
648
family : ModelFamily . QWEN ,
@@ -873,6 +919,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
873
919
top_p : 0.8 ,
874
920
} ,
875
921
} ,
922
+ // Gemma 2
876
923
{
877
924
name : "gemma-2-2b-it-q4f16_1-MLC" ,
878
925
display_name : "Gemma" ,
@@ -969,6 +1016,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
969
1016
top_p : 0.9 ,
970
1017
} ,
971
1018
} ,
1019
+ // StableLM
972
1020
{
973
1021
name : "stablelm-2-zephyr-1_6b-q4f16_1-MLC" ,
974
1022
display_name : "StableLM" ,
@@ -1017,6 +1065,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
1017
1065
top_p : 0.95 ,
1018
1066
} ,
1019
1067
} ,
1068
+ // RedPajama
1020
1069
{
1021
1070
name : "RedPajama-INCITE-Chat-3B-v1-q4f16_1-MLC" ,
1022
1071
display_name : "RedPajama" ,
@@ -1057,6 +1106,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
1057
1106
top_p : 0.95 ,
1058
1107
} ,
1059
1108
} ,
1109
+ // TinyLlama
1060
1110
{
1061
1111
name : "TinyLlama-1.1B-Chat-v1.0-q4f16_1-MLC" ,
1062
1112
display_name : "TinyLlama" ,
@@ -1105,6 +1155,7 @@ const DEFAULT_MODEL_BASES: ModelRecord[] = [
1105
1155
top_p : 1 ,
1106
1156
} ,
1107
1157
} ,
1158
+ // Older models
1108
1159
{
1109
1160
name : "Llama-3.1-70B-Instruct-q3f16_1-MLC" ,
1110
1161
display_name : "Llama" ,
0 commit comments