Skip to content

Commit

Permalink
Add quantized qwen2-0.5b (#490)
Browse files Browse the repository at this point in the history
Add the quantized (q4f16) Qwen2-0.5B model to the list of supported models.
[PR](mlc-ai/binary-mlc-llm-libs#128) must be
merged before merging this.
  • Loading branch information
bil-ash authored Jun 27, 2024
1 parent b7537a6 commit 1da0f76
Showing 1 changed file with 13 additions and 0 deletions.
13 changes: 13 additions & 0 deletions src/config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -601,6 +601,19 @@ export const prebuiltAppConfig: AppConfig = {
},
},
// Qwen-2
{
model: "https://huggingface.co/mlc-ai/Qwen2-0.5B-Instruct-q4f16_1-MLC",
model_id: "Qwen2-0.5B-Instruct-q4f16_1-MLC",
model_lib:
modelLibURLPrefix +
modelVersion +
"/Qwen2-0.5B-Instruct-q4f16_1-ctx4k_cs2k-webgpu.wasm",
low_resource_required: true,
vram_required_MB: 944.62,
overrides: {
context_window_size: 4096,
},
},
{
model: "https://huggingface.co/mlc-ai/Qwen2-0.5B-Instruct-q0f16-MLC",
model_id: "Qwen2-0.5B-Instruct-q0f16-MLC",
Expand Down

0 comments on commit 1da0f76

Please sign in to comment.