Skip to content

Commit 0617dbb

Browse files
authored
feat: add quantized qwen2-0.5b model (#44)
Adds support for the quantized (q4f16) Qwen2-0.5B model.
1 parent 6a06f4b commit 0617dbb

File tree

1 file changed

+17
-0
lines changed

1 file changed

+17
-0
lines changed

app/constant.ts

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -347,6 +347,23 @@ export const DEFAULT_MODELS: ModelRecord[] = [
347347
temperature: 0.7,
348348
top_p: 0.95,
349349
},
350+
},
351+
{
352+
name: "Qwen2-0.5B-Instruct-q4f16-MLC",
353+
display_name: "Qwen",
354+
provider: "Alibaba",
355+
size: "0.5B",
356+
quantization: "q4f16_1",
357+
context_length: "4k",
358+
family: "Qwen 2",
359+
vram_required_MB: 500, //rough estimate
360+
low_resource_required: true,
361+
recommended_config: {
362+
temperature: 0.7,
363+
presence_penalty: 0,
364+
frequency_penalty: 0,
365+
top_p: 0.8,
366+
},
350367
},
351368
{
352369
name: "Qwen2-0.5B-Instruct-q0f16-MLC",

0 commit comments

Comments
 (0)