From e8a326a0e0423393ac1665cfc2a4708bd90208b8 Mon Sep 17 00:00:00 2001
From: Victor Nogueira
Date: Wed, 20 Nov 2024 13:50:11 +0200
Subject: [PATCH] Fix VRAM required by Qwen2.5-Coder-1.5B-Instruct model

Currently, it has the same VRAM values as the `Qwen2.5-Coder-7B-Instruct` model.
This change fixes it using the same values from the `Qwen2.5-1.5B-Instruct` model.
---
 src/config.ts | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/config.ts b/src/config.ts
index 30d301c3..c0352d70 100644
--- a/src/config.ts
+++ b/src/config.ts
@@ -1134,7 +1134,7 @@ export const prebuiltAppConfig: AppConfig = {
         modelVersion +
         "/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm",
       low_resource_required: false,
-      vram_required_MB: 5106.67,
+      vram_required_MB: 1629.75,
       overrides: {
         context_window_size: 4096,
       },
@@ -1148,7 +1148,7 @@ export const prebuiltAppConfig: AppConfig = {
         modelVersion +
         "/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm",
       low_resource_required: false,
-      vram_required_MB: 5900.09,
+      vram_required_MB: 1888.97,
       overrides: {
         context_window_size: 4096,
       },