Skip to content

Commit

Permalink
[Config] Fix VRAM required by Qwen2.5-Coder-1.5B-Instruct model (#632)
Browse files Browse the repository at this point in the history
Currently, the `Qwen2.5-Coder-1.5B-Instruct` entries have the same
`vram_required_MB` values as the `Qwen2.5-Coder-7B-Instruct` model.

This change fixes that by using the same values as the
`Qwen2.5-1.5B-Instruct` model.
  • Loading branch information
felladrin authored Nov 22, 2024
1 parent f5f6edf commit 6504047
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions src/config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -1134,7 +1134,7 @@ export const prebuiltAppConfig: AppConfig = {
modelVersion +
"/Qwen2-1.5B-Instruct-q4f16_1-ctx4k_cs1k-webgpu.wasm",
low_resource_required: false,
- vram_required_MB: 5106.67,
+ vram_required_MB: 1629.75,
overrides: {
context_window_size: 4096,
},
Expand All @@ -1148,7 +1148,7 @@ export const prebuiltAppConfig: AppConfig = {
modelVersion +
"/Qwen2-1.5B-Instruct-q4f32_1-ctx4k_cs1k-webgpu.wasm",
low_resource_required: false,
- vram_required_MB: 5900.09,
+ vram_required_MB: 1888.97,
overrides: {
context_window_size: 4096,
},
Expand Down

0 comments on commit 6504047

Please sign in to comment.