From 967b7f2d6e9d2238491aa4d7c621149d0096a272 Mon Sep 17 00:00:00 2001 From: laurent Date: Wed, 2 Oct 2024 09:06:25 +0200 Subject: [PATCH] Update the candle and cudarc versions. --- rust/Cargo.toml | 8 ++++---- rust/moshi-backend/config-q8.json | 2 +- rust/moshi-backend/config.json | 2 +- rust/moshi-core/Cargo.toml | 3 +-- 4 files changed, 7 insertions(+), 8 deletions(-) diff --git a/rust/Cargo.toml b/rust/Cargo.toml index 5ec85f9..f7fecc5 100644 --- a/rust/Cargo.toml +++ b/rust/Cargo.toml @@ -18,10 +18,10 @@ categories = ["science"] [workspace.dependencies] -candle = { version = "0.7.1", package = "candle-core" } -candle-nn = "0.7.1" -candle-transformers = "0.7.1" -candle-flash-attn = "0.7.1" +candle = { version = "0.7.2", package = "candle-core" } +candle-nn = "0.7.2" +candle-transformers = "0.7.2" +candle-flash-attn = "0.7.2" [profile.release] debug = true diff --git a/rust/moshi-backend/config-q8.json b/rust/moshi-backend/config-q8.json index b5e74af..dcb7a1e 100644 --- a/rust/moshi-backend/config-q8.json +++ b/rust/moshi-backend/config-q8.json @@ -1,7 +1,7 @@ { "instance_name": "foo", "hf_repo": "kyutai/moshiko-candle-q8", - "lm_model_file": "$HOME/tmp/model.q8.gguf", + "lm_model_file": "$HOME/tmp/moshiko_rs_301e30bf@120.q8.gguf", "text_tokenizer_file": "$HOME/tmp/tokenizer_spm_32k_3.model", "log_dir": "$HOME/tmp/moshi-logs", "encodec_model_file": "$HOME/tmp/tokenizer-e351c8d8-checkpoint125.safetensors", diff --git a/rust/moshi-backend/config.json b/rust/moshi-backend/config.json index eb7f82c..5efcab4 100644 --- a/rust/moshi-backend/config.json +++ b/rust/moshi-backend/config.json @@ -1,7 +1,7 @@ { "instance_name": "foo", "hf_repo": "kyutai/moshiko-candle-bf16", - "lm_model_file": "$HOME/tmp/model.safetensors", + "lm_model_file": "$HOME/tmp/moshiko_rs_301e30bf@120.safetensors", "text_tokenizer_file": "$HOME/tmp/tokenizer_spm_32k_3.model", "log_dir": "$HOME/tmp/moshi-logs", "encodec_model_file": "$HOME/tmp/tokenizer-e351c8d8-checkpoint125.safetensors", diff --git a/rust/moshi-core/Cargo.toml b/rust/moshi-core/Cargo.toml index ab80075..df8850b 100644 --- a/rust/moshi-core/Cargo.toml +++ b/rust/moshi-core/Cargo.toml @@ -14,7 +14,6 @@ candle = { workspace = true } candle-nn = { workspace = true } candle-transformers = { workspace = true } candle-flash-attn = { workspace = true, optional = true } -cudarc = { version = "=0.11.6", features = ["std", "cublas", "cublaslt", "curand", "driver", "nvrtc", "f16", "cuda-version-from-build-system", "dynamic-linking"], default-features=false, optional = true } rayon = "1.8.1" serde = { version = "1.0", features = ["derive"] } @@ -22,6 +21,6 @@ tracing = "0.1.40" [features] default = [] -cuda = ["candle/cuda", "candle-nn/cuda", "cudarc"] +cuda = ["candle/cuda", "candle-nn/cuda"] metal = ["candle/metal", "candle-nn/metal"] flash-attn = ["cuda", "dep:candle-flash-attn"]