diff --git a/package.json b/package.json
index b4c3e6c..b18022a 100644
--- a/package.json
+++ b/package.json
@@ -1,7 +1,7 @@
 {
   "name": "lycoris",
   "private": true,
-  "version": "0.9.21",
+  "version": "0.9.22",
   "type": "module",
   "license": "MIT",
   "engines": {
@@ -44,6 +44,6 @@
     "postcss": "^8.4.41",
     "tailwindcss": "^3.4.10",
     "typescript": "^5.5.4",
-    "vite": "^5.4.2"
+    "vite": "^5.4.6"
   }
 }
diff --git a/src-tauri/Cargo.lock b/src-tauri/Cargo.lock
index b6675b9..f05c24c 100644
--- a/src-tauri/Cargo.lock
+++ b/src-tauri/Cargo.lock
@@ -27,6 +27,12 @@ version = "1.0.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "f26201604c87b1e01bd3d98f8d5d9a8fcbb815e8cedb41ffccbeb4bf593a35fe"
 
+[[package]]
+name = "adler2"
+version = "2.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "512761e0bb2578dd7380c6baaa0f4ce03e84f95e960231d1dec8bf4d7d6e2627"
+
 [[package]]
 name = "ahash"
 version = "0.8.11"
@@ -170,9 +176,9 @@ dependencies = [
 
 [[package]]
 name = "anyhow"
-version = "1.0.83"
+version = "1.0.89"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "25bdb32cbbdce2b519a9cd7df3a678443100e265d5e25ca763b7572a5104f5f3"
+checksum = "86fdf8605db99b54d3cd748a44c6d04df638eb5dafb219b135d0149bd0db01f6"
 
 [[package]]
 name = "arbitrary"
@@ -220,6 +226,12 @@ version = "0.7.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "96d30a06541fbafbc7f82ed10c06164cfbd2c401138f6addd8404629c4b16711"
 
+[[package]]
+name = "as-any"
+version = "0.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5b8a30a44e99a1c83ccb2a6298c563c888952a1c9134953db26876528f84c93a"
+
 [[package]]
 name = "async-broadcast"
 version = "0.5.1"
@@ -469,7 +481,7 @@ dependencies = [
  "cc",
  "cfg-if",
  "libc",
- "miniz_oxide",
+ "miniz_oxide 0.7.2",
  "object",
  "rustc-demangle",
 ]
@@ -719,11 +731,12 @@ dependencies = [
 
 [[package]]
 name = "candle-core"
-version = "0.6.0"
-source = "git+https://github.com/EricLBuehler/candle.git?rev=3c8e120#3c8e120e8a6ae88b41ee251ec6255035864858d6"
+version = "0.7.2"
+source = "git+https://github.com/EricLBuehler/candle.git?rev=628775#6287750d26e2a9ed6e5f4f4774c51e6af109536c"
 dependencies = [
  "byteorder",
  "candle-metal-kernels",
+ "float8",
  "gemm",
  "half",
  "memmap2",
@@ -741,8 +754,8 @@ dependencies = [
 
 [[package]]
 name = "candle-metal-kernels"
-version = "0.6.0"
-source = "git+https://github.com/EricLBuehler/candle.git?rev=3c8e120#3c8e120e8a6ae88b41ee251ec6255035864858d6"
+version = "0.7.2"
+source = "git+https://github.com/EricLBuehler/candle.git?rev=628775#6287750d26e2a9ed6e5f4f4774c51e6af109536c"
 dependencies = [
  "metal",
  "once_cell",
@@ -752,8 +765,8 @@ dependencies = [
 
 [[package]]
 name = "candle-nn"
-version = "0.6.0"
-source = "git+https://github.com/EricLBuehler/candle.git?rev=3c8e120#3c8e120e8a6ae88b41ee251ec6255035864858d6"
+version = "0.7.2"
+source = "git+https://github.com/EricLBuehler/candle.git?rev=628775#6287750d26e2a9ed6e5f4f4774c51e6af109536c"
 dependencies = [
  "candle-core",
  "candle-metal-kernels",
@@ -903,6 +916,7 @@ dependencies = [
  "anstyle",
  "clap_lex",
  "strsim 0.11.1",
+ "terminal_size",
 ]
 
 [[package]]
@@ -947,9 +961,9 @@ dependencies = [
 
 [[package]]
 name = "cmake"
-version = "0.1.50"
+version = "0.1.51"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a31c789563b815f77f4250caee12365734369f942439b7defd71e18a48197130"
+checksum = "fb1e43aa7fd152b1f968787f7dbcdeb306d1867ff373c69955211876c053f91a"
 dependencies = [
  "cc",
 ]
@@ -1363,16 +1377,16 @@ dependencies = [
 
 [[package]]
 name = "ct2rs"
-version = "0.7.3"
+version = "0.9.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a02ec8476ffc2a7330384ae07bc69e05d3a9366167e6479d9b827818e677977e"
+checksum = "d755bc515349d0a0a7c1b61bc2439a7afbf01be00a3139af73618045a6ea3614"
 dependencies = [
  "anyhow",
  "cmake",
  "cxx",
  "cxx-build",
  "sentencepiece",
- "tokenizers",
+ "tokenizers 0.20.1",
  "walkdir",
 ]
 
@@ -1388,9 +1402,9 @@ dependencies = [
 
 [[package]]
 name = "cxx"
-version = "1.0.122"
+version = "1.0.129"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "bb497fad022245b29c2a0351df572e2d67c1046bcef2260ebc022aec81efea82"
+checksum = "cbdc8cca144dce1c4981b5c9ab748761619979e515c3d53b5df385c677d1d007"
 dependencies = [
  "cc",
  "cxxbridge-flags",
@@ -1400,9 +1414,9 @@ dependencies = [
 
 [[package]]
 name = "cxx-build"
-version = "1.0.122"
+version = "1.0.129"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "9327c7f9fbd6329a200a5d4aa6f674c60ab256525ff0084b52a889d4e4c60cee"
+checksum = "c5764c3142ab44fcf857101d12c0ddf09c34499900557c764f5ad0597159d1fc"
 dependencies = [
  "cc",
  "codespan-reporting",
@@ -1415,15 +1429,15 @@ dependencies = [
 
 [[package]]
 name = "cxxbridge-flags"
-version = "1.0.122"
+version = "1.0.129"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "688c799a4a846f1c0acb9f36bb9c6272d9b3d9457f3633c7753c6057270df13c"
+checksum = "d422aff542b4fa28c2ce8e5cc202d42dbf24702345c1fba3087b2d3f8a1b90ff"
 
 [[package]]
 name = "cxxbridge-macro"
-version = "1.0.122"
+version = "1.0.129"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "928bc249a7e3cd554fd2e8e08a426e9670c50bbfc9a621653cfa9accc9641783"
+checksum = "a1719100f31492cd6adeeab9a0f46cdbc846e615fdb66d7b398aa46ec7fdd06f"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -1679,6 +1693,17 @@ dependencies = [
  "syn 2.0.61",
 ]
 
+[[package]]
+name = "derive-new"
+version = "0.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2cdc8d50f426189eef89dac62fabfa0abb27d5cc008f25bf4156a0203325becc"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.61",
+]
+
 [[package]]
 name = "derive_arbitrary"
 version = "1.3.2"
@@ -1904,6 +1929,70 @@ version = "0.3.6"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "a357d28ed41a50f9c765dbfe56cbc04a64e53e5fc58ba79fbc34c10ef3df831f"
 
+[[package]]
+name = "encoding"
+version = "0.2.33"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6b0d943856b990d12d3b55b359144ff341533e516d94098b1d3fc1ac666d36ec"
+dependencies = [
+ "encoding-index-japanese",
+ "encoding-index-korean",
+ "encoding-index-simpchinese",
+ "encoding-index-singlebyte",
+ "encoding-index-tradchinese",
+]
+
+[[package]]
+name = "encoding-index-japanese"
+version = "1.20141219.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "04e8b2ff42e9a05335dbf8b5c6f7567e5591d0d916ccef4e0b1710d32a0d0c91"
+dependencies = [
+ "encoding_index_tests",
+]
+
+[[package]]
+name = "encoding-index-korean"
+version = "1.20141219.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4dc33fb8e6bcba213fe2f14275f0963fd16f0a02c878e3095ecfdf5bee529d81"
+dependencies = [
+ "encoding_index_tests",
+]
+
+[[package]]
+name = "encoding-index-simpchinese"
+version = "1.20141219.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d87a7194909b9118fc707194baa434a4e3b0fb6a5a757c73c3adb07aa25031f7"
+dependencies = [
+ "encoding_index_tests",
+]
+
+[[package]]
+name = "encoding-index-singlebyte"
+version = "1.20141219.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3351d5acffb224af9ca265f435b859c7c01537c0849754d3db3fdf2bfe2ae84a"
+dependencies = [
+ "encoding_index_tests",
+]
+
+[[package]]
+name = "encoding-index-tradchinese"
+version = "1.20141219.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fd0e20d5688ce3cab59eb3ef3a2083a5c77bf496cb798dc6fcdb75f323890c18"
+dependencies = [
+ "encoding_index_tests",
+]
+
+[[package]]
+name = "encoding_index_tests"
+version = "0.1.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a246d82be1c9d791c5dfde9a2bd045fc3cbba3fa2b11ad558f27d01712f00569"
+
 [[package]]
 name = "encoding_rs"
 version = "0.8.33"
@@ -1913,6 +2002,15 @@ dependencies = [
  "cfg-if",
 ]
 
+[[package]]
+name = "encoding_rs_io"
+version = "0.1.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1cc3c5651fb62ab8aa3103998dade57efdd028544bd300516baa31840c252a83"
+dependencies = [
+ "encoding_rs",
+]
+
 [[package]]
 name = "endian-type"
 version = "0.1.2"
@@ -1952,6 +2050,29 @@ dependencies = [
  "syn 2.0.61",
 ]
 
+[[package]]
+name = "env_filter"
+version = "0.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4f2c92ceda6ceec50f43169f9ee8424fe2db276791afde7b2cd8bc084cb376ab"
+dependencies = [
+ "log",
+ "regex",
+]
+
+[[package]]
+name = "env_logger"
+version = "0.11.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e13fa619b91fb2381732789fc5de83b45675e882f66623b7d8cb4f643017018d"
+dependencies = [
+ "anstream",
+ "anstyle",
+ "env_filter",
+ "humantime",
+ "log",
+]
+
 [[package]]
 name = "equivalent"
 version = "1.0.1"
@@ -2063,7 +2184,7 @@ dependencies = [
  "flume",
  "half",
  "lebe",
- "miniz_oxide",
+ "miniz_oxide 0.7.2",
  "rayon-core",
  "smallvec",
  "zune-inflate",
@@ -2141,12 +2262,24 @@ checksum = "0ce7134b9999ecaf8bcd65542e436736ef32ddca1b3e06094cb6ec5755203b80"
 
 [[package]]
 name = "flate2"
-version = "1.0.28"
+version = "1.0.33"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "46303f565772937ffe1d394a4fac6f411c6013172fadde9dcdb1e147a086940e"
+checksum = "324a1be68054ef05ad64b861cc9eaf1d623d2d8cb25b4bf2cb9cdd902b4bf253"
 dependencies = [
  "crc32fast",
- "miniz_oxide",
+ "miniz_oxide 0.8.0",
+]
+
+[[package]]
+name = "float8"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c7c3475274d374d263c4c40c43ad854c5bdf733c7db775bbd3c1ca2ad7427978"
+dependencies = [
+ "half",
+ "num-traits",
+ "rand 0.8.5",
+ "rand_distr",
 ]
 
 [[package]]
@@ -3075,6 +3208,12 @@ version = "1.0.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "df3b46402a9d5adb4c86a0cf463f42e19994e3ee891101b1841f30a545cb49a9"
 
+[[package]]
+name = "humantime"
+version = "2.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9a3a5bfb195931eeb336b2a7b4d761daec841b97f947d34394601737a7bba5e4"
+
 [[package]]
 name = "hyper"
 version = "0.14.28"
@@ -3466,6 +3605,15 @@ dependencies = [
  "system-deps 5.0.0",
 ]
 
+[[package]]
+name = "jlabel"
+version = "0.1.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "145ee6f495871a0cde6d49ddfa0d103d07430c449d95b6d92fbfb032d622f0b7"
+dependencies = [
+ "thiserror",
+]
+
 [[package]]
 name = "jni"
 version = "0.19.0"
@@ -3518,6 +3666,124 @@ dependencies = [
  "rayon",
 ]
 
+[[package]]
+name = "jpreprocess"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d05ad4316553f214144e04abb54a95f0ec55d9b8b5c4ae004f420ead40d07fe4"
+dependencies = [
+ "jlabel",
+ "jpreprocess-core",
+ "jpreprocess-dictionary",
+ "jpreprocess-dictionary-builder",
+ "jpreprocess-jpcommon",
+ "jpreprocess-naist-jdic",
+ "jpreprocess-njd",
+ "lindera-core",
+ "lindera-dictionary",
+ "lindera-tokenizer",
+ "phf 0.11.2",
+]
+
+[[package]]
+name = "jpreprocess-core"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fe30c65ff4c092320f1bba3418ac111443a4827a9155442f6a7d8d0e3707cb51"
+dependencies = [
+ "aho-corasick",
+ "bincode",
+ "lindera-core",
+ "lindera-tokenizer",
+ "once_cell",
+ "regex",
+ "serde",
+ "thiserror",
+]
+
+[[package]]
+name = "jpreprocess-dictionary"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c156a875d35ef6fedf31cb9d6bb3c562d16faad4506a5be27e2ed44357d755d4"
+dependencies = [
+ "anyhow",
+ "bincode",
+ "byteorder",
+ "jpreprocess-core",
+ "lindera-core",
+ "lindera-ipadic-builder",
+ "lindera-tokenizer",
+ "once_cell",
+ "serde",
+]
+
+[[package]]
+name = "jpreprocess-dictionary-builder"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0cd89b119949a5071e6f49d805829f3dc17169eb7c6aab809e4f373c70098709"
+dependencies = [
+ "anyhow",
+ "bincode",
+ "byteorder",
+ "csv",
+ "glob",
+ "jpreprocess-core",
+ "jpreprocess-dictionary",
+ "lindera-core",
+ "log",
+ "rayon",
+ "serde",
+ "yada",
+]
+
+[[package]]
+name = "jpreprocess-jpcommon"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8a95684847dcf9a95a94d74f725ca207e5106f2c0084959d9b328b7f8fcf3184"
+dependencies = [
+ "jlabel",
+ "jpreprocess-core",
+ "jpreprocess-njd",
+]
+
+[[package]]
+name = "jpreprocess-naist-jdic"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "472767e7dc48354e3b42759721ffc6b457856a339b10f9cb039749011f570cc2"
+dependencies = [
+ "encoding",
+ "flate2",
+ "jpreprocess-dictionary",
+ "jpreprocess-dictionary-builder",
+ "lindera-core",
+ "tar",
+ "ureq",
+]
+
+[[package]]
+name = "jpreprocess-njd"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "25fc5071bd75e17af650bfe4697dfe7f5af8254965ce3242476698cee3c3b7af"
+dependencies = [
+ "aho-corasick",
+ "jpreprocess-core",
+ "jpreprocess-dictionary",
+ "jpreprocess-window",
+ "lindera-tokenizer",
+ "phf 0.11.2",
+]
+
+[[package]]
+name = "jpreprocess-window"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9c06d7aceb8ce626a3318183096aa6dad82f046b3cec5d43e90066d1b07445a2"
+
 [[package]]
 name = "js-sys"
 version = "0.3.69"
@@ -3658,6 +3924,149 @@ dependencies = [
  "vcpkg",
 ]
 
+[[package]]
+name = "lindera-cc-cedict-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85b8f642bc9c9130682569975772a17336c6aab26d11fc0f823f3e663167ace6"
+dependencies = [
+ "anyhow",
+ "lindera-core",
+ "lindera-decompress",
+ "lindera-dictionary-builder",
+]
+
+[[package]]
+name = "lindera-core"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c28191456debc98af6aa5f7db77872471983e9fa2a737b1c232b6ef543aed62"
+dependencies = [
+ "anyhow",
+ "bincode",
+ "byteorder",
+ "encoding_rs",
+ "log",
+ "once_cell",
+ "serde",
+ "thiserror",
+ "yada",
+]
+
+[[package]]
+name = "lindera-decompress"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4788a1ead2f63f3fc2888109272921dedd86a87b7d0bf05e9daab46600daac51"
+dependencies = [
+ "anyhow",
+ "flate2",
+ "serde",
+]
+
+[[package]]
+name = "lindera-dictionary"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bdf5f91725e32b9a21b1656baa7030766c9bafc4de4b4ddeb8ffdde7224dd2f6"
+dependencies = [
+ "anyhow",
+ "bincode",
+ "byteorder",
+ "lindera-cc-cedict-builder",
+ "lindera-core",
+ "lindera-ipadic-builder",
+ "lindera-ipadic-neologd-builder",
+ "lindera-ko-dic-builder",
+ "lindera-unidic-builder",
+ "serde",
+ "strum",
+ "strum_macros",
+]
+
+[[package]]
+name = "lindera-dictionary-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e41f00ba7ac541b0ffd8c30e7a73f2dd197546cc5780462ec4f2e4782945a780"
+dependencies = [
+ "anyhow",
+ "bincode",
+ "byteorder",
+ "csv",
+ "derive_builder",
+ "encoding",
+ "encoding_rs",
+ "encoding_rs_io",
+ "glob",
+ "lindera-core",
+ "lindera-decompress",
+ "log",
+ "yada",
+]
+
+[[package]]
+name = "lindera-ipadic-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bf5031c52686128db13f774b2c5a8abfd52b4cc1f904041d8411aa19d630ce4d"
+dependencies = [
+ "anyhow",
+ "lindera-core",
+ "lindera-decompress",
+ "lindera-dictionary-builder",
+]
+
+[[package]]
+name = "lindera-ipadic-neologd-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "abf36e40ace904741efdd883ed5c4dba6425f65156a0fb5d3f73a386335950dc"
+dependencies = [
+ "anyhow",
+ "lindera-core",
+ "lindera-decompress",
+ "lindera-dictionary-builder",
+]
+
+[[package]]
+name = "lindera-ko-dic-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9f2c60425abc1548570c2568858f74a1f042105ecd89faa39c651b4315350fd9"
+dependencies = [
+ "anyhow",
+ "lindera-core",
+ "lindera-decompress",
+ "lindera-dictionary-builder",
+]
+
+[[package]]
+name = "lindera-tokenizer"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "903e558981bcb6f59870aa7d6b4bcb09e8f7db778886a6a70f67fd74c9fa2ca3"
+dependencies = [
+ "bincode",
+ "lindera-core",
+ "lindera-dictionary",
+ "once_cell",
+ "serde",
+ "serde_json",
+]
+
+[[package]]
+name = "lindera-unidic-builder"
+version = "0.32.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "99e2c50015c242e02c451acb6748667ac6fd1d3d667cd7db48cd89e2f2d2377e"
+dependencies = [
+ "anyhow",
+ "lindera-core",
+ "lindera-decompress",
+ "lindera-dictionary-builder",
+]
+
 [[package]]
 name = "line-wrap"
 version = "0.2.0"
@@ -3740,7 +4149,7 @@ dependencies = [
 
 [[package]]
 name = "lycoris"
-version = "0.9.21"
+version = "0.9.22"
 dependencies = [
  "chrono",
  "core-graphics 0.24.0",
@@ -3759,6 +4168,7 @@ dependencies = [
  "reqwest 0.12.5",
  "rusqlite",
  "samplerate-rs",
+ "sbv2_core",
  "screencapturekit",
  "serde",
  "serde_json",
@@ -3770,7 +4180,6 @@ dependencies = [
  "tokio",
  "unicode-segmentation",
  "urlencoding",
- "uuid 1.10.0",
  "vosk",
  "whisper-rs",
  "xcap",
@@ -3868,6 +4277,16 @@ version = "0.1.10"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "2532096657941c2fea9c289d370a250971c689d4f143798ff67113ec042024a5"
 
+[[package]]
+name = "matrixmultiply"
+version = "0.3.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9380b911e3e96d10c1f415da0876389aaf1b56759054eeb0de7df940c456ba1a"
+dependencies = [
+ "autocfg",
+ "rawpointer",
+]
+
 [[package]]
 name = "maybe-rayon"
 version = "0.1.1"
@@ -3998,6 +4417,15 @@ dependencies = [
  "simd-adler32",
 ]
 
+[[package]]
+name = "miniz_oxide"
+version = "0.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e2d80299ef12ff69b16a84bb182e3b9df68b5a91574d3d4fa6e41b65deec4df1"
+dependencies = [
+ "adler2",
+]
+
 [[package]]
 name = "mio"
 version = "0.8.11"
@@ -4012,8 +4440,8 @@ dependencies = [
 
 [[package]]
 name = "mistralrs"
-version = "0.3.0"
-source = "git+https://github.com/EricLBuehler/mistral.rs.git?tag=v0.3.0#ae71578be27f4369a4d9a0c7d9b849be14c82162"
+version = "0.3.1"
+source = "git+https://github.com/EricLBuehler/mistral.rs.git?rev=32e8945#32e894510696e9aa3c11db79268ee031a3ecefa6"
 dependencies = [
  "anyhow",
  "candle-core",
@@ -4031,11 +4459,12 @@ dependencies = [
 
 [[package]]
 name = "mistralrs-core"
-version = "0.3.0"
-source = "git+https://github.com/EricLBuehler/mistral.rs.git?tag=v0.3.0#ae71578be27f4369a4d9a0c7d9b849be14c82162"
+version = "0.3.1"
+source = "git+https://github.com/EricLBuehler/mistral.rs.git?rev=32e8945#32e894510696e9aa3c11db79268ee031a3ecefa6"
 dependencies = [
  "akin",
  "anyhow",
+ "as-any",
  "async-trait",
  "base64 0.22.1",
  "buildstructor",
@@ -4047,10 +4476,11 @@ dependencies = [
  "chrono",
  "clap",
  "csv",
- "derive-new",
+ "derive-new 0.7.0",
  "derive_more",
  "dirs",
  "either",
+ "float8",
  "futures",
  "galil-seiferas",
  "half",
@@ -4073,14 +4503,16 @@ dependencies = [
  "regex-automata 0.4.6",
  "reqwest 0.12.5",
  "rustc-hash 2.0.0",
+ "safetensors",
  "schemars",
  "serde",
  "serde_json",
+ "serde_plain",
  "serde_yaml",
  "strum",
  "sysinfo",
  "thiserror",
- "tokenizers",
+ "tokenizers 0.19.1",
  "tokio",
  "tokio-rayon",
  "toml 0.8.12",
@@ -4094,13 +4526,16 @@ dependencies = [
 
 [[package]]
 name = "mistralrs-quant"
-version = "0.3.0"
-source = "git+https://github.com/EricLBuehler/mistral.rs.git?tag=v0.3.0#ae71578be27f4369a4d9a0c7d9b849be14c82162"
+version = "0.3.1"
+source = "git+https://github.com/EricLBuehler/mistral.rs.git?rev=32e8945#32e894510696e9aa3c11db79268ee031a3ecefa6"
 dependencies = [
+ "byteorder",
  "candle-core",
  "candle-nn",
+ "float8",
  "half",
  "lazy_static",
+ "once_cell",
  "paste",
  "rayon",
  "serde",
@@ -4109,8 +4544,8 @@ dependencies = [
 
 [[package]]
 name = "mistralrs-vision"
-version = "0.3.0"
-source = "git+https://github.com/EricLBuehler/mistral.rs.git?tag=v0.3.0#ae71578be27f4369a4d9a0c7d9b849be14c82162"
+version = "0.3.1"
+source = "git+https://github.com/EricLBuehler/mistral.rs.git?rev=32e8945#32e894510696e9aa3c11db79268ee031a3ecefa6"
 dependencies = [
  "candle-core",
  "image 0.25.2",
@@ -4155,6 +4590,21 @@ dependencies = [
  "tempfile",
 ]
 
+[[package]]
+name = "ndarray"
+version = "0.16.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "882ed72dce9365842bf196bdeedf5055305f11fc8c03dee7bb0194a6cad34841"
+dependencies = [
+ "matrixmultiply",
+ "num-complex",
+ "num-integer",
+ "num-traits",
+ "portable-atomic",
+ "portable-atomic-util",
+ "rawpointer",
+]
+
 [[package]]
 name = "ndk"
 version = "0.6.0"
@@ -4647,6 +5097,32 @@ dependencies = [
  "pin-project-lite",
 ]
 
+[[package]]
+name = "ort"
+version = "2.0.0-rc.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a5f95fe501e1cb81dec2f66ee3129025759b602817aa2c77ff421390c418cc34"
+dependencies = [
+ "half",
+ "libloading",
+ "ndarray",
+ "ort-sys",
+ "tracing",
+]
+
+[[package]]
+name = "ort-sys"
+version = "2.0.0-rc.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b4174960a7b93a17564a05b26e05889f0dea9ee70e68db5841f27b40c0c9804e"
+dependencies = [
+ "flate2",
+ "pkg-config",
+ "sha2",
+ "tar",
+ "ureq",
+]
+
 [[package]]
 name = "os_info"
 version = "3.8.2"
@@ -5003,7 +5479,7 @@ dependencies = [
  "crc32fast",
  "fdeflate",
  "flate2",
- "miniz_oxide",
+ "miniz_oxide 0.7.2",
 ]
 
 [[package]]
@@ -5043,6 +5519,15 @@ version = "1.6.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "7170ef9988bc169ba16dd36a7fa041e5c4cbeb6a35b76d4c03daded371eae7c0"
 
+[[package]]
+name = "portable-atomic-util"
+version = "0.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fcdd8420072e66d54a407b3316991fe946ce3ab1083a7f575b2463866624704d"
+dependencies = [
+ "portable-atomic",
+]
+
 [[package]]
 name = "powerfmt"
 version = "0.2.0"
@@ -5063,9 +5548,9 @@ checksum = "925383efa346730478fb4838dbe9137d2a47675ad789c546d150a6e1dd4ab31c"
 
 [[package]]
 name = "prettyplease"
-version = "0.2.17"
+version = "0.2.20"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "8d3928fb5db768cb86f891ff014f0144589297e3c6a1aba6ed7cecfdace270c7"
+checksum = "5f12335488a2f3b0a83b14edad48dca9879ce89b2edd10e80237e4e852dd645e"
 dependencies = [
  "proc-macro2",
  "syn 2.0.61",
@@ -5391,6 +5876,12 @@ version = "0.5.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "f2ff9a1f06a88b01621b7ae906ef0211290d1c8a168a15542486a8f61c0833b9"
 
+[[package]]
+name = "rawpointer"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "60a357793950651c4ed0f3f52338f53b2f809f32d83a07f72909fa13e4c6c1e3"
+
 [[package]]
 name = "rayon"
 version = "1.10.0"
@@ -5803,9 +6294,9 @@ checksum = "e86697c916019a8588c99b5fac3cead74ec0b4b819707a682fd4d23fa0ce1ba1"
 
 [[package]]
 name = "safetensors"
-version = "0.4.3"
+version = "0.4.5"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "8ced76b22c7fba1162f11a5a75d9d8405264b467a07ae0c9c29be119b9297db9"
+checksum = "44560c11236a6130a46ce36c836a62936dc81ebf8c36a37947423571be0e55b6"
 dependencies = [
  "serde",
  "serde_json",
@@ -5829,6 +6320,30 @@ dependencies = [
  "libsamplerate",
 ]
 
+[[package]]
+name = "sbv2_core"
+version = "0.1.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "aa89a844f9b5e6e7bf8353bfca5f6f414c12c2cfcffa86e17da7d58d839208c0"
+dependencies = [
+ "anyhow",
+ "dotenvy",
+ "env_logger",
+ "hound",
+ "jpreprocess",
+ "ndarray",
+ "num_cpus",
+ "once_cell",
+ "ort",
+ "regex",
+ "serde",
+ "serde_json",
+ "tar",
+ "thiserror",
+ "tokenizers 0.20.1",
+ "zstd",
+]
+
 [[package]]
 name = "schannel"
 version = "0.1.23"
@@ -6002,18 +6517,18 @@ checksum = "a3f0bf26fd526d2a95683cd0f87bf103b8539e2ca1ef48ce002d67aad59aa0b4"
 
 [[package]]
 name = "serde"
-version = "1.0.197"
+version = "1.0.210"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "3fb1c873e1b9b056a4dc4c0c198b24c3ffa059243875552b2bd0933b1aee4ce2"
+checksum = "c8e3592472072e6e22e0a54d5904d9febf8508f65fb8552499a1abc7d1078c3a"
 dependencies = [
  "serde_derive",
 ]
 
 [[package]]
 name = "serde_derive"
-version = "1.0.197"
+version = "1.0.210"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "7eb0b34b42edc17f6b7cac84a52a1c5f0e1bb2227e997ca9011ea3dd34e8610b"
+checksum = "243902eda00fad750862fc144cea25caca5e20d615af0a81bee94ca738f1df1f"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -6033,16 +6548,26 @@ dependencies = [
 
 [[package]]
 name = "serde_json"
-version = "1.0.114"
+version = "1.0.128"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c5f09b1bd632ef549eaa9f60a1f8de742bdbc698e6cee2095fc84dde5f549ae0"
+checksum = "6ff5456707a1de34e7e37f2a6fd3d3f808c318259cbd01ab6377795054b483d8"
 dependencies = [
  "indexmap 2.2.6",
  "itoa 1.0.10",
+ "memchr",
  "ryu",
  "serde",
 ]
 
+[[package]]
+name = "serde_plain"
+version = "1.0.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9ce1fc6db65a611022b23a0dec6975d63fb80a302cb3388835ff02c097258d50"
+dependencies = [
+ "serde",
+]
+
 [[package]]
 name = "serde_repr"
 version = "0.1.18"
@@ -6308,6 +6833,17 @@ dependencies = [
  "windows-sys 0.52.0",
 ]
 
+[[package]]
+name = "socks"
+version = "0.3.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f0c3dbbd9ae980613c6dd8e28a9407b50509d3803b57624d5dfe8315218cd58b"
+dependencies = [
+ "byteorder",
+ "libc",
+ "winapi",
+]
+
 [[package]]
 name = "soup2"
 version = "0.2.1"
@@ -6941,9 +7477,9 @@ dependencies = [
 
 [[package]]
 name = "tar"
-version = "0.4.40"
+version = "0.4.41"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "b16afcea1f22891c49a00c751c7b63b2233284064f11a200fc624137c51e2ddb"
+checksum = "cb797dad5fb5b76fcf519e702f4a589483b5ef06567f160c392832c1f5e44909"
 dependencies = [
  "filetime",
  "libc",
@@ -7243,6 +7779,16 @@ dependencies = [
  "winapi-util",
 ]
 
+[[package]]
+name = "terminal_size"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "21bebf2b7c9e0a515f6e0f8c51dc0f8e4696391e6f1ff30379559f8365fb0df7"
+dependencies = [
+ "rustix 0.38.32",
+ "windows-sys 0.48.0",
+]
+
 [[package]]
 name = "thin-slice"
 version = "0.1.1"
@@ -7251,18 +7797,18 @@ checksum = "8eaa81235c7058867fa8c0e7314f33dcce9c215f535d1913822a2b3f5e289f3c"
 
 [[package]]
 name = "thiserror"
-version = "1.0.58"
+version = "1.0.63"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "03468839009160513471e86a034bb2c5c0e4baae3b43f79ffc55c4a5427b3297"
+checksum = "c0342370b38b6a11b6cc11d6a805569958d54cfa061a29969c3b5ce2ea405724"
 dependencies = [
  "thiserror-impl",
 ]
 
 [[package]]
 name = "thiserror-impl"
-version = "1.0.58"
+version = "1.0.63"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c61f3ba182994efc43764a46c018c347bc492c79f024e705f46567b418f6d4f7"
+checksum = "a4558b58466b9ad7ca0f102865eccc95938dca1a74a856f2b57b6629050da261"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -7368,6 +7914,38 @@ dependencies = [
  "unicode_categories",
 ]
 
+[[package]]
+name = "tokenizers"
+version = "0.20.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b172ffa9a2e5c31bbddc940cd5725d933ced983a9333bbebc4c7eda3bbce1557"
+dependencies = [
+ "aho-corasick",
+ "derive_builder",
+ "esaxx-rs",
+ "getrandom 0.2.12",
+ "indicatif",
+ "itertools 0.12.1",
+ "lazy_static",
+ "log",
+ "macro_rules_attribute",
+ "monostate",
+ "onig",
+ "paste",
+ "rand 0.8.5",
+ "rayon",
+ "rayon-cond",
+ "regex",
+ "regex-syntax 0.8.2",
+ "serde",
+ "serde_json",
+ "spm_precompiled",
+ "thiserror",
+ "unicode-normalization-alignments",
+ "unicode-segmentation",
+ "unicode_categories",
+]
+
 [[package]]
 name = "tokio"
 version = "1.36.0"
@@ -7770,6 +8348,7 @@ dependencies = [
  "rustls-webpki",
  "serde",
  "serde_json",
+ "socks",
  "url",
  "webpki-roots",
 ]
@@ -8244,18 +8823,16 @@ dependencies = [
 
 [[package]]
 name = "whisper-rs"
-version = "0.11.1"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "ed7a191078e189d96d029244ab1dff159775adec71dc89a222e9bb9d21a7d161"
+version = "0.13.1"
+source = "git+https://github.com/arizhih/whisper-rs.git?branch=whisper-cpp-1-7-x#9f56a7350b31ce09f6e95be928beeea837684a59"
 dependencies = [
  "whisper-rs-sys",
 ]
 
 [[package]]
 name = "whisper-rs-sys"
-version = "0.9.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "2834f4ca6472b02748c6c282a60cea538f962428f79e685c3205a08efd711336"
+version = "0.11.1"
+source = "git+https://github.com/arizhih/whisper-rs.git?branch=whisper-cpp-1-7-x#9f56a7350b31ce09f6e95be928beeea837684a59"
 dependencies = [
  "bindgen",
  "cfg-if",
@@ -8757,7 +9334,7 @@ version = "0.8.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "12b41773911497b18ca8553c3daaf8ec9fe9819caf93d451d3055f69de028adb"
 dependencies = [
- "derive-new",
+ "derive-new 0.6.0",
  "libc",
  "log",
  "nix 0.28.0",
@@ -8897,6 +9474,12 @@ dependencies = [
  "winapi",
 ]
 
+[[package]]
+name = "yada"
+version = "0.5.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "aed111bd9e48a802518765906cbdadf0b45afb72b9c81ab049a3b86252adffdd"
+
 [[package]]
 name = "yoke"
 version = "0.7.4"
@@ -9049,6 +9632,34 @@ dependencies = [
  "thiserror",
 ]
 
+[[package]]
+name = "zstd"
+version = "0.13.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fcf2b778a664581e31e389454a7072dab1647606d44f7feea22cd5abb9c9f3f9"
+dependencies = [
+ "zstd-safe",
+]
+
+[[package]]
+name = "zstd-safe"
+version = "7.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "54a3ab4db68cea366acc5c897c7b4d4d1b8994a9cd6e6f841f8964566a419059"
+dependencies = [
+ "zstd-sys",
+]
+
+[[package]]
+name = "zstd-sys"
+version = "2.0.13+zstd.1.5.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "38ff0f21cfee8f97d94cef41359e0c89aa6113028ab0291aa8ca0038995a95aa"
+dependencies = [
+ "cc",
+ "pkg-config",
+]
+
 [[package]]
 name = "zune-core"
 version = "0.4.12"
diff --git a/src-tauri/Cargo.toml b/src-tauri/Cargo.toml
index 9db86f0..de75e48 100644
--- a/src-tauri/Cargo.toml
+++ b/src-tauri/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "lycoris"
-version = "0.9.21"
+version = "0.9.22"
 description = "Lycoris is an offline voice memo"
 authors = ["solaoi"]
 license = "MIT"
@@ -43,18 +43,15 @@ core-graphics = "0.24.0"
 objc = "0.2"
 objc-foundation = "0.1"
 objc_id = "0.1"
-ct2rs = { version = "0.7.3", features = ["accelerate"] }
-mistralrs = { git = "https://github.com/EricLBuehler/mistral.rs.git", tag = "v0.3.0", features = [
+ct2rs = { version = "0.9.4", features = ["accelerate"] }
+mistralrs = { git = "https://github.com/EricLBuehler/mistral.rs.git", rev = "32e8945", features = [
     "metal",
 ] }
-# mistralrsの要求がtauriの要求と競合するため、tauriの要求を上書きする
-uuid = "=1.10.0"
 tauri-plugin-clipboard = "1.1.4"
-
-[target.'cfg(target_arch = "x86_64")'.dependencies]
-whisper-rs = { version = "0.11.1", features = ["metal"] }
-[target.'cfg(target_arch = "aarch64")'.dependencies]
-whisper-rs = { version = "0.11.1", features = ["metal", "coreml"] }
+sbv2_core = { version = "0.1.4", features = ["dynamic"] }
+# whisper-rs = { version = "0.11.1", features = ["metal"] }
+# whisper-rs = { git = "https://github.com/tazz4843/whisper-rs.git", rev = "67924ca", features = ["metal"] }
+whisper-rs = { git = "https://github.com/arizhih/whisper-rs.git", branch = "whisper-cpp-1-7-x", features = ["metal"] }
 
 [dependencies.tauri-plugin-sql]
 git = "https://github.com/tauri-apps/plugins-workspace"
diff --git a/src-tauri/lib/libonnxruntime.dylib b/src-tauri/lib/libonnxruntime.dylib
new file mode 100755
index 0000000..035534e
Binary files /dev/null and b/src-tauri/lib/libonnxruntime.dylib differ
diff --git a/src-tauri/migrations/001.sql b/src-tauri/migrations/001.sql
index 1e919c2..440d830 100644
--- a/src-tauri/migrations/001.sql
+++ b/src-tauri/migrations/001.sql
@@ -8,6 +8,8 @@ CREATE TABLE speeches (
     id INTEGER PRIMARY KEY AUTOINCREMENT,
     speech_type TEXT,
     -- speech|memo|screenshot|action
+    action_type TEXT,
+    -- chat|suggest
     created_at_unixtime INTEGER DEFAULT (CAST(strftime('%s', 'now') AS INTEGER)),
     content TEXT,
     content_2 TEXT,
@@ -35,7 +37,7 @@ VALUES("settingKeyAmivoice", "");
 INSERT INTO settings(setting_name, setting_status)
 VALUES("settingLanguage", "日本語");
 INSERT INTO settings(setting_name, setting_status)
-VALUES("settingProcess", "文字起こし");
+VALUES("settingProcess", "文字起こし（汎用）");
 INSERT INTO settings(setting_name, setting_status)
 VALUES("settingOnline", "OpenAI");
 INSERT INTO settings(setting_name, setting_status)
@@ -74,10 +76,14 @@ VALUES("base.en", "whisper");
 INSERT INTO models(model_name, model_type)
 VALUES("large", "whisper");
 INSERT INTO models(model_name, model_type)
+VALUES("large-turbo", "whisper");
+INSERT INTO models(model_name, model_type)
 VALUES("large-distil.en", "whisper");
 INSERT INTO models(model_name, model_type)
 VALUES("large-distil.ja", "whisper");
 INSERT INTO models(model_name, model_type)
+VALUES("large-distil.bilingual", "whisper");
+INSERT INTO models(model_name, model_type)
 VALUES("medium", "whisper");
 INSERT INTO models(model_name, model_type)
 VALUES("medium.en", "whisper");
@@ -150,6 +156,24 @@ VALUES("small-cs-0.4-rhasspy", "vosk");
 INSERT INTO models(model_name, model_type)
 VALUES("small-pl-0.22", "vosk");
 INSERT INTO models(model_name, model_type)
-VALUES("fugumt-en-ja", "fugumt");
+VALUES("fugumt-en-ja", "fugumt-en-ja");
+INSERT INTO models(model_name, model_type)
+VALUES("fugumt-ja-en", "fugumt-ja-en");
+INSERT INTO models(model_name, model_type)
+VALUES("honyaku-13b", "honyaku-13b");
+INSERT INTO models(model_name, model_type)
+VALUES("style-bert-vits2", "style-bert-vits2");
+INSERT INTO models(model_name, model_type)
+VALUES("tsukuyomi-chan", "style-bert-vits2-voice");
+INSERT INTO models(model_name, model_type)
+VALUES("amitaro", "style-bert-vits2-voice");
+INSERT INTO models(model_name, model_type)
+VALUES("koharune-ami", "style-bert-vits2-voice");
+INSERT INTO models(model_name, model_type)
+VALUES("jvnv-F1-jp", "style-bert-vits2-voice");
+INSERT INTO models(model_name, model_type)
+VALUES("jvnv-F2-jp", "style-bert-vits2-voice");
+INSERT INTO models(model_name, model_type)
+VALUES("jvnv-M1-jp", "style-bert-vits2-voice");
 INSERT INTO models(model_name, model_type)
-VALUES("honyaku13b-q4-0", "honyaku13b");
\ No newline at end of file
+VALUES("jvnv-M2-jp", "style-bert-vits2-voice");
\ No newline at end of file
diff --git a/src-tauri/resources/whisper/ggml-metal.metal b/src-tauri/resources/whisper/ggml-metal.metal
deleted file mode 100644
index a7d3f9e..0000000
--- a/src-tauri/resources/whisper/ggml-metal.metal
+++ /dev/null
@@ -1,5136 +0,0 @@
-#include <metal_stdlib>
-
-using namespace metal;
-
-#define MAX(x, y) ((x) > (y) ? (x) : (y))
-#define MIN(x, y) ((x) < (y) ? (x) : (y))
-#define SWAP(x, y) { auto tmp = (x); (x) = (y); (y) = tmp; }
-
-#define QK4_0 32
-#define QR4_0 2
-typedef struct {
-    half    d;             // delta
-    uint8_t qs[QK4_0 / 2]; // nibbles / quants
-} block_q4_0;
-
-#define QK4_1 32
-typedef struct {
-    half d;                 // delta
-    half m;                 // min
-    uint8_t qs[QK4_1 / 2];  // nibbles / quants
-} block_q4_1;
-
-#define QK5_0 32
-typedef struct {
-    half d;                // delta
-    uint8_t qh[4];         // 5-th bit of quants
-    uint8_t qs[QK5_0 / 2]; // nibbles / quants
-} block_q5_0;
-
-#define QK5_1 32
-typedef struct {
-    half d;                 // delta
-    half m;                 // min
-    uint8_t qh[4];          // 5-th bit of quants
-    uint8_t qs[QK5_1 / 2];  // nibbles / quants
-} block_q5_1;
-
-#define QK8_0 32
-typedef struct {
-    half    d;         // delta
-    int8_t  qs[QK8_0]; // quants
-} block_q8_0;
-
-#define N_SIMDWIDTH 32 // assuming SIMD group size is 32
-
-enum ggml_sort_order {
-    GGML_SORT_ASC,
-    GGML_SORT_DESC,
-};
-
-// general-purpose kernel for addition, multiplication and division of two tensors
-// pros: works for non-contiguous tensors, supports broadcast across all dims
-// cons: not very efficient
-kernel void kernel_add(
-        device const char * src0,
-        device const char * src1,
-        device       char * dst,
-        constant  int64_t & ne00,
-        constant  int64_t & ne01,
-        constant  int64_t & ne02,
-        constant  int64_t & ne03,
-        constant uint64_t & nb00,
-        constant uint64_t & nb01,
-        constant uint64_t & nb02,
-        constant uint64_t & nb03,
-        constant  int64_t & ne10,
-        constant  int64_t & ne11,
-        constant  int64_t & ne12,
-        constant  int64_t & ne13,
-        constant uint64_t & nb10,
-        constant uint64_t & nb11,
-        constant uint64_t & nb12,
-        constant uint64_t & nb13,
-        constant  int64_t & ne0,
-        constant  int64_t & ne1,
-        constant  int64_t & ne2,
-        constant  int64_t & ne3,
-        constant uint64_t & nb0,
-        constant uint64_t & nb1,
-        constant uint64_t & nb2,
-        constant uint64_t & nb3,
-        constant  int64_t & offs,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig.z;
-    const int64_t i02 = tgpig.y;
-    const int64_t i01 = tgpig.x;
-
-    const int64_t i13 = i03 % ne13;
-    const int64_t i12 = i02 % ne12;
-    const int64_t i11 = i01 % ne11;
-
-    device const char * src0_ptr = src0 + i03*nb03 + i02*nb02 + i01*nb01 + offs;
-    device const char * src1_ptr = src1 + i13*nb13 + i12*nb12 + i11*nb11;
-    device       char * dst_ptr  = dst  + i03*nb3  + i02*nb2  + i01*nb1  + offs;
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        const int i10 = i0 % ne10;
-        *((device float *)(dst_ptr + i0*nb0)) = *((device float *)(src0_ptr + i0*nb00)) + *((device float *)(src1_ptr + i10*nb10));
-    }
-}
-
-kernel void kernel_mul(
-        device const char * src0,
-        device const char * src1,
-        device       char * dst,
-        constant  int64_t & ne00,
-        constant  int64_t & ne01,
-        constant  int64_t & ne02,
-        constant  int64_t & ne03,
-        constant uint64_t & nb00,
-        constant uint64_t & nb01,
-        constant uint64_t & nb02,
-        constant uint64_t & nb03,
-        constant  int64_t & ne10,
-        constant  int64_t & ne11,
-        constant  int64_t & ne12,
-        constant  int64_t & ne13,
-        constant uint64_t & nb10,
-        constant uint64_t & nb11,
-        constant uint64_t & nb12,
-        constant uint64_t & nb13,
-        constant  int64_t & ne0,
-        constant  int64_t & ne1,
-        constant  int64_t & ne2,
-        constant  int64_t & ne3,
-        constant uint64_t & nb0,
-        constant uint64_t & nb1,
-        constant uint64_t & nb2,
-        constant uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig.z;
-    const int64_t i02 = tgpig.y;
-    const int64_t i01 = tgpig.x;
-
-    const int64_t i13 = i03 % ne13;
-    const int64_t i12 = i02 % ne12;
-    const int64_t i11 = i01 % ne11;
-
-    device const char * src0_ptr = src0 + i03*nb03 + i02*nb02 + i01*nb01;
-    device const char * src1_ptr = src1 + i13*nb13 + i12*nb12 + i11*nb11;
-    device       char * dst_ptr  = dst  + i03*nb3  + i02*nb2  + i01*nb1;
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        const int i10 = i0 % ne10;
-        *((device float *)(dst_ptr + i0*nb0)) = *((device float *)(src0_ptr + i0*nb00)) * *((device float *)(src1_ptr + i10*nb10));
-    }
-}
-
-kernel void kernel_div(
-        device const char * src0,
-        device const char * src1,
-        device       char * dst,
-        constant  int64_t & ne00,
-        constant  int64_t & ne01,
-        constant  int64_t & ne02,
-        constant  int64_t & ne03,
-        constant uint64_t & nb00,
-        constant uint64_t & nb01,
-        constant uint64_t & nb02,
-        constant uint64_t & nb03,
-        constant  int64_t & ne10,
-        constant  int64_t & ne11,
-        constant  int64_t & ne12,
-        constant  int64_t & ne13,
-        constant uint64_t & nb10,
-        constant uint64_t & nb11,
-        constant uint64_t & nb12,
-        constant uint64_t & nb13,
-        constant  int64_t & ne0,
-        constant  int64_t & ne1,
-        constant  int64_t & ne2,
-        constant  int64_t & ne3,
-        constant uint64_t & nb0,
-        constant uint64_t & nb1,
-        constant uint64_t & nb2,
-        constant uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig.z;
-    const int64_t i02 = tgpig.y;
-    const int64_t i01 = tgpig.x;
-
-    const int64_t i13 = i03 % ne13;
-    const int64_t i12 = i02 % ne12;
-    const int64_t i11 = i01 % ne11;
-
-    device const char * src0_ptr = src0 + i03*nb03 + i02*nb02 + i01*nb01;
-    device const char * src1_ptr = src1 + i13*nb13 + i12*nb12 + i11*nb11;
-    device       char * dst_ptr  = dst  + i03*nb3  + i02*nb2  + i01*nb1;
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        const int i10 = i0 % ne10;
-        *((device float *)(dst_ptr + i0*nb0)) = *((device float *)(src0_ptr + i0*nb00)) / *((device float *)(src1_ptr + i10*nb10));
-    }
-}
-
-// assumption: src1 is a row
-// broadcast src1 into src0
-kernel void kernel_add_row(
-        device const float4 * src0,
-        device const float4 * src1,
-        device       float4 * dst,
-        constant   uint64_t & nb [[buffer(28)]],
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] + src1[tpig % nb];
-}
-
-kernel void kernel_mul_row(
-        device const float4 * src0,
-        device const float4 * src1,
-        device       float4 * dst,
-        constant   uint64_t & nb  [[buffer(28)]],
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] * src1[tpig % nb];
-}
-
-kernel void kernel_div_row(
-        device const float4 * src0,
-        device const float4 * src1,
-        device       float4 * dst,
-        constant   uint64_t & nb  [[buffer(28)]],
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] / src1[tpig % nb];
-}
-
-kernel void kernel_scale(
-        device const float * src0,
-        device       float * dst,
-        constant     float & scale,
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] * scale;
-}
-
-kernel void kernel_scale_4(
-        device const float4 * src0,
-        device       float4 * dst,
-        constant     float  & scale,
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] * scale;
-}
-
-kernel void kernel_relu(
-        device const float * src0,
-        device       float * dst,
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = max(0.0f, src0[tpig]);
-}
-
-kernel void kernel_tanh(
-        device const float * src0,
-        device       float * dst,
-        uint tpig[[thread_position_in_grid]]) {
-    device const float & x = src0[tpig];
-    dst[tpig] = precise::tanh(x);
-}
-
-constant float GELU_COEF_A     = 0.044715f;
-constant float GELU_QUICK_COEF = -1.702f;
-constant float SQRT_2_OVER_PI  = 0.79788456080286535587989211986876f;
-
-kernel void kernel_gelu(
-    device const float4 * src0,
-    device       float4 * dst,
-    uint tpig[[thread_position_in_grid]]) {
-    device const float4 & x = src0[tpig];
-
-    // BEWARE !!!
-    // Simply using "tanh" instead of "precise::tanh" will sometimes results in NaNs!
-    // This was observed with Falcon 7B and 40B models
-    //
-    dst[tpig] = 0.5f*x*(1.0f + precise::tanh(SQRT_2_OVER_PI*x*(1.0f + GELU_COEF_A*x*x)));
-}
-
-kernel void kernel_gelu_quick(
-    device const float4 * src0,
-    device       float4 * dst,
-    uint tpig[[thread_position_in_grid]]) {
-    device const float4 & x = src0[tpig];
-
-    dst[tpig] = x*(1.0f/(1.0f+exp(GELU_QUICK_COEF*x)));
-}
-
-kernel void kernel_silu(
-        device const float4 * src0,
-        device       float4 * dst,
-        uint tpig[[thread_position_in_grid]]) {
-    device const float4 & x = src0[tpig];
-    dst[tpig] = x / (1.0f + exp(-x));
-}
-
-kernel void kernel_sqr(
-        device const float * src0,
-        device       float * dst,
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] * src0[tpig];
-}
-
-kernel void kernel_sum_rows(
-        device const float * src0,
-        device       float * dst,
-        constant  int64_t & ne00,
-        constant  int64_t & ne01,
-        constant  int64_t & ne02,
-        constant  int64_t & ne03,
-        constant uint64_t & nb00,
-        constant uint64_t & nb01,
-        constant uint64_t & nb02,
-        constant uint64_t & nb03,
-        constant  int64_t & ne10,
-        constant  int64_t & ne11,
-        constant  int64_t & ne12,
-        constant  int64_t & ne13,
-        constant uint64_t & nb10,
-        constant uint64_t & nb11,
-        constant uint64_t & nb12,
-        constant uint64_t & nb13,
-        constant  int64_t & ne0,
-        constant  int64_t & ne1,
-        constant  int64_t & ne2,
-        constant  int64_t & ne3,
-        constant uint64_t & nb0,
-        constant uint64_t & nb1,
-        constant uint64_t & nb2,
-        constant uint64_t & nb3,
-        uint3 tpig[[thread_position_in_grid]]) {
-    int64_t i3 = tpig.z;
-    int64_t i2 = tpig.y;
-    int64_t i1 = tpig.x;
-
-    if (i3 >= ne03 || i2 >= ne02 || i1 >= ne01) {
-        return;
-    }
-
-    device const float * src_row = (device const float *) ((device const char *) src0 + i1*nb01 + i2*nb02 + i3*nb03);
-    device       float * dst_row = (device       float *) ((device       char *) dst  + i1*nb1  + i2*nb2  + i3*nb3);
-
-    float row_sum = 0;
-
-    for (int64_t i0 = 0; i0 < ne00; i0++) {
-        row_sum += src_row[i0];
-    }
-
-    dst_row[0] = row_sum;
-}
-
-kernel void kernel_soft_max(
-        device const float * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant     float & scale,
-        threadgroup float  * buf [[threadgroup(0)]],
-        uint  tgpig[[threadgroup_position_in_grid]],
-        uint  tpitg[[thread_position_in_threadgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint    ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = (tgpig) / (ne02*ne01);
-    const int64_t i02 = (tgpig - i03*ne02*ne01) / ne01;
-    const int64_t i01 = (tgpig - i03*ne02*ne01 - i02*ne01);
-
-    device const float * psrc0 =         src0 + i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-    device const float * pmask = src1 != src0 ? src1                               + i01*ne00 : nullptr;
-    device       float * pdst  =         dst  + i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    // parallel max
-    float lmax = -INFINITY;
-
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        lmax = MAX(lmax, psrc0[i00]*scale + (pmask ? pmask[i00] : 0.0f));
-    }
-
-    // find the max value in the block
-    float max_val = simd_max(lmax);
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = -INFINITY;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = max_val;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        max_val = buf[tiisg];
-        max_val = simd_max(max_val);
-    }
-
-    // parallel sum
-    float lsum = 0.0f;
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        const float exp_psrc0 = exp((psrc0[i00]*scale + (pmask ? pmask[i00] : 0.0f)) - max_val);
-        lsum += exp_psrc0;
-        pdst[i00] = exp_psrc0;
-    }
-
-    // This barrier fixes a failing test
-    // ref: https://github.com/ggerganov/ggml/pull/621#discussion_r1425156335
-    threadgroup_barrier(mem_flags::mem_none);
-
-    float sum = simd_sum(lsum);
-
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = 0.0f;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = sum;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        sum = buf[tiisg];
-        sum = simd_sum(sum);
-    }
-
-    const float inv_sum = 1.0f/sum;
-
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        pdst[i00] *= inv_sum;
-    }
-}
-
-kernel void kernel_soft_max_4(
-        device const float * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant     float & scale,
-        threadgroup float  * buf [[threadgroup(0)]],
-        uint  tgpig[[threadgroup_position_in_grid]],
-        uint  tpitg[[thread_position_in_threadgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint    ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = (tgpig) / (ne02*ne01);
-    const int64_t i02 = (tgpig - i03*ne02*ne01) / ne01;
-    const int64_t i01 = (tgpig - i03*ne02*ne01 - i02*ne01);
-
-    device const float4 * psrc4 =                (device const float4 *)(src0 + i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00);
-    device const float4 * pmask = src1 != src0 ? (device const float4 *)(src1 +                                      i01*ne00) : nullptr;
-    device       float4 * pdst4 =                (device       float4 *)(dst  + i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00);
-
-    // parallel max
-    float4 lmax4 = -INFINITY;
-
-    for (int i00 = tpitg; i00 < ne00/4; i00 += ntg) {
-        lmax4 = fmax(lmax4, psrc4[i00]*scale + (pmask ? pmask[i00] : 0.0f));
-    }
-
-    const float lmax = MAX(MAX(lmax4[0], lmax4[1]), MAX(lmax4[2], lmax4[3]));
-
-    float max_val = simd_max(lmax);
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = -INFINITY;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = max_val;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        max_val = buf[tiisg];
-        max_val = simd_max(max_val);
-    }
-
-    // parallel sum
-    float4 lsum4 = 0.0f;
-    for (int i00 = tpitg; i00 < ne00/4; i00 += ntg) {
-        const float4 exp_psrc4 = exp((psrc4[i00]*scale + (pmask ? pmask[i00] : 0.0f)) - max_val);
-        lsum4 += exp_psrc4;
-        pdst4[i00] = exp_psrc4;
-    }
-
-    const float lsum = lsum4[0] + lsum4[1] + lsum4[2] + lsum4[3];
-
-    // This barrier fixes a failing test
-    // ref: https://github.com/ggerganov/ggml/pull/621#discussion_r1425156335
-    threadgroup_barrier(mem_flags::mem_none);
-
-    float sum = simd_sum(lsum);
-
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = 0.0f;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = sum;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        sum = buf[tiisg];
-        sum = simd_sum(sum);
-    }
-
-    const float inv_sum = 1.0f/sum;
-
-    for (int i00 = tpitg; i00 < ne00/4; i00 += ntg) {
-        pdst4[i00] *= inv_sum;
-    }
-}
-
-kernel void kernel_diag_mask_inf(
-        device const float * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant       int & n_past,
-        uint3 tpig[[thread_position_in_grid]]) {
-    const int64_t i02 = tpig[2];
-    const int64_t i01 = tpig[1];
-    const int64_t i00 = tpig[0];
-
-    if (i00 > n_past + i01) {
-        dst[i02*ne01*ne00 + i01*ne00 + i00] = -INFINITY;
-    } else {
-        dst[i02*ne01*ne00 + i01*ne00 + i00] = src0[i02*ne01*ne00 + i01*ne00 + i00];
-    }
-}
-
-kernel void kernel_diag_mask_inf_8(
-        device const float4 * src0,
-        device       float4 * dst,
-        constant    int64_t & ne00,
-        constant    int64_t & ne01,
-        constant        int & n_past,
-        uint3 tpig[[thread_position_in_grid]]) {
-
-    const int64_t i = 2*tpig[0];
-
-    dst[i+0] = src0[i+0];
-    dst[i+1] = src0[i+1];
-    int64_t i4 = 4*i;
-    const int64_t i02 = i4/(ne00*ne01); i4 -= i02*ne00*ne01;
-    const int64_t i01 = i4/(ne00);      i4 -= i01*ne00;
-    const int64_t i00 = i4;
-    for (int k = 3; k >= 0; --k) {
-        if (i00 + 4 + k <= n_past + i01) {
-            break;
-        }
-        dst[i+1][k] = -INFINITY;
-        if (i00 + k > n_past + i01) {
-            dst[i][k] = -INFINITY;
-        }
-    }
-}
-
-kernel void kernel_norm(
-        device const  void * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant     float & eps,
-        threadgroup float  * sum [[threadgroup(0)]],
-        uint tgpig[[threadgroup_position_in_grid]],
-        uint tpitg[[thread_position_in_threadgroup]],
-        uint   ntg[[threads_per_threadgroup]]) {
-    device const float * x = (device const float *) ((device const char *) src0 + tgpig*nb01);
-    // MEAN
-    // parallel sum
-    sum[tpitg] = 0.0f;
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        sum[tpitg] += x[i00];
-    }
-    // reduce
-    threadgroup_barrier(mem_flags::mem_threadgroup);
-    for (uint i = ntg/2; i > 0; i /= 2) {
-        if (tpitg < i) {
-            sum[tpitg] += sum[tpitg + i];
-        }
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-    }
-    const float mean  = sum[0] / ne00;
-
-    // recenter and VARIANCE
-    threadgroup_barrier(mem_flags::mem_threadgroup);
-    device float * y = dst + tgpig*ne00;
-    sum[tpitg] = 0.0f;
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        y[i00] = x[i00] - mean;
-        sum[tpitg] += y[i00] * y[i00];
-    }
-
-    // reduce
-    threadgroup_barrier(mem_flags::mem_threadgroup);
-    for (uint i = ntg/2; i > 0; i /= 2) {
-        if (tpitg < i) {
-            sum[tpitg] += sum[tpitg + i];
-        }
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-    }
-    const float variance = sum[0] / ne00;
-
-    const float scale = 1.0f/sqrt(variance + eps);
-    for (int i00 = tpitg; i00 < ne00; i00 += ntg) {
-        y[i00] = y[i00] * scale;
-    }
-}
-
-kernel void kernel_rms_norm(
-        device const  void * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant     float & eps,
-        threadgroup float  * buf [[threadgroup(0)]],
-        uint tgpig[[threadgroup_position_in_grid]],
-        uint tpitg[[thread_position_in_threadgroup]],
-        uint sgitg[[simdgroup_index_in_threadgroup]],
-        uint tiisg[[thread_index_in_simdgroup]],
-        uint   ntg[[threads_per_threadgroup]]) {
-    device const float4 * x = (device const float4 *) ((device const char *) src0 + tgpig*nb01);
-
-    float4 sumf = 0;
-    float all_sum = 0;
-
-    // parallel sum
-    for (int i00 = tpitg; i00 < ne00/4; i00 += ntg) {
-        sumf += x[i00] * x[i00];
-    }
-    all_sum = sumf[0] + sumf[1] + sumf[2] + sumf[3];
-    all_sum = simd_sum(all_sum);
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = 0.0f;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = all_sum;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        all_sum = buf[tiisg];
-        all_sum = simd_sum(all_sum);
-    }
-
-    const float mean  = all_sum/ne00;
-    const float scale = 1.0f/sqrt(mean + eps);
-
-    device float4 * y = (device float4 *) (dst + tgpig*ne00);
-    for (int i00 = tpitg; i00 < ne00/4; i00 += ntg) {
-        y[i00] = x[i00] * scale;
-    }
-}
-
-kernel void kernel_group_norm(
-        device const float * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int32_t & n_groups,
-        constant     float & eps,
-        threadgroup float  * buf [[threadgroup(0)]],
-        uint tgpig[[threadgroup_position_in_grid]],
-        uint tpitg[[thread_position_in_threadgroup]],
-        uint sgitg[[simdgroup_index_in_threadgroup]],
-        uint tiisg[[thread_index_in_simdgroup]],
-        uint   ntg[[threads_per_threadgroup]]) {
-    const int64_t ne = ne00*ne01*ne02;
-    const int64_t gs = ne00*ne01*((ne02 + n_groups - 1) / n_groups);
-
-    int start = tgpig * gs;
-    int end   = start + gs;
-
-    start += tpitg;
-
-    if (end >= ne) {
-        end = ne;
-    }
-
-    float tmp = 0.0f; // partial sum for thread in warp
-
-    for (int j = start; j < end; j += ntg) {
-        tmp += src0[j];
-    }
-
-    threadgroup_barrier(mem_flags::mem_threadgroup);
-    tmp = simd_sum(tmp);
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = 0.0f;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = tmp;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        tmp = buf[tiisg];
-        tmp = simd_sum(tmp);
-    }
-
-    const float mean = tmp / gs;
-    tmp = 0.0f;
-
-    for (int j = start; j < end; j += ntg) {
-        float xi = src0[j] - mean;
-        dst[j] = xi;
-        tmp += xi * xi;
-    }
-
-    tmp = simd_sum(tmp);
-    if (ntg > N_SIMDWIDTH) {
-        if (sgitg == 0) {
-            buf[tiisg] = 0.0f;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        if (tiisg == 0) {
-            buf[sgitg] = tmp;
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        tmp = buf[tiisg];
-        tmp = simd_sum(tmp);
-    }
-
-    const float variance = tmp / gs;
-    const float scale = 1.0f/sqrt(variance + eps);
-    for (int j = start; j < end; j += ntg) {
-        dst[j] *= scale;
-    }
-}
-
-// function for calculate inner product between half a q4_0 block and 16 floats (yl), sumy is SUM(yl[i])
-// il indicates where the q4 quants begin (0 or QK4_0/4)
-// we assume that the yl's have been multiplied with the appropriate scale factor
-// that corresponds to the missing bit shifts (1, 1/16, 1/256, 1/4096)
-inline float block_q_n_dot_y(device const block_q4_0 * qb_curr, float sumy, thread float * yl, int il) {
-    float d = qb_curr->d;
-
-    float2 acc = 0.f;
-
-    device const uint16_t * qs = ((device const uint16_t *)qb_curr + 1 + il/2);
-
-    for (int i = 0; i < 8; i+=2) {
-        acc[0] += yl[i + 0] * (qs[i / 2] & 0x000F)
-                + yl[i + 1] * (qs[i / 2] & 0x0F00);
-        acc[1] += yl[i + 8] * (qs[i / 2] & 0x00F0)
-                + yl[i + 9] * (qs[i / 2] & 0xF000);
-    }
-    return d * (sumy * -8.f + acc[0] + acc[1]);
-}
-
-// function for calculate inner product between half a q4_1 block and 16 floats (yl), sumy is SUM(yl[i])
-// il indicates where the q4 quants begin (0 or QK4_0/4)
-// we assume that the yl's have been multiplied with the appropriate scale factor
-// that corresponds to the missing bit shifts (1, 1/16, 1/256, 1/4096)
-inline float block_q_n_dot_y(device const block_q4_1 * qb_curr, float sumy, thread float * yl, int il) {
-    float d = qb_curr->d;
-    float m = qb_curr->m;
-
-    float2 acc = 0.f;
-
-    device const uint16_t * qs = ((device const uint16_t *)qb_curr + 2 + il/2);
-
-    for (int i = 0; i < 8; i+=2) {
-        acc[0] += yl[i + 0] * (qs[i / 2] & 0x000F)
-                + yl[i + 1] * (qs[i / 2] & 0x0F00);
-        acc[1] += yl[i + 8] * (qs[i / 2] & 0x00F0)
-                + yl[i + 9] * (qs[i / 2] & 0xF000);
-    }
-    return d * (acc[0] + acc[1]) + sumy * m;
-}
-
-// function for calculate inner product between half a q5_0 block and 16 floats (yl), sumy is SUM(yl[i])
-// il indicates where the q5 quants begin (0 or QK5_0/4)
-// we assume that the yl's have been multiplied with the appropriate scale factor
-// that corresponds to the missing bit shifts (1, 1/16, 1/256, 1/4096)
-inline float block_q_n_dot_y(device const block_q5_0 * qb_curr, float sumy, thread float * yl, int il) {
-    float d = qb_curr->d;
-
-    float2 acc = 0.f;
-
-    device const uint16_t * qs =  ((device const uint16_t *)qb_curr + 3 + il/2);
-           const uint32_t   qh = *((device const uint32_t *)qb_curr->qh);
-
-    for (int i = 0; i < 8; i+=2) {
-        acc[0] += yl[i + 0] * ((qs[i / 2] & 0x000F) | ((qh >> (i+0+il        ) << 4 ) & 0x00010))
-                + yl[i + 1] * ((qs[i / 2] & 0x0F00) | ((qh >> (i+1+il        ) << 12) & 0x01000));
-        acc[1] += yl[i + 8] * ((qs[i / 2] & 0x00F0) | ((qh >> (i+0+il+QK5_0/2) << 8 ) & 0x00100))
-                + yl[i + 9] * ((qs[i / 2] & 0xF000) | ((qh >> (i+1+il+QK5_0/2) << 16) & 0x10000));
-    }
-    return d * (sumy * -16.f + acc[0] + acc[1]);
-}
-
-// function for calculate inner product between half a q5_1 block and 16 floats (yl), sumy is SUM(yl[i])
-// il indicates where the q5 quants begin (0 or QK5_1/4)
-// we assume that the yl's have been multiplied with the appropriate scale factor
-// that corresponds to the missing bit shifts (1, 1/16, 1/256, 1/4096)
-inline float block_q_n_dot_y(device const block_q5_1 * qb_curr, float sumy, thread float * yl, int il) {
-    float d = qb_curr->d;
-    float m = qb_curr->m;
-
-    float2 acc = 0.f;
-
-    device const uint16_t * qs =  ((device const uint16_t *)qb_curr + 4 + il/2);
-           const uint32_t   qh = *((device const uint32_t *)qb_curr->qh);
-
-    for (int i = 0; i < 8; i+=2) {
-        acc[0] += yl[i + 0] * ((qs[i / 2] & 0x000F) | ((qh >> (i+0+il        ) << 4 ) & 0x00010))
-                + yl[i + 1] * ((qs[i / 2] & 0x0F00) | ((qh >> (i+1+il        ) << 12) & 0x01000));
-        acc[1] += yl[i + 8] * ((qs[i / 2] & 0x00F0) | ((qh >> (i+0+il+QK5_0/2) << 8 ) & 0x00100))
-                + yl[i + 9] * ((qs[i / 2] & 0xF000) | ((qh >> (i+1+il+QK5_0/2) << 16) & 0x10000));
-    }
-    return d * (acc[0] + acc[1]) + sumy * m;
-}
-
-// putting them in the kernel cause a significant performance penalty
-#define N_DST 4        // each SIMD group works on 4 rows
-#define N_SIMDGROUP 2  // number of SIMD groups in a thread group
-//Note: This is a template, but strictly speaking it only applies to
-//      quantizations where the block size is 32. It also does not
-//      guard against the number of rows not being divisible by
-//      N_DST, so this is another explicit assumption of the implementation.
-template<typename block_q_type, int nr, int nsg, int nw>
-void mul_vec_q_n_f32_impl(
-        device const void  * src0,
-        device const float * src1,
-        device       float * dst,
-                   int64_t   ne00,
-                   int64_t   ne01,
-                   int64_t   ne02,
-                   int64_t   ne10,
-                   int64_t   ne12,
-                   int64_t   ne0,
-                   int64_t   ne1,
-                   uint      r2,
-                   uint      r3,
-                   uint3 tgpig, uint tiisg, uint sgitg) {
-    const int nb = ne00/QK4_0;
-
-    const int r0 = tgpig.x;
-    const int r1 = tgpig.y;
-    const int im = tgpig.z;
-
-    const int first_row = (r0 * nsg + sgitg) * nr;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = first_row * nb + (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q_type * x = (device const block_q_type *) src0 + offset0;
-    device const float        * y = (device const float        *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[16]; // src1 vector cache
-    float sumf[nr] = {0.f};
-
-    const int ix = (tiisg/2);
-    const int il = (tiisg%2)*8;
-
-    device const float * yb = y + ix * QK4_0 + il;
-
-    // each thread in a SIMD group deals with half a block.
-    for (int ib = ix; ib < nb; ib += nw/2) {
-        float sumy = 0;
-        for (int i = 0; i < 8; i += 2) {
-            sumy += yb[i] + yb[i+1];
-            yl[i+0] = yb[i+ 0];
-            yl[i+1] = yb[i+ 1]/256.f;
-
-            sumy += yb[i+16] + yb[i+17];
-            yl[i+8] = yb[i+16]/16.f;
-            yl[i+9] = yb[i+17]/4096.f;
-        }
-
-        for (int row = 0; row < nr; row++) {
-            sumf[row] += block_q_n_dot_y(x+ib+row*nb, sumy, yl, il);
-        }
-
-        yb += QK4_0 * 16;
-    }
-
-    for (int row = 0; row < nr; ++row) {
-        const float tot = simd_sum(sumf[row]);
-        if (tiisg == 0 && first_row + row < ne01) {
-            dst[im*ne0*ne1 + r1*ne0 + first_row + row] = tot;
-        }
-    }
-}
-
-kernel void kernel_mul_mv_q4_0_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-    mul_vec_q_n_f32_impl<block_q4_0, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(src0,src1,dst,ne00,ne01,ne02,ne10,ne12,ne0,ne1,r2,r3,tgpig,tiisg,sgitg);
-}
-
-kernel void kernel_mul_mv_q4_1_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint tiisg[[thread_index_in_simdgroup]],
-        uint sgitg[[simdgroup_index_in_threadgroup]]) {
-     mul_vec_q_n_f32_impl<block_q4_1, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(src0,src1,dst,ne00,ne01,ne02,ne10,ne12,ne0,ne1,r2,r3,tgpig,tiisg,sgitg);
-}
-
-kernel void kernel_mul_mv_q5_0_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-    mul_vec_q_n_f32_impl<block_q5_0, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(src0,src1,dst,ne00,ne01,ne02,ne10,ne12,ne0,ne1,r2,r3,tgpig,tiisg,sgitg);
-}
-
-kernel void kernel_mul_mv_q5_1_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-    mul_vec_q_n_f32_impl<block_q5_1, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(src0,src1,dst,ne00,ne01,ne02,ne10,ne12,ne0,ne1,r2,r3,tgpig,tiisg,sgitg);
-}
-
-
-#define NB_Q8_0 8
-
-void kernel_mul_mv_q8_0_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-    const int nr  = N_DST;
-    const int nsg = N_SIMDGROUP;
-    const int nw  = N_SIMDWIDTH;
-
-    const int nb = ne00/QK8_0;
-    const int r0 = tgpig.x;
-    const int r1 = tgpig.y;
-    const int im = tgpig.z;
-
-    const int first_row = (r0 * nsg + sgitg) * nr;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = first_row * nb + (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q8_0 * x = (device const block_q8_0 *) src0 + offset0;
-    device const float      * y = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[NB_Q8_0];
-    float sumf[nr]={0.f};
-
-    const int ix = tiisg/4;
-    const int il = tiisg%4;
-
-    device const float * yb = y + ix * QK8_0 + NB_Q8_0*il;
-
-    // each thread in a SIMD group deals with NB_Q8_0 quants at a time
-    for (int ib = ix; ib < nb; ib += nw/4) {
-        for (int i = 0; i < NB_Q8_0; ++i) {
-            yl[i] = yb[i];
-        }
-
-        for (int row = 0; row < nr; row++) {
-            device const int8_t * qs = x[ib+row*nb].qs + NB_Q8_0*il;
-            float sumq = 0.f;
-            for (int iq = 0; iq < NB_Q8_0; ++iq) {
-                sumq += qs[iq] * yl[iq];
-            }
-            sumf[row] += sumq*x[ib+row*nb].d;
-        }
-
-        yb += NB_Q8_0 * nw;
-    }
-
-    for (int row = 0; row < nr; ++row) {
-        const float tot = simd_sum(sumf[row]);
-        if (tiisg == 0 && first_row + row < ne01) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = tot;
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_q8_0_f32")]]
-kernel void kernel_mul_mv_q8_0_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-    kernel_mul_mv_q8_0_f32_impl(src0,src1,dst,ne00,ne01,ne02,ne10,ne12,ne0,ne1,r2,r3,tgpig,tiisg,sgitg);
-}
-
-#define N_F32_F32 4
-
-void kernel_mul_mv_f32_f32_impl(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]]) {
-
-    const int64_t r0 = tgpig.x;
-    const int64_t rb = tgpig.y*N_F32_F32;
-    const int64_t im = tgpig.z;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = r0*nb01 + (i12/r2)*nb02 + (i13/r3)*nb02*ne02;
-
-    device const float * x = (device const float *) (src0 + offset0);
-
-    if (ne00 < 128) {
-        for (int row = 0; row < N_F32_F32; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const float * y = (device const float *) (src1 + r1*nb11 + im*nb12);
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00; i += 32) {
-                sumf += (float) x[i] * (float) y[i];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    } else {
-        device const float4 * x4 = (device const float4 *)x;
-        for (int row = 0; row < N_F32_F32; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const float  * y  = (device const float  *) (src1 + r1*nb11 + im*nb12);
-            device const float4 * y4 = (device const float4 *) y;
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00/4; i += 32) {
-                for (int k = 0; k < 4; ++k) sumf += (float) x4[i][k] * y4[i][k];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                for (int i = 4*(ne00/4); i < ne00; ++i) all_sum += (float) x[i] * y[i];
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_f32_f32")]]
-kernel void kernel_mul_mv_f32_f32(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]]) {
-    kernel_mul_mv_f32_f32_impl(src0, src1, dst, ne00, ne01, ne02, nb00, nb01, nb02, ne10, ne11, ne12, nb10, nb11, nb12, ne0, ne1, r2, r3, tgpig, tiisg);
-}
-
-#define N_F16_F16 4
-
-kernel void kernel_mul_mv_f16_f16(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]]) {
-
-    const int64_t r0 = tgpig.x;
-    const int64_t rb = tgpig.y*N_F16_F16;
-    const int64_t im = tgpig.z;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = r0*nb01 + (i12/r2)*nb02 + (i13/r3)*nb02*ne02;
-
-    device const half * x = (device const half *) (src0 + offset0);
-
-    if (ne00 < 128) {
-        for (int row = 0; row < N_F16_F16; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const half * y = (device const half *) (src1 + r1*nb11 + im*nb12);
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00; i += 32) {
-                sumf += (half) x[i] * (half) y[i];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    } else {
-        device const half4 * x4 = (device const half4 *)x;
-        for (int row = 0; row < N_F16_F16; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const half  * y  = (device const half  *) (src1 + r1*nb11 + im*nb12);
-            device const half4 * y4 = (device const half4 *) y;
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00/4; i += 32) {
-                for (int k = 0; k < 4; ++k) sumf += (half) x4[i][k] * y4[i][k];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                for (int i = 4*(ne00/4); i < ne00; ++i) all_sum += (half) x[i] * y[i];
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    }
-}
-
-void kernel_mul_mv_f16_f32_1row_impl(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]]) {
-
-    const int64_t r0 = tgpig.x;
-    const int64_t r1 = tgpig.y;
-    const int64_t im = tgpig.z;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = r0*nb01 + (i12/r2)*nb02 + (i13/r3)*nb02*ne02;
-
-    device const half  * x = (device const half  *) (src0 + offset0);
-    device const float * y = (device const float *) (src1 + r1*nb11 + im*nb12);
-
-    float sumf = 0;
-    if (ne00 < 128) {
-        for (int i = tiisg; i < ne00; i += 32) {
-            sumf += (float) x[i] * (float) y[i];
-        }
-        float all_sum = simd_sum(sumf);
-        if (tiisg == 0) {
-            dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-        }
-    } else {
-        device const half4  * x4 = (device const half4  *) x;
-        device const float4 * y4 = (device const float4 *) y;
-        for (int i = tiisg; i < ne00/4; i += 32) {
-            for (int k = 0; k < 4; ++k) sumf += (float)x4[i][k] * y4[i][k];
-        }
-        float all_sum = simd_sum(sumf);
-        if (tiisg == 0) {
-            for (int i = 4*(ne00/4); i < ne00; ++i) all_sum += (float) x[i] * y[i];
-            dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_f16_f32_1row")]]
-kernel void kernel_mul_mv_f16_f32_1row(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]]) {
-    kernel_mul_mv_f16_f32_1row_impl(src0, src1, dst, ne00, ne01, ne02, nb00, nb01, nb02, ne10, ne11, ne12, nb10, nb11, nb12, ne0, ne1, r2, r3, tgpig, tiisg);
-}
-
-#define N_F16_F32 4
-
-void kernel_mul_mv_f16_f32_impl(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint tiisg[[thread_index_in_simdgroup]]) {
-
-    const int64_t r0 = tgpig.x;
-    const int64_t rb = tgpig.y*N_F16_F32;
-    const int64_t im = tgpig.z;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = r0*nb01 + (i12/r2)*nb02 + (i13/r3)*nb02*ne02;
-
-    device const half * x = (device const half *) (src0 + offset0);
-
-    if (ne00 < 128) {
-        for (int row = 0; row < N_F16_F32; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const float * y = (device const float *) (src1 + r1*nb11 + im*nb12);
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00; i += 32) {
-                sumf += (float) x[i] * (float) y[i];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    } else {
-        device const half4 * x4 = (device const half4 *)x;
-        for (int row = 0; row < N_F16_F32; ++row) {
-            int r1 = rb + row;
-            if (r1 >= ne11) {
-                break;
-            }
-
-            device const float  * y  = (device const float  *) (src1 + r1*nb11 + im*nb12);
-            device const float4 * y4 = (device const float4 *) y;
-
-            float sumf = 0;
-            for (int i = tiisg; i < ne00/4; i += 32) {
-                for (int k = 0; k < 4; ++k) sumf += (float) x4[i][k] * y4[i][k];
-            }
-
-            float all_sum = simd_sum(sumf);
-            if (tiisg == 0) {
-                for (int i = 4*(ne00/4); i < ne00; ++i) all_sum += (float) x[i] * y[i];
-                dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-            }
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_f16_f32")]]
-kernel void kernel_mul_mv_f16_f32(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint tiisg[[thread_index_in_simdgroup]]) {
-    kernel_mul_mv_f16_f32_impl(src0, src1, dst, ne00, ne01, ne02, nb00, nb01, nb02, ne10, ne11, ne12, nb10, nb11, nb12, ne0, ne1, r2, r3, tgpig, tiisg);
-}
-
-// Assumes row size (ne00) is a multiple of 4
-kernel void kernel_mul_mv_f16_f32_l4(
-        device const  char * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint tiisg[[thread_index_in_simdgroup]]) {
-
-    const int nrows = ne11;
-    const int64_t r0 = tgpig.x;
-    const int64_t im = tgpig.z;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = r0*nb01 + (i12/r2)*nb02 + (i13/r3)*nb02*ne02;
-
-    device const half4 * x4 = (device const half4 *) (src0 + offset0);
-
-    for (int r1 = 0; r1 < nrows; ++r1) {
-        device const float4 * y4 = (device const float4 *) (src1 + r1*nb11 + im*nb12);
-
-        float sumf = 0;
-        for (int i = tiisg; i < ne00/4; i += 32) {
-            for (int k = 0; k < 4; ++k) sumf += (float) x4[i][k] * y4[i][k];
-        }
-
-        float all_sum = simd_sum(sumf);
-        if (tiisg == 0) {
-            dst[im*ne1*ne0 + r1*ne0 + r0] = all_sum;
-        }
-    }
-}
-
-kernel void kernel_alibi_f32(
-        device const float * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        constant     float & m0,
-        constant     float & m1,
-        constant       int & n_heads_log2_floor,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-  //const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0);
-
-    const int64_t k = i3*ne3 + i2;
-
-    float m_k;
-    if (k < n_heads_log2_floor) {
-        m_k = pow(m0, k + 1);
-    } else {
-        m_k = pow(m1, 2 * (k - n_heads_log2_floor) + 1);
-    }
-
-    device       char * dst_row = (device char *) dst + i3*nb3 + i2*nb2 + i1*nb1;
-    device const char * src_row = (device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01;
-    for (int64_t i00 = tpitg.x; i00 < ne00; i00 += ntg.x) {
-        const  float   src_v = *(device float *)(src_row + i00*nb00);
-        device float * dst_v =  (device float *)(dst_row + i00*nb0);
-        *dst_v = i00 * m_k + src_v;
-    }
-}
-
-static float rope_yarn_ramp(const float low, const float high, const int i0) {
-    const float y = (i0 / 2 - low) / max(0.001f, high - low);
-    return 1.0f - min(1.0f, max(0.0f, y));
-}
-
-// YaRN algorithm based on LlamaYaRNScaledRotaryEmbedding.py from https://github.com/jquesnelle/yarn
-// MIT licensed. Copyright (c) 2023 Jeffrey Quesnelle and Bowen Peng.
-static void rope_yarn(
-    float theta_extrap, float freq_scale, float corr_dims[2], int64_t i0, float ext_factor, float mscale,
-    thread float * cos_theta, thread float * sin_theta
-) {
-    // Get n-d rotational scaling corrected for extrapolation
-    float theta_interp = freq_scale * theta_extrap;
-    float theta = theta_interp;
-    if (ext_factor != 0.0f) {
-        float ramp_mix = rope_yarn_ramp(corr_dims[0], corr_dims[1], i0) * ext_factor;
-        theta = theta_interp * (1 - ramp_mix) + theta_extrap * ramp_mix;
-
-        // Get n-d magnitude scaling corrected for interpolation
-        mscale *= 1.0f + 0.1f * log(1.0f / freq_scale);
-    }
-    *cos_theta = cos(theta) * mscale;
-    *sin_theta = sin(theta) * mscale;
-}
-
-// Apparently solving `n_rot = 2pi * x * base^((2 * max_pos_emb) / n_dims)` for x, we get
-// `corr_fac(n_rot) = n_dims * log(max_pos_emb / (n_rot * 2pi)) / (2 * log(base))`
-static float rope_yarn_corr_factor(int n_dims, int n_orig_ctx, float n_rot, float base) {
-    return n_dims * log(n_orig_ctx / (n_rot * 2 * M_PI_F)) / (2 * log(base));
-}
-
-static void rope_yarn_corr_dims(
-    int n_dims, int n_orig_ctx, float freq_base, float beta_fast, float beta_slow, float dims[2]
-) {
-    // start and end correction dims
-    dims[0] = max(0.0f,         floor(rope_yarn_corr_factor(n_dims, n_orig_ctx, beta_fast, freq_base)));
-    dims[1] = min(n_dims - 1.0f, ceil(rope_yarn_corr_factor(n_dims, n_orig_ctx, beta_slow, freq_base)));
-}
-
-typedef void (rope_t)(
-        device const    void * src0,
-        device const int32_t * src1,
-        device         float * dst,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant     int64_t & ne03,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant    uint64_t & nb03,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant     int64_t & ne2,
-        constant     int64_t & ne3,
-        constant    uint64_t & nb0,
-        constant    uint64_t & nb1,
-        constant    uint64_t & nb2,
-        constant    uint64_t & nb3,
-        constant         int & n_past,
-        constant         int & n_dims,
-        constant         int & mode,
-        constant         int & n_orig_ctx,
-        constant       float & freq_base,
-        constant       float & freq_scale,
-        constant       float & ext_factor,
-        constant       float & attn_factor,
-        constant       float & beta_fast,
-        constant       float & beta_slow,
-        uint  tiitg[[thread_index_in_threadgroup]],
-        uint3 tptg[[threads_per_threadgroup]],
-        uint3 tgpig[[threadgroup_position_in_grid]]);
-
-template<typename T>
-kernel void kernel_rope(
-        device const    void * src0,
-        device const int32_t * src1,
-        device         float * dst,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant     int64_t & ne03,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant    uint64_t & nb03,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant     int64_t & ne2,
-        constant     int64_t & ne3,
-        constant    uint64_t & nb0,
-        constant    uint64_t & nb1,
-        constant    uint64_t & nb2,
-        constant    uint64_t & nb3,
-        constant         int & n_past,
-        constant         int & n_dims,
-        constant         int & mode,
-        constant         int & n_orig_ctx,
-        constant       float & freq_base,
-        constant       float & freq_scale,
-        constant       float & ext_factor,
-        constant       float & attn_factor,
-        constant       float & beta_fast,
-        constant       float & beta_slow,
-        uint  tiitg[[thread_index_in_threadgroup]],
-        uint3 tptg[[threads_per_threadgroup]],
-        uint3 tgpig[[threadgroup_position_in_grid]]) {
-    const int64_t i3 = tgpig[2];
-    const int64_t i2 = tgpig[1];
-    const int64_t i1 = tgpig[0];
-
-    const bool is_neox = mode & 2;
-
-    float corr_dims[2];
-    rope_yarn_corr_dims(n_dims, n_orig_ctx, freq_base, beta_fast, beta_slow, corr_dims);
-
-    device const int32_t * pos = src1;
-
-    const int64_t p = pos[i2];
-
-    const float theta_0 = (float)p;
-    const float inv_ndims = -1.f/n_dims;
-
-    if (!is_neox) {
-        for (int64_t i0 = 2*tiitg; i0 < ne0; i0 += 2*tptg.x) {
-
-            const float theta = theta_0 * pow(freq_base, inv_ndims*i0);
-            float cos_theta, sin_theta;
-            rope_yarn(theta, freq_scale, corr_dims, i0, ext_factor, attn_factor, &cos_theta, &sin_theta);
-
-            device const T * const src = (device T *)((device char *) src0 + i3*nb03 + i2*nb02 + i1*nb01 + i0*nb00);
-            device       T * dst_data  = (device T *)((device char *)  dst + i3*nb3  + i2*nb2  + i1*nb1  + i0*nb0);
-
-            const T x0 = src[0];
-            const T x1 = src[1];
-
-            dst_data[0] = x0*cos_theta - x1*sin_theta;
-            dst_data[1] = x0*sin_theta + x1*cos_theta;
-        }
-    } else {
-        for (int64_t ic = 2*tiitg; ic < ne0; ic += 2*tptg.x) {
-            if (ic < n_dims) {
-                const int64_t ib = 0;
-
-                // simplified from `(ib * n_dims + ic) * inv_ndims`
-                const float cur_rot = inv_ndims*ic - ib;
-
-                const float theta = theta_0 * pow(freq_base, cur_rot);
-                float cos_theta, sin_theta;
-                rope_yarn(theta, freq_scale, corr_dims, cur_rot, ext_factor, attn_factor, &cos_theta, &sin_theta);
-
-                const int64_t i0 = ib*n_dims + ic/2;
-
-                device const T * const src = (device T *)((device char *) src0 + i3*nb03 + i2*nb02 + i1*nb01 + i0*nb00);
-                device       T * dst_data  = (device T *)((device char *)  dst + i3*nb3  + i2*nb2  + i1*nb1  + i0*nb0);
-
-                const float x0 = src[0];
-                const float x1 = src[n_dims/2];
-
-                dst_data[0]        = x0*cos_theta - x1*sin_theta;
-                dst_data[n_dims/2] = x0*sin_theta + x1*cos_theta;
-            } else {
-                const int64_t i0 = ic;
-
-                device const T * const src = (device T *)((device char *) src0 + i3*nb03 + i2*nb02 + i1*nb01 + i0*nb00);
-                device       T * dst_data  = (device T *)((device char *)  dst + i3*nb3  + i2*nb2  + i1*nb1  + i0*nb0);
-
-                dst_data[0] = src[0];
-                dst_data[1] = src[1];
-            }
-        }
-    }
-}
-
-template [[host_name("kernel_rope_f32")]] kernel rope_t kernel_rope<float>;
-template [[host_name("kernel_rope_f16")]] kernel rope_t kernel_rope<half>;
-
-kernel void kernel_im2col_f16(
-        device const float * x,
-        device       half * dst,
-        constant   int32_t & ofs0,
-        constant   int32_t & ofs1,
-        constant   int32_t & IW,
-        constant   int32_t & IH,
-        constant   int32_t & CHW,
-        constant   int32_t & s0,
-        constant   int32_t & s1,
-        constant   int32_t & p0,
-        constant   int32_t & p1,
-        constant   int32_t & d0,
-        constant   int32_t & d1,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3  tgpg[[threadgroups_per_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int32_t iiw = tgpig[2] * s0 + tpitg[2] * d0 - p0;
-    const int32_t iih = tgpig[1] * s1 + tpitg[1] * d1 - p1;
-
-    const int32_t offset_dst =
-        (tpitg[0] * tgpg[1] * tgpg[2] + tgpig[1] * tgpg[2] + tgpig[2]) * CHW +
-        (tgpig[0] * (ntg[1] * ntg[2]) + tpitg[1] * ntg[2] + tpitg[2]);
-
-    if (iih < 0 || iih >= IH || iiw < 0 || iiw >= IW) {
-        dst[offset_dst] = 0.0f;
-    } else {
-        const int32_t offset_src = tpitg[0] * ofs0 + tgpig[0] * ofs1;
-        dst[offset_dst] = x[offset_src + iih * IW + iiw];
-    }
-}
-
-kernel void kernel_upscale_f32(
-    device  const char * src0,
-    device        char * dst,
-    constant   int64_t & ne00,
-    constant   int64_t & ne01,
-    constant   int64_t & ne02,
-    constant   int64_t & ne03,
-    constant  uint64_t & nb00,
-    constant  uint64_t & nb01,
-    constant  uint64_t & nb02,
-    constant  uint64_t & nb03,
-    constant   int64_t & ne0,
-    constant   int64_t & ne1,
-    constant   int64_t & ne2,
-    constant   int64_t & ne3,
-    constant  uint64_t & nb0,
-    constant  uint64_t & nb1,
-    constant  uint64_t & nb2,
-    constant  uint64_t & nb3,
-    constant   int32_t & sf,
-    uint3 tgpig[[threadgroup_position_in_grid]],
-    uint3 tpitg[[thread_position_in_threadgroup]],
-    uint3   ntg[[threads_per_threadgroup]]) {
-
-    const int64_t i3 = tgpig.z;
-    const int64_t i2 = tgpig.y;
-    const int64_t i1 = tgpig.x;
-
-    const int64_t i03 = i3;
-    const int64_t i02 = i2;
-    const int64_t i01 = i1/sf;
-
-    device const float * src0_ptr = (device const float *) (src0 + i03*nb03 + i02*nb02 + i01*nb01);
-    device       float * dst_ptr  = (device       float *) (dst  +  i3*nb3  +  i2*nb2  +  i1*nb1);
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        dst_ptr[i0] = src0_ptr[i0/sf];
-    }
-}
-
-kernel void kernel_pad_f32(
-    device  const char * src0,
-    device        char * dst,
-    constant   int64_t & ne00,
-    constant   int64_t & ne01,
-    constant   int64_t & ne02,
-    constant   int64_t & ne03,
-    constant  uint64_t & nb00,
-    constant  uint64_t & nb01,
-    constant  uint64_t & nb02,
-    constant  uint64_t & nb03,
-    constant   int64_t & ne0,
-    constant   int64_t & ne1,
-    constant   int64_t & ne2,
-    constant   int64_t & ne3,
-    constant  uint64_t & nb0,
-    constant  uint64_t & nb1,
-    constant  uint64_t & nb2,
-    constant  uint64_t & nb3,
-    uint3 tgpig[[threadgroup_position_in_grid]],
-    uint3 tpitg[[thread_position_in_threadgroup]],
-    uint3   ntg[[threads_per_threadgroup]]) {
-
-    const int64_t i3 = tgpig.z;
-    const int64_t i2 = tgpig.y;
-    const int64_t i1 = tgpig.x;
-
-    const int64_t i03 = i3;
-    const int64_t i02 = i2;
-    const int64_t i01 = i1;
-
-    device const float * src0_ptr = (device const float *) (src0 + i03*nb03 + i02*nb02 + i01*nb01);
-    device       float * dst_ptr  = (device       float *) (dst  +  i3*nb3  +  i2*nb2  +  i1*nb1);
-
-    if (i1 < ne01 && i2 < ne02 && i3 < ne03) {
-        for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-            if (i0 < ne00) {
-                dst_ptr[i0] = src0_ptr[i0];
-            } else {
-                dst_ptr[i0] = 0.0f;
-            }
-        }
-
-        return;
-    }
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        dst_ptr[i0] = 0.0f;
-    }
-}
-
-// bitonic sort implementation following the CUDA kernels as reference
-typedef void (argsort_t)(
-        device const float * x,
-        device     int32_t * dst,
-        constant   int64_t & ncols,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]]);
-
-template<ggml_sort_order order>
-kernel void kernel_argsort_f32_i32(
-        device const float   * x,
-        device       int32_t * dst,
-        constant     int64_t & ncols,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]]) {
-    // bitonic sort
-    int col = tpitg[0];
-    int row = tgpig[1];
-
-    if (col >= ncols) return;
-
-    device const float   * x_row   = x   + row * ncols;
-    device       int32_t * dst_row = dst + row * ncols;
-
-    // initialize indices
-    if (col < ncols) {
-        dst_row[col] = col;
-    }
-    threadgroup_barrier(mem_flags::mem_threadgroup);
-
-    for (int k = 2; k <= ncols; k *= 2) {
-        for (int j = k / 2; j > 0; j /= 2) {
-            int ixj = col ^ j;
-            if (ixj > col) {
-                if ((col & k) == 0) {
-                    if (order == GGML_SORT_ASC ? x_row[dst_row[col]] > x_row[dst_row[ixj]] : x_row[dst_row[col]] < x_row[dst_row[ixj]]) {
-                        SWAP(dst_row[col], dst_row[ixj]);
-                    }
-                } else {
-                    if (order == GGML_SORT_ASC ? x_row[dst_row[col]] < x_row[dst_row[ixj]] : x_row[dst_row[col]] > x_row[dst_row[ixj]]) {
-                        SWAP(dst_row[col], dst_row[ixj]);
-                    }
-                }
-            }
-            threadgroup_barrier(mem_flags::mem_threadgroup);
-        }
-    }
-}
-
-template [[host_name("kernel_argsort_f32_i32_asc")]]  kernel argsort_t kernel_argsort_f32_i32<GGML_SORT_ASC>;
-template [[host_name("kernel_argsort_f32_i32_desc")]] kernel argsort_t kernel_argsort_f32_i32<GGML_SORT_DESC>;
-
-kernel void kernel_leaky_relu_f32(
-        device const float * src0,
-        device       float * dst,
-        constant     float & slope,
-        uint tpig[[thread_position_in_grid]]) {
-    dst[tpig] = src0[tpig] > 0.0f ? src0[tpig] : src0[tpig] * slope;
-}
-
-kernel void kernel_cpy_f16_f16(
-        device  const half * src0,
-        device        half * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0);
-
-    device half * dst_data = (device half *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x; i00 < ne00; i00 += ntg.x) {
-        device const half * src = (device half *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-        dst_data[i00] = src[0];
-    }
-}
-
-kernel void kernel_cpy_f16_f32(
-        device  const half * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0);
-
-    device float * dst_data = (device float *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x; i00 < ne00; i00 += ntg.x) {
-        device const half * src = (device half *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-        dst_data[i00] = src[0];
-    }
-}
-
-kernel void kernel_cpy_f32_f16(
-        device const float * src0,
-        device        half * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0);
-
-    device half * dst_data = (device half *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x; i00 < ne00; i00 += ntg.x) {
-        device const float * src = (device float *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-
-        dst_data[i00] = src[0];
-    }
-}
-
-kernel void kernel_cpy_f32_f32(
-        device const float * src0,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0);
-
-    device float * dst_data = (device float *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x; i00 < ne00; i00 += ntg.x) {
-        device const float * src = (device float *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-
-        dst_data[i00] = src[0];
-    }
-}
-
-kernel void kernel_cpy_f32_q8_0(
-        device const float * src0,
-        device        void * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0)/QK8_0;
-
-    device block_q8_0 * dst_data = (device block_q8_0 *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x*QK8_0; i00 < ne00; i00 += ntg.x*QK8_0) {
-        device const float * src = (device float *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-
-        float amax = 0.0f; // absolute max
-
-        for (int j = 0; j < QK8_0; j++) {
-            const float v = src[j];
-            amax = MAX(amax, fabs(v));
-        }
-
-        const float d = amax / ((1 << 7) - 1);
-        const float id = d ? 1.0f/d : 0.0f;
-
-        dst_data[i00/QK8_0].d = d;
-
-        for (int j = 0; j < QK8_0; ++j) {
-            const float x0 = src[j]*id;
-
-            dst_data[i00/QK8_0].qs[j] = round(x0);
-        }
-    }
-}
-
-kernel void kernel_cpy_f32_q4_0(
-        device const float * src0,
-        device        void * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0)/QK4_0;
-
-    device block_q4_0 * dst_data = (device block_q4_0 *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x*QK4_0; i00 < ne00; i00 += ntg.x*QK4_0) {
-        device const float * src = (device float *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-
-        float amax = 0.0f; // absolute max
-        float max  = 0.0f;
-
-        for (int j = 0; j < QK4_0; j++) {
-            const float v = src[j];
-            if (amax < fabs(v)) {
-                amax = fabs(v);
-                max  = v;
-            }
-        }
-
-        const float d = max / -8;
-        const float id = d ? 1.0f/d : 0.0f;
-
-        dst_data[i00/QK4_0].d = d;
-
-        for (int j = 0; j < QK4_0/2; ++j) {
-            const float x0 = src[0       + j]*id;
-            const float x1 = src[QK4_0/2 + j]*id;
-
-            const uint8_t xi0 = MIN(15, (int8_t)(x0 + 8.5f));
-            const uint8_t xi1 = MIN(15, (int8_t)(x1 + 8.5f));
-
-            dst_data[i00/QK4_0].qs[j]  = xi0;
-            dst_data[i00/QK4_0].qs[j] |= xi1 << 4;
-        }
-    }
-}
-
-kernel void kernel_cpy_f32_q4_1(
-        device const float * src0,
-        device        void * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne03,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant  uint64_t & nb03,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   int64_t & ne2,
-        constant   int64_t & ne3,
-        constant  uint64_t & nb0,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        constant  uint64_t & nb3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint3 tpitg[[thread_position_in_threadgroup]],
-        uint3   ntg[[threads_per_threadgroup]]) {
-    const int64_t i03 = tgpig[2];
-    const int64_t i02 = tgpig[1];
-    const int64_t i01 = tgpig[0];
-
-    const int64_t n = i03*ne02*ne01*ne00 + i02*ne01*ne00 + i01*ne00;
-
-    const int64_t i3 = n / (ne2*ne1*ne0);
-    const int64_t i2 = (n - i3*ne2*ne1*ne0) / (ne1*ne0);
-    const int64_t i1 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0) / ne0;
-    const int64_t i0 = (n - i3*ne2*ne1*ne0 - i2*ne1*ne0 - i1*ne0)/QK4_1;
-
-    device block_q4_1 * dst_data = (device block_q4_1 *) ((device char *) dst + i3*nb3 + i2*nb2 + i1*nb1 + i0*nb0);
-
-    for (int64_t i00 = tpitg.x*QK4_1; i00 < ne00; i00 += ntg.x*QK4_1) {
-        device const float * src = (device float *)((device char *) src0 + i03*nb03 + i02*nb02 + i01*nb01 + i00*nb00);
-
-        float min = FLT_MAX;
-        float max = -FLT_MAX;
-
-        for (int j = 0; j < QK4_1; j++) {
-            const float v = src[j];
-            if (min > v) min = v;
-            if (max < v) max = v;
-        }
-
-        const float d = (max - min) / ((1 << 4) - 1);
-        const float id = d ? 1.0f/d : 0.0f;
-
-        dst_data[i00/QK4_1].d = d;
-        dst_data[i00/QK4_1].m = min;
-
-        for (int j = 0; j < QK4_1/2; ++j) {
-            const float x0 = (src[0       + j] - min)*id;
-            const float x1 = (src[QK4_1/2 + j] - min)*id;
-
-            const uint8_t xi0 = MIN(15, (int8_t)(x0 + 0.5f));
-            const uint8_t xi1 = MIN(15, (int8_t)(x1 + 0.5f));
-
-            dst_data[i00/QK4_1].qs[j]  = xi0;
-            dst_data[i00/QK4_1].qs[j] |= xi1 << 4;
-        }
-    }
-}
-
-kernel void kernel_concat(
-    device  const char * src0,
-    device  const char * src1,
-    device        char * dst,
-    constant   int64_t & ne00,
-    constant   int64_t & ne01,
-    constant   int64_t & ne02,
-    constant   int64_t & ne03,
-    constant  uint64_t & nb00,
-    constant  uint64_t & nb01,
-    constant  uint64_t & nb02,
-    constant  uint64_t & nb03,
-    constant   int64_t & ne10,
-    constant   int64_t & ne11,
-    constant   int64_t & ne12,
-    constant   int64_t & ne13,
-    constant  uint64_t & nb10,
-    constant  uint64_t & nb11,
-    constant  uint64_t & nb12,
-    constant  uint64_t & nb13,
-    constant   int64_t & ne0,
-    constant   int64_t & ne1,
-    constant   int64_t & ne2,
-    constant   int64_t & ne3,
-    constant  uint64_t & nb0,
-    constant  uint64_t & nb1,
-    constant  uint64_t & nb2,
-    constant  uint64_t & nb3,
-    uint3 tgpig[[threadgroup_position_in_grid]],
-    uint3 tpitg[[thread_position_in_threadgroup]],
-    uint3   ntg[[threads_per_threadgroup]]) {
-
-    const int64_t i03 = tgpig.z;
-    const int64_t i02 = tgpig.y;
-    const int64_t i01 = tgpig.x;
-
-    const int64_t i13 = i03 % ne13;
-    const int64_t i12 = i02 % ne12;
-    const int64_t i11 = i01 % ne11;
-
-    device const char * src0_ptr = src0 + i03*nb03 + i02*nb02 + i01*nb01 + tpitg.x*nb00;
-    device const char * src1_ptr = src1 + i13*nb13 + i12*nb12 + i11*nb11 + tpitg.x*nb10;
-    device       char * dst_ptr  = dst  + i03*nb3  + i02*nb2  + i01*nb1  + tpitg.x*nb0;
-
-    for (int i0 = tpitg.x; i0 < ne0; i0 += ntg.x) {
-        if (i02 < ne02) {
-            ((device float *)dst_ptr)[0] = ((device float *)src0_ptr)[0];
-            src0_ptr += ntg.x*nb00;
-        } else {
-            ((device float *)dst_ptr)[0] = ((device float *)src1_ptr)[0];
-            src1_ptr += ntg.x*nb10;
-        }
-        dst_ptr += ntg.x*nb0;
-    }
-}
-
-//============================================ k-quants ======================================================
-
-#ifndef QK_K
-#define QK_K 256
-#else
-static_assert(QK_K == 256 || QK_K == 64, "QK_K must be 256 or 64");
-#endif
-
-#if QK_K == 256
-#define K_SCALE_SIZE 12
-#else
-#define K_SCALE_SIZE 4
-#endif
-
-typedef struct {
-    uint8_t scales[QK_K/16]; // scales and mins, quantized with 4 bits
-    uint8_t qs[QK_K/4];      // quants
-    half d;           // super-block scale for quantized scales
-    half dmin;        // super-block scale for quantized mins
-} block_q2_K;
-// 84 bytes / block
-
-typedef struct {
-    uint8_t hmask[QK_K/8];     // quants - high bit
-    uint8_t qs[QK_K/4];        // quants - low 2 bits
-#if QK_K == 64
-    uint8_t scales[2];
-#else
-    uint8_t scales[K_SCALE_SIZE]; // scales, quantized with 6 bits
-#endif
-    half d;             // super-block scale
-} block_q3_K;
-
-#if QK_K == 64
-typedef struct {
-    half    d[2];          // super-block scales/mins
-    uint8_t scales[2];
-    uint8_t qs[QK_K/2];    // 4-bit quants
-} block_q4_K;
-#else
-typedef struct {
-    half d;             // super-block scale for quantized scales
-    half dmin;          // super-block scale for quantized mins
-    uint8_t scales[K_SCALE_SIZE]; // scales and mins, quantized with 6 bits
-    uint8_t qs[QK_K/2];        // 4--bit quants
-} block_q4_K;
-#endif
-
-#if QK_K == 64
-typedef struct {
-    half  d;                     // super-block scales/mins
-    int8_t  scales[QK_K/16];     // 8-bit block scales
-    uint8_t qh[QK_K/8];          // quants, high bit
-    uint8_t qs[QK_K/2];          // quants, low 4 bits
-} block_q5_K;
-#else
-typedef struct {
-    half d;                      // super-block scale for quantized scales
-    half dmin;                   // super-block scale for quantized mins
-    uint8_t scales[3*QK_K/64];   // scales and mins, quantized with 6 bits
-    uint8_t qh[QK_K/8];          // quants, high bit
-    uint8_t qs[QK_K/2];          // quants, low 4 bits
-} block_q5_K;
-// 176 bytes / block
-#endif
-
-typedef struct {
-    uint8_t ql[QK_K/2];      // quants, lower 4 bits
-    uint8_t qh[QK_K/4];      // quants, upper 2 bits
-    int8_t  scales[QK_K/16]; // scales, quantized with 8 bits
-    half d;                  // super-block scale
-} block_q6_K;
-// 210 bytes / block
-
-//====================================== dot products =========================
-
-void kernel_mul_mv_q2_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const int nb = ne00/QK_K;
-    const int r0 = tgpig.x;
-    const int r1 = tgpig.y;
-    const int im = tgpig.z;
-
-    const int first_row = (r0 * N_SIMDGROUP + sgitg) * N_DST;
-    const int ib_row = first_row * nb;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q2_K * x = (device const block_q2_K *) src0 + ib_row + offset0;
-    device const float      * y = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[32];
-    float sumf[N_DST]={0.f}, all_sum;
-
-    const int step = sizeof(block_q2_K) * nb;
-
-#if QK_K == 256
-    const int ix = tiisg/8;  // 0...3
-    const int it = tiisg%8;  // 0...7
-    const int iq = it/4;     // 0 or 1
-    const int ir = it%4;     // 0...3
-    const int is = (8*ir)/16;// 0 or 1
-
-    device const float * y4 = y + ix * QK_K + 128 * iq + 8 * ir;
-
-    for (int ib = ix; ib < nb; ib += 4) {
-
-        float4 sumy = {0.f, 0.f, 0.f, 0.f};
-        for (int i = 0; i < 8; ++i) {
-            yl[i+ 0] = y4[i+ 0]; sumy[0] += yl[i+ 0];
-            yl[i+ 8] = y4[i+32]; sumy[1] += yl[i+ 8];
-            yl[i+16] = y4[i+64]; sumy[2] += yl[i+16];
-            yl[i+24] = y4[i+96]; sumy[3] += yl[i+24];
-        }
-
-        device const uint8_t  * sc = (device const uint8_t  *)x[ib].scales + 8*iq + is;
-        device const uint16_t * qs = (device const uint16_t *)x[ib].qs + 16 * iq + 4 * ir;
-        device const half     * dh = &x[ib].d;
-
-        for (int row = 0; row < N_DST; row++) {
-
-            float4 acc1 = {0.f, 0.f, 0.f, 0.f};
-            float4 acc2 = {0.f, 0.f, 0.f, 0.f};
-            for (int i = 0; i < 8; i += 2) {
-                acc1[0] += yl[i+ 0] * (qs[i/2] & 0x0003);
-                acc2[0] += yl[i+ 1] * (qs[i/2] & 0x0300);
-                acc1[1] += yl[i+ 8] * (qs[i/2] & 0x000c);
-                acc2[1] += yl[i+ 9] * (qs[i/2] & 0x0c00);
-                acc1[2] += yl[i+16] * (qs[i/2] & 0x0030);
-                acc2[2] += yl[i+17] * (qs[i/2] & 0x3000);
-                acc1[3] += yl[i+24] * (qs[i/2] & 0x00c0);
-                acc2[3] += yl[i+25] * (qs[i/2] & 0xc000);
-            }
-            float dall = dh[0];
-            float dmin = dh[1] * 1.f/16.f;
-            sumf[row] += dall * ((acc1[0] + 1.f/256.f * acc2[0]) * (sc[0] & 0xF) * 1.f/ 1.f +
-                                 (acc1[1] + 1.f/256.f * acc2[1]) * (sc[2] & 0xF) * 1.f/ 4.f +
-                                 (acc1[2] + 1.f/256.f * acc2[2]) * (sc[4] & 0xF) * 1.f/16.f +
-                                 (acc1[3] + 1.f/256.f * acc2[3]) * (sc[6] & 0xF) * 1.f/64.f) -
-                         dmin * (sumy[0] * (sc[0] & 0xF0) + sumy[1] * (sc[2] & 0xF0) + sumy[2] * (sc[4] & 0xF0) + sumy[3] * (sc[6] & 0xF0));
-
-            qs += step/2;
-            sc += step;
-            dh += step/2;
-        }
-
-        y4 += 4 * QK_K;
-    }
-#else
-    const int ix = tiisg/2;  // 0...15
-    const int it = tiisg%2;  // 0...1
-
-    device const float * y4 = y + ix * QK_K + 8 * it;
-
-    for (int ib = ix; ib < nb; ib += 16) {
-
-        float4 sumy = {0.f, 0.f, 0.f, 0.f};
-        for (int i = 0; i < 8; ++i) {
-            yl[i+ 0] = y4[i+ 0]; sumy[0] += yl[i+ 0];
-            yl[i+ 8] = y4[i+16]; sumy[1] += yl[i+ 8];
-            yl[i+16] = y4[i+32]; sumy[2] += yl[i+16];
-            yl[i+24] = y4[i+48]; sumy[3] += yl[i+24];
-        }
-
-        device const uint8_t  * sc = (device const uint8_t  *)x[ib].scales;
-        device const uint16_t * qs = (device const uint16_t *)x[ib].qs + 4 * it;
-        device const half     * dh = &x[ib].d;
-
-        for (int row = 0; row < N_DST; row++) {
-
-            float4 acc1 = {0.f, 0.f, 0.f, 0.f};
-            float4 acc2 = {0.f, 0.f, 0.f, 0.f};
-            for (int i = 0; i < 8; i += 2) {
-                acc1[0] += yl[i+ 0] * (qs[i/2] & 0x0003);
-                acc2[0] += yl[i+ 1] * (qs[i/2] & 0x0300);
-                acc1[1] += yl[i+ 8] * (qs[i/2] & 0x000c);
-                acc2[1] += yl[i+ 9] * (qs[i/2] & 0x0c00);
-                acc1[2] += yl[i+16] * (qs[i/2] & 0x0030);
-                acc2[2] += yl[i+17] * (qs[i/2] & 0x3000);
-                acc1[3] += yl[i+24] * (qs[i/2] & 0x00c0);
-                acc2[3] += yl[i+25] * (qs[i/2] & 0xc000);
-            }
-
-            float dall = dh[0];
-            float dmin = dh[1];
-            sumf[row] += dall * ((acc1[0] + 1.f/256.f * acc2[0]) * (sc[0] & 0xF) * 1.f/ 1.f +
-                                 (acc1[1] + 1.f/256.f * acc2[1]) * (sc[1] & 0xF) * 1.f/ 4.f +
-                                 (acc1[2] + 1.f/256.f * acc2[2]) * (sc[2] & 0xF) * 1.f/16.f +
-                                 (acc1[3] + 1.f/256.f * acc2[3]) * (sc[3] & 0xF) * 1.f/64.f) -
-                         dmin * (sumy[0] * (sc[0] >> 4) + sumy[1] * (sc[1] >> 4) + sumy[2] * (sc[2] >> 4) + sumy[3] * (sc[3] >> 4));
-
-            qs += step/2;
-            sc += step;
-            dh += step/2;
-        }
-
-        y4 += 16 * QK_K;
-    }
-#endif
-
-    for (int row = 0; row < N_DST; ++row) {
-        all_sum = simd_sum(sumf[row]);
-        if (tiisg == 0) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = all_sum;
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_q2_K_f32")]]
-kernel void kernel_mul_mv_q2_K_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    kernel_mul_mv_q2_K_f32_impl(src0, src1, dst, ne00, ne01, ne02, ne10, ne12, ne0, ne1, r2, r3, tgpig, tiisg, sgitg);
-}
-
-#if QK_K == 256
-void kernel_mul_mv_q3_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const int nb = ne00/QK_K;
-
-    const int64_t r0 = tgpig.x;
-    const int64_t r1 = tgpig.y;
-    const int64_t im = tgpig.z;
-
-    const int first_row = (r0 * N_SIMDGROUP + sgitg) * 2;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q3_K * x = (device const block_q3_K *) src0 + first_row*nb + offset0;
-    device const float     * yy = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[32];
-
-    //const uint16_t kmask1 = 0x3030;
-    //const uint16_t kmask2 = 0x0f0f;
-
-    const int tid = tiisg/4;
-    const int ix  = tiisg%4;
-    const int ip  = tid/4;          // 0 or 1
-    const int il  = 2*((tid%4)/2);  // 0 or 2
-    const int ir  = tid%2;
-    const int n   = 8;
-    const int l0  = n*ir;
-
-    // One would think that the Metal compiler would figure out that ip and il can only have
-    // 4 possible states, and optimize accordingly. Well, no. It needs help, and we do it
-    // with these two tales.
-    //
-    // Possible masks for the high bit
-    const ushort4 mm[4] = {{0x0001, 0x0100, 0x0002, 0x0200},  // ip = 0, il = 0
-                           {0x0004, 0x0400, 0x0008, 0x0800},  // ip = 0, il = 2
-                           {0x0010, 0x1000, 0x0020, 0x2000},  // ip = 1, il = 0
-                           {0x0040, 0x4000, 0x0080, 0x8000}}; // ip = 1, il = 2
-
-    // Possible masks for the low 2 bits
-    const int4 qm[2] = {{0x0003, 0x0300, 0x000c, 0x0c00}, {0x0030, 0x3000, 0x00c0, 0xc000}};
-
-    const ushort4 hm = mm[2*ip + il/2];
-
-    const int shift = 2*il;
-    const float    v1 = il == 0 ? 4.f : 64.f;
-    const float    v2 = 4.f * v1;
-
-    const uint16_t s_shift1 = 4*ip;
-    const uint16_t s_shift2 = s_shift1 + il;
-
-    const int q_offset = 32*ip + l0;
-    const int y_offset = 128*ip + 32*il + l0;
-
-    const int step = sizeof(block_q3_K) * nb / 2;
-
-    device const float * y1 = yy + ix*QK_K + y_offset;
-
-    uint32_t scales32, aux32;
-    thread uint16_t * scales16 = (thread uint16_t *)&scales32;
-    thread const int8_t * scales = (thread const int8_t *)&scales32;
-
-    float sumf1[2] = {0.f};
-    float sumf2[2] = {0.f};
-    for (int i = ix; i < nb; i += 4) {
-
-        for (int l = 0; l < 8; ++l) {
-            yl[l+ 0] = y1[l+ 0];
-            yl[l+ 8] = y1[l+16];
-            yl[l+16] = y1[l+32];
-            yl[l+24] = y1[l+48];
-        }
-
-        device const uint16_t * q = (device const uint16_t *)(x[i].qs + q_offset);
-        device const uint16_t * h = (device const uint16_t *)(x[i].hmask + l0);
-        device const uint16_t * a = (device const uint16_t *)(x[i].scales);
-        device const half * dh = &x[i].d;
-
-        for (int row = 0; row < 2; ++row) {
-
-            const float d_all = (float)dh[0];
-
-            scales16[0] = a[4];
-            scales16[1] = a[5];
-            aux32 = ((scales32 >> s_shift2) << 4) & 0x30303030;
-            scales16[0] = a[il+0];
-            scales16[1] = a[il+1];
-            scales32 = ((scales32 >> s_shift1) & 0x0f0f0f0f) | aux32;
-
-            float s1 = 0, s2 = 0, s3 = 0, s4 = 0, s5 = 0, s6 = 0;
-            for (int l = 0; l < n; l += 2) {
-                const int32_t qs = q[l/2];
-                s1 += yl[l+0] * (qs & qm[il/2][0]);
-                s2 += yl[l+1] * (qs & qm[il/2][1]);
-                s3 += ((h[l/2] & hm[0]) ? 0.f : yl[l+0]) + ((h[l/2] & hm[1]) ? 0.f : yl[l+1]);
-                s4 += yl[l+16] * (qs & qm[il/2][2]);
-                s5 += yl[l+17] * (qs & qm[il/2][3]);
-                s6 += ((h[l/2] & hm[2]) ? 0.f : yl[l+16]) + ((h[l/2] & hm[3]) ? 0.f : yl[l+17]);
-            }
-            float d1 = d_all * (s1 + 1.f/256.f * s2 - s3*v1);
-            float d2 = d_all * (s4 + 1.f/256.f * s5 - s6*v2);
-            sumf1[row] += d1 * (scales[0] - 32);
-            sumf2[row] += d2 * (scales[2] - 32);
-
-            s1 = s2 = s3 = s4 = s5 = s6 = 0;
-            for (int l = 0; l < n; l += 2) {
-                const int32_t qs = q[l/2+8];
-                s1 += yl[l+8] * (qs & qm[il/2][0]);
-                s2 += yl[l+9] * (qs & qm[il/2][1]);
-                s3 += ((h[l/2+8] & hm[0]) ? 0.f : yl[l+8]) + ((h[l/2+8] & hm[1]) ? 0.f : yl[l+9]);
-                s4 += yl[l+24] * (qs & qm[il/2][2]);
-                s5 += yl[l+25] * (qs & qm[il/2][3]);
-                s6 += ((h[l/2+8] & hm[2]) ? 0.f : yl[l+24]) + ((h[l/2+8] & hm[3]) ? 0.f : yl[l+25]);
-            }
-            d1 = d_all * (s1 + 1.f/256.f * s2 - s3*v1);
-            d2 = d_all * (s4 + 1.f/256.f * s5 - s6*v2);
-            sumf1[row] += d1 * (scales[1] - 32);
-            sumf2[row] += d2 * (scales[3] - 32);
-
-            q  += step;
-            h  += step;
-            a  += step;
-            dh += step;
-
-        }
-
-        y1 += 4 * QK_K;
-
-    }
-
-    for (int row = 0; row < 2; ++row) {
-        const float sumf = (sumf1[row] + 0.25f * sumf2[row]) / (1 << shift);
-        sumf1[row] = simd_sum(sumf);
-    }
-    if (tiisg == 0) {
-        for (int row = 0; row < 2; ++row) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = sumf1[row];
-        }
-    }
-}
-#else
-void kernel_mul_mv_q3_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const int nb = ne00/QK_K;
-
-    const int64_t r0 = tgpig.x;
-    const int64_t r1 = tgpig.y;
-    const int64_t im = tgpig.z;
-
-    const int row = 2 * r0 + sgitg;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q3_K * x = (device const block_q3_K *) src0 + row*nb + offset0;
-    device const float     * yy = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    const int ix = tiisg/4;
-    const int il = 4 * (tiisg%4);// 0, 4, 8, 12
-    const int iq = il/8;         // 0, 0, 1, 1
-    const int in = il%8;         // 0, 4, 0, 4
-
-    float2 sum = {0.f, 0.f};
-
-    for (int i = ix; i < nb; i += 8) {
-
-        const float d_all = (float)(x[i].d);
-
-        device const uint16_t * q = (device const uint16_t *)(x[i].qs + il);
-        device const uint16_t * h = (device const uint16_t *)(x[i].hmask + in);
-        device const uint16_t * s = (device const uint16_t *)(x[i].scales);
-        device const float    * y = yy + i * QK_K + il;
-
-        const float d1 = d_all * ((int32_t)(s[0] & 0x000F) - 8);
-        const float d2 = d_all * ((int32_t)(s[0] & 0x00F0) - 128) * 1.f/64.f;
-        const float d3 = d_all * ((int32_t)(s[0] & 0x0F00) - 2048) * 1.f/4096.f;
-        const float d4 = d_all * ((int32_t)(s[0] & 0xF000) - 32768) * 1.f/262144.f;
-
-        for (int l = 0; l < 4; l += 2) {
-            const uint16_t hm = h[l/2] >> iq;
-            sum[0] += y[l+ 0] * d1 * ((int32_t)(q[l/2] & 0x0003) - ((hm & 0x0001) ? 0 :  4))
-                    + y[l+16] * d2 * ((int32_t)(q[l/2] & 0x000c) - ((hm & 0x0004) ? 0 : 16))
-                    + y[l+32] * d3 * ((int32_t)(q[l/2] & 0x0030) - ((hm & 0x0010) ? 0 : 64))
-                    + y[l+48] * d4 * ((int32_t)(q[l/2] & 0x00c0) - ((hm & 0x0040) ? 0 : 256));
-            sum[1] += y[l+ 1] * d1 * ((int32_t)(q[l/2] & 0x0300) - ((hm & 0x0100) ? 0 : 1024))
-                    + y[l+17] * d2 * ((int32_t)(q[l/2] & 0x0c00) - ((hm & 0x0400) ? 0 : 4096))
-                    + y[l+33] * d3 * ((int32_t)(q[l/2] & 0x3000) - ((hm & 0x1000) ? 0 : 16384))
-                    + y[l+49] * d4 * ((int32_t)(q[l/2] & 0xc000) - ((hm & 0x4000) ? 0 : 65536));
-        }
-
-    }
-    const float sumf = sum[0] + sum[1] * 1.f/256.f;
-
-    const float tot = simd_sum(sumf);
-    if (tiisg == 0) {
-        dst[r1*ne0 + im*ne0*ne1 + row] = tot;
-    }
-
-}
-#endif
-
-[[host_name("kernel_mul_mv_q3_K_f32")]]
-kernel void kernel_mul_mv_q3_K_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    kernel_mul_mv_q3_K_f32_impl(src0, src1, dst, ne00, ne01, ne02, ne10, ne12, ne0, ne1, r2, r3, tgpig, tiisg, sgitg);
-}
-
-#if QK_K == 256
-void kernel_mul_mv_q4_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const uint16_t kmask1 = 0x3f3f;
-    const uint16_t kmask2 = 0x0f0f;
-    const uint16_t kmask3 = 0xc0c0;
-
-    const int ix = tiisg/8;  // 0...3
-    const int it = tiisg%8;  // 0...7
-    const int iq = it/4;     // 0 or 1
-    const int ir = it%4;     // 0...3
-
-    const int nb = ne00/QK_K;
-    const int r0 = tgpig.x;
-    const int r1 = tgpig.y;
-    const int im = tgpig.z;
-    //const int first_row = (r0 * N_SIMDGROUP + sgitg) * N_DST;
-    const int first_row = r0 * N_DST;
-    const int ib_row = first_row * nb;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q4_K * x = (device const block_q4_K *) src0 + ib_row + offset0;
-    device const float      * y = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[16];
-    float yh[16];
-    float sumf[N_DST]={0.f}, all_sum;
-
-    const int step = sizeof(block_q4_K) * nb / 2;
-
-    device const float * y4 = y + ix * QK_K + 64 * iq + 8 * ir;
-
-    uint16_t sc16[4];
-    thread const uint8_t * sc8 = (thread const uint8_t *)sc16;
-
-    for (int ib = ix; ib < nb; ib += 4) {
-
-        float4 sumy = {0.f, 0.f, 0.f, 0.f};
-        for (int i = 0; i < 8; ++i) {
-            yl[i+0] = y4[i+  0]; sumy[0] += yl[i+0];
-            yl[i+8] = y4[i+ 32]; sumy[1] += yl[i+8];
-            yh[i+0] = y4[i+128]; sumy[2] += yh[i+0];
-            yh[i+8] = y4[i+160]; sumy[3] += yh[i+8];
-        }
-
-        device const uint16_t * sc = (device const uint16_t *)x[ib].scales + iq;
-        device const uint16_t * q1 = (device const uint16_t *)x[ib].qs + 16 * iq + 4 * ir;
-        device const half     * dh = &x[ib].d;
-
-        for (int row = 0; row < N_DST; row++) {
-
-            sc16[0] = sc[0] & kmask1;
-            sc16[1] = sc[2] & kmask1;
-            sc16[2] = ((sc[4] >> 0) & kmask2) | ((sc[0] & kmask3) >> 2);
-            sc16[3] = ((sc[4] >> 4) & kmask2) | ((sc[2] & kmask3) >> 2);
-
-            device const uint16_t * q2 = q1 + 32;
-
-            float4 acc1 = {0.f, 0.f, 0.f, 0.f};
-            float4 acc2 = {0.f, 0.f, 0.f, 0.f};
-            for (int i = 0; i < 8; i += 2) {
-                acc1[0] += yl[i+0] * (q1[i/2] & 0x000F);
-                acc1[1] += yl[i+1] * (q1[i/2] & 0x0F00);
-                acc1[2] += yl[i+8] * (q1[i/2] & 0x00F0);
-                acc1[3] += yl[i+9] * (q1[i/2] & 0xF000);
-                acc2[0] += yh[i+0] * (q2[i/2] & 0x000F);
-                acc2[1] += yh[i+1] * (q2[i/2] & 0x0F00);
-                acc2[2] += yh[i+8] * (q2[i/2] & 0x00F0);
-                acc2[3] += yh[i+9] * (q2[i/2] & 0xF000);
-            }
-
-            float dall = dh[0];
-            float dmin = dh[1];
-            sumf[row] += dall * ((acc1[0] + 1.f/256.f * acc1[1]) * sc8[0] +
-                                 (acc1[2] + 1.f/256.f * acc1[3]) * sc8[1] * 1.f/16.f +
-                                 (acc2[0] + 1.f/256.f * acc2[1]) * sc8[4] +
-                                 (acc2[2] + 1.f/256.f * acc2[3]) * sc8[5] * 1.f/16.f) -
-                         dmin * (sumy[0] * sc8[2] + sumy[1] * sc8[3] + sumy[2] * sc8[6] + sumy[3] * sc8[7]);
-
-            q1 += step;
-            sc += step;
-            dh += step;
-        }
-
-        y4 += 4 * QK_K;
-    }
-
-    for (int row = 0; row < N_DST; ++row) {
-        all_sum = simd_sum(sumf[row]);
-        if (tiisg == 0) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = all_sum;
-        }
-    }
-}
-#else
-void kernel_mul_mv_q4_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const int ix = tiisg/4;  // 0...7
-    const int it = tiisg%4;  // 0...3
-
-    const int nb = ne00/QK_K;
-    const int r0 = tgpig.x;
-    const int r1 = tgpig.y;
-    const int im = tgpig.z;
-    const int first_row = r0 * N_DST;
-    const int ib_row = first_row * nb;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q4_K * x = (device const block_q4_K *) src0 + ib_row + offset0;
-    device const float      * y = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float yl[8];
-    float yh[8];
-    float sumf[N_DST]={0.f}, all_sum;
-
-    const int step = sizeof(block_q4_K) * nb / 2;
-
-    device const float * y4 = y + ix * QK_K + 8 * it;
-
-    uint16_t sc16[4];
-
-    for (int ib = ix; ib < nb; ib += 8) {
-
-        float2 sumy = {0.f, 0.f};
-        for (int i = 0; i < 8; ++i) {
-            yl[i] = y4[i+ 0]; sumy[0] += yl[i];
-            yh[i] = y4[i+32]; sumy[1] += yh[i];
-        }
-
-        device const uint16_t * sc = (device const uint16_t *)x[ib].scales;
-        device const uint16_t * qs = (device const uint16_t *)x[ib].qs + 4 * it;
-        device const half     * dh = x[ib].d;
-
-        for (int row = 0; row < N_DST; row++) {
-
-            sc16[0] = sc[0] & 0x000f;
-            sc16[1] = sc[0] & 0x0f00;
-            sc16[2] = sc[0] & 0x00f0;
-            sc16[3] = sc[0] & 0xf000;
-
-            float2 acc1 = {0.f, 0.f};
-            float2 acc2 = {0.f, 0.f};
-            for (int i = 0; i < 8; i += 2) {
-                acc1[0] += yl[i+0] * (qs[i/2] & 0x000F);
-                acc1[1] += yl[i+1] * (qs[i/2] & 0x0F00);
-                acc2[0] += yh[i+0] * (qs[i/2] & 0x00F0);
-                acc2[1] += yh[i+1] * (qs[i/2] & 0xF000);
-            }
-
-            float dall = dh[0];
-            float dmin = dh[1];
-            sumf[row] += dall * ((acc1[0] + 1.f/256.f * acc1[1]) * sc16[0] +
-                                 (acc2[0] + 1.f/256.f * acc2[1]) * sc16[1] * 1.f/4096.f) -
-                         dmin * 1.f/16.f * (sumy[0] * sc16[2] + sumy[1] * sc16[3] * 1.f/256.f);
-
-            qs += step;
-            sc += step;
-            dh += step;
-        }
-
-        y4 += 8 * QK_K;
-    }
-
-    for (int row = 0; row < N_DST; ++row) {
-        all_sum = simd_sum(sumf[row]);
-        if (tiisg == 0) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = all_sum;
-        }
-    }
-}
-#endif
-
-[[host_name("kernel_mul_mv_q4_K_f32")]]
-kernel void kernel_mul_mv_q4_K_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint tiisg[[thread_index_in_simdgroup]],
-        uint sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    kernel_mul_mv_q4_K_f32_impl(src0, src1, dst, ne00, ne01, ne02, ne10, ne12, ne0, ne1, r2, r3, tgpig, tiisg, sgitg);
-}
-
-void kernel_mul_mv_q5_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const int nb = ne00/QK_K;
-
-    const int64_t r0 = tgpig.x;
-    const int64_t r1 = tgpig.y;
-    const int im = tgpig.z;
-
-    const int first_row = (r0 * N_SIMDGROUP + sgitg) * 2;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q5_K * x = (device const block_q5_K *) src0 + first_row*nb + offset0;
-    device const float     * yy = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float sumf[2]={0.f};
-
-    const int step = sizeof(block_q5_K) * nb;
-
-#if QK_K == 256
-#
-    float yl[16], yh[16];
-
-    const uint16_t kmask1 = 0x3f3f;
-    const uint16_t kmask2 = 0x0f0f;
-    const uint16_t kmask3 = 0xc0c0;
-
-    const int tid = tiisg/4;
-    const int ix  = tiisg%4;
-    const int iq  = tid/4;
-    const int ir  = tid%4;
-    const int n   = 8;
-
-    const int l0 = n*ir;
-    const int q_offset = 32*iq + l0;
-    const int y_offset = 64*iq + l0;
-
-    const uint8_t hm1 = 1u << (2*iq);
-    const uint8_t hm2 = hm1 << 1;
-    const uint8_t hm3 = hm1 << 4;
-    const uint8_t hm4 = hm2 << 4;
-
-    uint16_t sc16[4];
-    thread const uint8_t * sc8 = (thread const uint8_t *)sc16;
-
-    device const float * y1 = yy + ix*QK_K + y_offset;
-
-    for (int i = ix; i < nb; i += 4) {
-
-        device const uint8_t * q1 = x[i].qs + q_offset;
-        device const uint8_t * qh = x[i].qh + l0;
-        device const half * dh = &x[i].d;
-        device const uint16_t * a = (device const uint16_t *)x[i].scales + iq;
-
-        device const float * y2 = y1 + 128;
-        float4 sumy = {0.f, 0.f, 0.f, 0.f};
-        for (int l = 0; l < 8; ++l) {
-            yl[l+0] = y1[l+ 0]; sumy[0] += yl[l+0];
-            yl[l+8] = y1[l+32]; sumy[1] += yl[l+8];
-            yh[l+0] = y2[l+ 0]; sumy[2] += yh[l+0];
-            yh[l+8] = y2[l+32]; sumy[3] += yh[l+8];
-        }
-
-        for (int row = 0; row < 2; ++row) {
-
-            device const uint8_t * q2 = q1 + 64;
-
-            sc16[0] = a[0] & kmask1;
-            sc16[1] = a[2] & kmask1;
-            sc16[2] = ((a[4] >> 0) & kmask2) | ((a[0] & kmask3) >> 2);
-            sc16[3] = ((a[4] >> 4) & kmask2) | ((a[2] & kmask3) >> 2);
-
-            float4 acc1 = {0.f};
-            float4 acc2 = {0.f};
-            for (int l = 0; l < n; ++l) {
-                uint8_t h = qh[l];
-                acc1[0] += yl[l+0] * (q1[l] & 0x0F);
-                acc1[1] += yl[l+8] * (q1[l] & 0xF0);
-                acc1[2] += yh[l+0] * (q2[l] & 0x0F);
-                acc1[3] += yh[l+8] * (q2[l] & 0xF0);
-                acc2[0] += h & hm1 ? yl[l+0] : 0.f;
-                acc2[1] += h & hm2 ? yl[l+8] : 0.f;
-                acc2[2] += h & hm3 ? yh[l+0] : 0.f;
-                acc2[3] += h & hm4 ? yh[l+8] : 0.f;
-            }
-            const float dall = dh[0];
-            const float dmin = dh[1];
-            sumf[row] += dall * (sc8[0] * (acc1[0] +  16.f*acc2[0]) +
-                                 sc8[1] * (acc1[1]/16.f + 16.f*acc2[1]) +
-                                 sc8[4] * (acc1[2] +  16.f*acc2[2]) +
-                                 sc8[5] * (acc1[3]/16.f + 16.f*acc2[3])) -
-                         dmin * (sumy[0] * sc8[2] + sumy[1] * sc8[3] + sumy[2] * sc8[6] + sumy[3] * sc8[7]);
-
-            q1 += step;
-            qh += step;
-            dh += step/2;
-            a  += step/2;
-
-        }
-
-        y1 += 4 * QK_K;
-
-    }
-#else
-    float yl[8], yh[8];
-
-    const int il = 4 * (tiisg/8);  // 0, 4, 8, 12
-    const int ix = tiisg%8;
-    const int iq = il/8;         // 0, 0, 1, 1
-    const int in = il%8;         // 0, 4, 0, 4
-
-    device const float * y = yy + ix*QK_K + il;
-
-    for (int i = ix; i < nb; i += 8) {
-
-        for (int l = 0; l < 4; ++l) {
-            yl[l+0] = y[l+ 0];
-            yl[l+4] = y[l+16];
-            yh[l+0] = y[l+32];
-            yh[l+4] = y[l+48];
-        }
-
-        device const half * dh = &x[i].d;
-        device const uint8_t * q = x[i].qs + il;
-        device const uint8_t * h = x[i].qh + in;
-        device const int8_t  * s = x[i].scales;
-
-        for (int row = 0; row < 2; ++row) {
-
-            const float d = dh[0];
-
-            float2 acc = {0.f, 0.f};
-            for (int l = 0; l < 4; ++l) {
-                const uint8_t hl = h[l] >> iq;
-                acc[0] += yl[l+0] * s[0] * ((int16_t)(q[l+ 0] & 0x0F) - (hl & 0x01 ? 0 : 16))
-                        + yl[l+4] * s[1] * ((int16_t)(q[l+16] & 0x0F) - (hl & 0x04 ? 0 : 16));
-                acc[1] += yh[l+0] * s[2] * ((int16_t)(q[l+ 0] & 0xF0) - (hl & 0x10 ? 0 : 256))
-                        + yh[l+4] * s[3] * ((int16_t)(q[l+16] & 0xF0) - (hl & 0x40 ? 0 : 256));
-            }
-            sumf[row] += d * (acc[0] + 1.f/16.f * acc[1]);
-
-            q += step;
-            h += step;
-            s += step;
-            dh += step/2;
-
-        }
-
-        y += 8 * QK_K;
-    }
-#endif
-
-    for (int row = 0; row < 2; ++row) {
-        const float tot = simd_sum(sumf[row]);
-        if (tiisg == 0) {
-            dst[r1*ne0 + im*ne0*ne1 + first_row + row] = tot;
-        }
-    }
-}
-
-[[host_name("kernel_mul_mv_q5_K_f32")]]
-kernel void kernel_mul_mv_q5_K_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    kernel_mul_mv_q5_K_f32_impl(src0, src1, dst, ne00, ne01, ne02, ne10, ne12, ne0, ne1, r2, r3, tgpig, tiisg, sgitg);
-}
-
-void kernel_mul_mv_q6_K_f32_impl(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    const uint8_t kmask1 = 0x03;
-    const uint8_t kmask2 = 0x0C;
-    const uint8_t kmask3 = 0x30;
-    const uint8_t kmask4 = 0xC0;
-
-    const int nb = ne00/QK_K;
-
-    const int64_t r0 = tgpig.x;
-    const int64_t r1 = tgpig.y;
-    const int     im = tgpig.z;
-
-    const int row = 2 * r0 + sgitg;
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    const uint offset0 = (i12/r2)*(nb*ne01) + (i13/r3)*(nb*ne01*ne02);
-
-    device const block_q6_K * x = (device const block_q6_K *) src0 + row * nb + offset0;
-    device const float     * yy = (device const float      *) src1 + r1*ne10 + im*ne00*ne1;
-
-    float sumf = 0;
-
-#if QK_K == 256
-    const int tid  = tiisg/2;
-    const int ix   = tiisg%2;
-    const int ip   = tid/8;         // 0 or 1
-    const int il   = tid%8;
-    const int n    = 4;
-    const int l0   = n*il;
-    const int is   = 8*ip + l0/16;
-
-    const int y_offset = 128*ip + l0;
-    const int q_offset_l = 64*ip + l0;
-    const int q_offset_h = 32*ip + l0;
-
-    for (int i = ix; i < nb; i += 2) {
-
-        device const uint8_t * q1 = x[i].ql + q_offset_l;
-        device const uint8_t * q2 = q1 + 32;
-        device const uint8_t * qh = x[i].qh + q_offset_h;
-        device const int8_t  * sc = x[i].scales + is;
-
-        device const float * y = yy + i * QK_K + y_offset;
-
-        const float dall = x[i].d;
-
-        float4 sums = {0.f, 0.f, 0.f, 0.f};
-        for (int l = 0; l < n; ++l) {
-            sums[0] += y[l+ 0] * ((int8_t)((q1[l] & 0xF) | ((qh[l] & kmask1) << 4)) - 32);
-            sums[1] += y[l+32] * ((int8_t)((q2[l] & 0xF) | ((qh[l] & kmask2) << 2)) - 32);
-            sums[2] += y[l+64] * ((int8_t)((q1[l]  >> 4) | ((qh[l] & kmask3) << 0)) - 32);
-            sums[3] += y[l+96] * ((int8_t)((q2[l]  >> 4) | ((qh[l] & kmask4) >> 2)) - 32);
-        }
-
-        sumf += dall * (sums[0] * sc[0] + sums[1] * sc[2] + sums[2] * sc[4] + sums[3] * sc[6]);
-
-    }
-
-#else
-    const int ix  = tiisg/4;
-    const int il  = 4*(tiisg%4);
-
-    for (int i = ix; i < nb; i += 8) {
-        device const float * y = yy + i * QK_K + il;
-        device const uint8_t * ql = x[i].ql + il;
-        device const uint8_t * qh = x[i].qh + il;
-        device const int8_t  * s  = x[i].scales;
-
-        const float d = x[i].d;
-
-        float4 sums = {0.f, 0.f, 0.f, 0.f};
-        for (int l = 0; l < 4; ++l) {
-            sums[0] += y[l+ 0] * ((int8_t)((ql[l+ 0] & 0xF) | ((qh[l] & kmask1) << 4)) - 32);
-            sums[1] += y[l+16] * ((int8_t)((ql[l+16] & 0xF) | ((qh[l] & kmask2) << 2)) - 32);
-            sums[2] += y[l+32] * ((int8_t)((ql[l+ 0] >>  4) | ((qh[l] & kmask3) >> 0)) - 32);
-            sums[3] += y[l+48] * ((int8_t)((ql[l+16] >>  4) | ((qh[l] & kmask4) >> 2)) - 32);
-        }
-        sumf += d * (sums[0] * s[0] + sums[1] * s[1] + sums[2] * s[2] + sums[3] * s[3]);
-    }
-
-#endif
-
-    const float tot = simd_sum(sumf);
-    if (tiisg == 0) {
-        dst[r1*ne0 + im*ne0*ne1 + row] = tot;
-    }
-}
-
-[[host_name("kernel_mul_mv_q6_K_f32")]]
-kernel void kernel_mul_mv_q6_K_f32(
-        device const  void * src0,
-        device const float * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant   int64_t & ne01,
-        constant   int64_t & ne02,
-        constant  uint64_t & nb00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant   int64_t & ne11,
-        constant   int64_t & ne12,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb12,
-        constant   int64_t & ne0,
-        constant   int64_t & ne1,
-        constant   uint    & r2,
-        constant   uint    & r3,
-        uint3 tgpig[[threadgroup_position_in_grid]],
-        uint  tiisg[[thread_index_in_simdgroup]],
-        uint  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    kernel_mul_mv_q6_K_f32_impl(src0, src1, dst, ne00, ne01, ne02, ne10, ne12, ne0, ne1, r2, r3, tgpig, tiisg, sgitg);
-}
-
-//============================= templates and their specializations =============================
-
-// NOTE: this is not dequantizing - we are simply fitting the template
-template <typename type4x4>
-void dequantize_f32(device const float4x4 * src, short il, thread type4x4 & reg) {
-    float4x4 temp = *(((device float4x4 *)src));
-    for (int i = 0; i < 16; i++){
-        reg[i/4][i%4] = temp[i/4][i%4];
-    }
-}
-
-template <typename type4x4>
-void dequantize_f16(device const half4x4 * src, short il, thread type4x4 & reg) {
-    half4x4 temp = *(((device half4x4 *)src));
-    for (int i = 0; i < 16; i++){
-        reg[i/4][i%4] = temp[i/4][i%4];
-    }
-}
-
-template <typename type4x4>
-void dequantize_q4_0(device const block_q4_0 *xb, short il, thread type4x4 & reg) {
-    device const uint16_t * qs = ((device const uint16_t *)xb + 1);
-    const float d1 = il ? (xb->d / 16.h) : xb->d;
-    const float d2 = d1 / 256.f;
-    const float md = -8.h * xb->d;
-    const ushort mask0 = il ? 0x00F0 : 0x000F;
-    const ushort mask1 = mask0 << 8;
-
-    for (int i=0;i<8;i++) {
-        reg[i/2][2*(i%2)+0] = d1 * (qs[i] & mask0) + md;
-        reg[i/2][2*(i%2)+1] = d2 * (qs[i] & mask1) + md;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q4_1(device const block_q4_1 *xb, short il, thread type4x4 & reg) {
-    device const uint16_t * qs = ((device const uint16_t *)xb + 2);
-    const float d1 = il ? (xb->d / 16.h) : xb->d;
-    const float d2 = d1 / 256.f;
-    const float  m = xb->m;
-    const ushort mask0 = il ? 0x00F0 : 0x000F;
-    const ushort mask1 = mask0 << 8;
-
-    for (int i=0;i<8;i++) {
-        reg[i/2][2*(i%2)+0] = ((qs[i] & mask0) * d1) + m;
-        reg[i/2][2*(i%2)+1] = ((qs[i] & mask1) * d2) + m;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q5_0(device const block_q5_0 *xb, short il, thread type4x4 & reg) {
-    device const uint16_t * qs = ((device const uint16_t *)xb + 3);
-    const float d = xb->d;
-    const float md = -16.h * xb->d;
-    const ushort mask = il ? 0x00F0 : 0x000F;
-
-    const uint32_t qh = *((device const uint32_t *)xb->qh);
-
-    const int x_mv = il ? 4 : 0;
-
-    const int gh_mv = il ? 12 : 0;
-    const int gh_bk = il ?  0 : 4;
-
-    for (int i = 0; i < 8; i++) {
-        // extract the 5-th bits for x0 and x1
-        const uint8_t xh_0 = ((qh >> (gh_mv + 2*i  )) << gh_bk) & 0x10;
-        const uint8_t xh_1 = ((qh >> (gh_mv + 2*i+1)) << gh_bk) & 0x10;
-
-        // combine the 4-bits from qs with the 5th bit
-        const int32_t x0 = ((((qs[i]     ) & mask) >> x_mv) | xh_0);
-        const int32_t x1 = ((((qs[i] >> 8) & mask) >> x_mv) | xh_1);
-
-        reg[i/2][2*(i%2)+0] = d * x0 + md;
-        reg[i/2][2*(i%2)+1] = d * x1 + md;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q5_1(device const block_q5_1 *xb, short il, thread type4x4 & reg) {
-    device const uint16_t * qs = ((device const uint16_t *)xb + 4);
-    const float d = xb->d;
-    const float m = xb->m;
-    const ushort mask = il ? 0x00F0 : 0x000F;
-
-    const uint32_t qh = *((device const uint32_t *)xb->qh);
-
-    const int x_mv = il ? 4 : 0;
-
-    const int gh_mv = il ? 12 : 0;
-    const int gh_bk = il ?  0 : 4;
-
-    for (int i = 0; i < 8; i++) {
-        // extract the 5-th bits for x0 and x1
-        const uint8_t xh_0 = ((qh >> (gh_mv + 2*i  )) << gh_bk) & 0x10;
-        const uint8_t xh_1 = ((qh >> (gh_mv + 2*i+1)) << gh_bk) & 0x10;
-
-        // combine the 4-bits from qs with the 5th bit
-        const int32_t x0 = ((((qs[i]     ) & mask) >> x_mv) | xh_0);
-        const int32_t x1 = ((((qs[i] >> 8) & mask) >> x_mv) | xh_1);
-
-        reg[i/2][2*(i%2)+0] = d * x0 + m;
-        reg[i/2][2*(i%2)+1] = d * x1 + m;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q8_0(device const block_q8_0 *xb, short il, thread type4x4 & reg) {
-    device const int8_t * qs = ((device const int8_t *)xb->qs);
-    const half d = xb->d;
-
-    for (int i = 0; i < 16; i++) {
-        reg[i/4][i%4] = (qs[i + 16*il] * d);
-    }
-}
-
-template <typename type4x4>
-void dequantize_q2_K(device const block_q2_K *xb, short il, thread type4x4 & reg) {
-    const float d = xb->d;
-    const float min = xb->dmin;
-    device const uint8_t * q = (device const uint8_t *)xb->qs;
-    float dl, ml;
-    uint8_t sc = xb->scales[il];
-
-#if QK_K == 256
-    q = q + 32*(il/8) + 16*(il&1);
-    il = (il/2)%4;
-#endif
-    half  coef = il>1 ? (il>2 ? 1/64.h : 1/16.h) : (il>0 ? 1/4.h : 1.h);
-    uchar mask = il>1 ? (il>2 ? 192    : 48)     : (il>0 ? 12    : 3);
-    dl = d * (sc & 0xF) * coef, ml = min * (sc >> 4);
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = dl * (q[i] & mask) - ml;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q3_K(device const block_q3_K *xb, short il, thread type4x4 & reg) {
-    const half d_all = xb->d;
-    device const uint8_t * q = (device const uint8_t *)xb->qs;
-    device const uint8_t * h = (device const uint8_t *)xb->hmask;
-    device const int8_t * scales = (device const int8_t *)xb->scales;
-
-#if QK_K == 256
-    q = q + 32 * (il/8) + 16 * (il&1);
-    h = h + 16 * (il&1);
-    uint8_t m = 1 << (il/2);
-    uint16_t kmask1 = (il/4)>1 ? ((il/4)>2 ? 192 : 48) : \
-                                 ((il/4)>0 ? 12  : 3);
-    uint16_t kmask2 = il/8 ? 0xF0 : 0x0F;
-    uint16_t scale_2 = scales[il%8], scale_1 = scales[8 + il%4];
-    int16_t  dl_int = (il/4)&1 ? (scale_2&kmask2) | ((scale_1&kmask1) << 2)
-                               : (scale_2&kmask2) | ((scale_1&kmask1) << 4);
-    half dl = il<8 ? d_all * (dl_int - 32.h) : d_all * (dl_int / 16.h - 32.h);
-    const half ml = 4.h * dl;
-
-    il = (il/2) & 3;
-    const half    coef = il>1 ? (il>2 ? 1/64.h : 1/16.h) : (il>0 ? 1/4.h : 1.h);
-    const uint8_t mask = il>1 ? (il>2 ? 192    : 48)     : (il>0 ? 12    : 3);
-    dl *= coef;
-
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = dl * (q[i] & mask) - (h[i] & m ? 0 : ml);
-    }
-#else
-    float    kcoef = il&1 ? 1.f/16.f : 1.f;
-    uint16_t kmask = il&1 ? 0xF0     : 0x0F;
-    float    dl = d_all * ((scales[il/2] & kmask) * kcoef - 8);
-    float    coef = il>1 ? (il>2 ? 1/64.h : 1/16.h) : (il>0 ? 1/4.h : 1.h);
-    uint8_t  mask = il>1 ? (il>2 ? 192    : 48)     : (il>0 ? 12    : 3);
-    uint8_t  m = 1<<(il*2);
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = coef * dl * ((q[i] & mask) - ((h[i%8] & (m * (1 + i/8))) ? 0 : 4.f/coef));
-    }
-#endif
-}
-
-static inline uchar2 get_scale_min_k4_just2(int j, int k, device const uchar * q) {
-    return j < 4 ? uchar2{uchar(q[j+0+k] & 63), uchar(q[j+4+k] & 63)}
-                 : uchar2{uchar((q[j+4+k] & 0xF) | ((q[j-4+k] & 0xc0) >> 2)), uchar((q[j+4+k] >> 4) | ((q[j-0+k] & 0xc0) >> 2))};
-}
-
-template <typename type4x4>
-void dequantize_q4_K(device const block_q4_K *xb, short il, thread type4x4 & reg) {
-    device const uchar * q = xb->qs;
-
-#if QK_K == 256
-    short is = (il/4) * 2;
-    q = q + (il/4) * 32 + 16 * (il&1);
-    il = il & 3;
-    const uchar2 sc = get_scale_min_k4_just2(is, il/2, xb->scales);
-    const float d   = il < 2 ? xb->d : xb->d / 16.h;
-    const float min = xb->dmin;
-    const float dl = d * sc[0];
-    const float ml = min * sc[1];
-#else
-    q = q + 16 * (il&1);
-    device const uint8_t * s = xb->scales;
-    device const half2 * dh = (device const half2 *)xb->d;
-    const float2 d = (float2)dh[0];
-    const float dl = il<2 ? d[0] * (s[0]&0xF) : d[0] * (s[1]&0xF)/16.h;
-    const float ml = il<2 ? d[1] * (s[0]>>4)  : d[1] * (s[1]>>4);
-#endif
-    const ushort mask = il<2 ? 0x0F : 0xF0;
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = dl * (q[i] & mask) - ml;
-    }
-}
-
-template <typename type4x4>
-void dequantize_q5_K(device const block_q5_K *xb, short il, thread type4x4 & reg) {
-    device const uint8_t * q  = xb->qs;
-    device const uint8_t * qh = xb->qh;
-
-#if QK_K == 256
-    short is = (il/4) * 2;
-    q  = q + 32 * (il/4) + 16 * (il&1);
-    qh = qh + 16 * (il&1);
-    uint8_t ul = 1 << (il/2);
-    il = il & 3;
-    const uchar2 sc = get_scale_min_k4_just2(is, il/2, xb->scales);
-    const float d = il < 2 ? xb->d : xb->d / 16.h;
-    const float min = xb->dmin;
-    const float dl = d * sc[0];
-    const float ml = min * sc[1];
-
-    const ushort mask  = il<2 ? 0x0F : 0xF0;
-    const float qh_val = il<2 ? 16.f : 256.f;
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = dl * ((q[i] & mask) + (qh[i] & ul ? qh_val : 0)) - ml;
-    }
-#else
-    q = q + 16 * (il&1);
-    device const int8_t * s = xb->scales;
-    const float dl = xb->d * s[il];
-    uint8_t m = 1<<(il*2);
-    const float  coef = il<2 ? 1.f  : 1.f/16.f;
-    const ushort mask = il<2 ? 0x0F : 0xF0;
-    for (int i = 0; i < 16; ++i) {
-        reg[i/4][i%4] = coef * dl * ((q[i] & mask) - (qh[i%8] & (m*(1+i/8)) ? 0.f : 16.f/coef));
-    }
-#endif
-}
-
-template <typename type4x4>
-void dequantize_q6_K(device const block_q6_K *xb, short il, thread type4x4 & reg) {
-    const half d_all = xb->d;
-    device const uint8_t * ql = (device const uint8_t *)xb->ql;
-    device const uint8_t * qh = (device const uint8_t *)xb->qh;
-    device const int8_t * scales = (device const int8_t *)xb->scales;
-
-#if QK_K == 256
-    ql = ql + 64*(il/8) + 32*((il/2)&1) + 16*(il&1);
-    qh = qh + 32*(il/8) + 16*(il&1);
-    half sc = scales[(il%2) + 2 * ((il/2))];
-    il = (il/2) & 3;
-#else
-    ql = ql + 16 * (il&1);
-    half sc = scales[il];
-#endif
-    const uint16_t  kmask1 = il>1 ? (il>2 ? 192 : 48) : (il>0 ? 12 : 3);
-    const uint16_t  kmask2 = il>1 ? 0xF0              : 0x0F;
-    const half        coef = il>1 ? 1.f/16.h          : 1.h;
-    const half ml = d_all * sc * 32.h;
-    const half dl = d_all * sc * coef;
-    for (int i = 0; i < 16; ++i) {
-        const half q = il&1 ? ((ql[i] & kmask2) | ((qh[i] & kmask1) << 2))
-                            : ((ql[i] & kmask2) | ((qh[i] & kmask1) << 4));
-        reg[i/4][i%4] = dl * q - ml;
-    }
-}
-
-template<typename block_q, short nl, void (*dequantize_func)(device const block_q *, short, thread float4x4 &)>
-kernel void kernel_get_rows(
-        device const  void * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        uint3                tgpig[[threadgroup_position_in_grid]],
-        uint                 tiitg[[thread_index_in_threadgroup]],
-        uint3                tptg [[threads_per_threadgroup]]) {
-    //const int64_t i = tgpig;
-    //const int64_t r = ((device int32_t *) src1)[i];
-
-    const int64_t i10 = tgpig.x;
-    const int64_t i11 = tgpig.y;
-
-    const int64_t r = ((device int32_t *) ((device char *) src1 + i11*nb11 + i10*nb10))[0];
-
-    const int64_t i02 = i11;
-
-    for (int64_t ind = tiitg; ind < ne00/16; ind += tptg.x) {
-        float4x4 temp;
-        dequantize_func(
-            ((device const block_q *) ((device char *) src0 + r*nb01 + i02*nb02)) + ind/nl, ind%nl, temp);
-        *(((device float4x4 *) ((device char *) dst + i11*nb2 + i10*nb1)) + ind) = temp;
-    }
-}
-
-kernel void kernel_get_rows_f32(
-        device const  void * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        uint3                tgpig[[threadgroup_position_in_grid]],
-        uint                 tiitg[[thread_index_in_threadgroup]],
-        uint3                tptg [[threads_per_threadgroup]]) {
-    const int64_t i10 = tgpig.x;
-    const int64_t i11 = tgpig.y;
-
-    const int64_t r = ((device int32_t *) ((device char *) src1 + i11*nb11 + i10*nb10))[0];
-
-    const int64_t i02 = i11;
-
-    for (int ind = tiitg; ind < ne00; ind += tptg.x) {
-        ((device float *) ((device char *) dst + i11*nb2 + i10*nb1))[ind] =
-            ((device float *) ((device char *) src0 + r*nb01 + i02*nb02))[ind];
-    }
-}
-
-kernel void kernel_get_rows_f16(
-        device const  void * src0,
-        device const  char * src1,
-        device       float * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        uint3                tgpig[[threadgroup_position_in_grid]],
-        uint                 tiitg[[thread_index_in_threadgroup]],
-        uint3                tptg [[threads_per_threadgroup]]) {
-    const int64_t i10 = tgpig.x;
-    const int64_t i11 = tgpig.y;
-
-    const int64_t r = ((device int32_t *) ((device char *) src1 + i11*nb11 + i10*nb10))[0];
-
-    const int64_t i02 = i11;
-
-    for (int ind = tiitg; ind < ne00; ind += tptg.x) {
-        ((device float *) ((device char *) dst + i11*nb2 + i10*nb1))[ind] =
-            ((device half *) ((device char *) src0 + r*nb01 + i02*nb02))[ind];
-    }
-}
-
-kernel void kernel_get_rows_i32(
-        device const  void * src0,
-        device const  char * src1,
-        device     int32_t * dst,
-        constant   int64_t & ne00,
-        constant  uint64_t & nb01,
-        constant  uint64_t & nb02,
-        constant   int64_t & ne10,
-        constant  uint64_t & nb10,
-        constant  uint64_t & nb11,
-        constant  uint64_t & nb1,
-        constant  uint64_t & nb2,
-        uint3                tgpig[[threadgroup_position_in_grid]],
-        uint                 tiitg[[thread_index_in_threadgroup]],
-        uint3                tptg [[threads_per_threadgroup]]) {
-    const int64_t i10 = tgpig.x;
-    const int64_t i11 = tgpig.y;
-
-    const int64_t r = ((device int32_t *) ((device char *) src1 + i11*nb11 + i10*nb10))[0];
-
-    const int64_t i02 = i11;
-
-    for (int ind = tiitg; ind < ne00; ind += tptg.x) {
-        ((device int32_t *) ((device char *) dst + i11*nb2 + i10*nb1))[ind] =
-            ((device int32_t *) ((device char *) src0 + r*nb01 + i02*nb02))[ind];
-    }
-}
-
-
-#define BLOCK_SIZE_M 64 // 8 simdgroup matrices from matrix A
-#define BLOCK_SIZE_N 32 // 4 simdgroup matrices from matrix B
-#define BLOCK_SIZE_K 32
-#define THREAD_MAT_M 4 // each thread take 4 simdgroup matrices from matrix A
-#define THREAD_MAT_N 2 // each thread take 2 simdgroup matrices from matrix B
-#define THREAD_PER_BLOCK 128
-#define THREAD_PER_ROW 2 // 2 thread for each row in matrix A to load numbers
-#define THREAD_PER_COL 4 // 4 thread for each row in matrix B to load numbers
-#define SG_MAT_SIZE 64 // simdgroup matrix is of shape 8x8
-#define SG_MAT_ROW 8
-
-// each block_q contains 16*nl weights
-template<typename block_q, short nl, void (*dequantize_func)(device const block_q *, short, thread half4x4 &)>
-void kernel_mul_mm_impl(device const  uchar * src0,
-                        device const  uchar * src1,
-                        device        float * dst,
-                        constant    int64_t & ne00,
-                        constant    int64_t & ne02,
-                        constant   uint64_t & nb01,
-                        constant   uint64_t & nb02,
-                        constant    int64_t & ne12,
-                        constant   uint64_t & nb10,
-                        constant   uint64_t & nb11,
-                        constant   uint64_t & nb12,
-                        constant    int64_t & ne0,
-                        constant    int64_t & ne1,
-                        constant       uint & r2,
-                        constant       uint & r3,
-                        threadgroup   uchar * shared_memory [[threadgroup(0)]],
-                        uint3                 tgpig[[threadgroup_position_in_grid]],
-                        uint                  tiitg[[thread_index_in_threadgroup]],
-                        uint                  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    threadgroup half  * sa = (threadgroup half  *)(shared_memory);
-    threadgroup float * sb = (threadgroup float *)(shared_memory + 4096);
-
-    const uint r0 = tgpig.y;
-    const uint r1 = tgpig.x;
-    const uint im = tgpig.z;
-
-    // if this block is of 64x32 shape or smaller
-    short n_rows = (ne0 - r0 * BLOCK_SIZE_M < BLOCK_SIZE_M) ? (ne0 - r0 * BLOCK_SIZE_M) : BLOCK_SIZE_M;
-    short n_cols = (ne1 - r1 * BLOCK_SIZE_N < BLOCK_SIZE_N) ? (ne1 - r1 * BLOCK_SIZE_N) : BLOCK_SIZE_N;
-
-    // a thread shouldn't load data outside of the matrix
-    short thread_row = ((short)tiitg/THREAD_PER_ROW) < n_rows ? ((short)tiitg/THREAD_PER_ROW) : n_rows - 1;
-    short thread_col = ((short)tiitg/THREAD_PER_COL) < n_cols ? ((short)tiitg/THREAD_PER_COL) : n_cols - 1;
-
-    simdgroup_half8x8  ma[4];
-    simdgroup_float8x8 mb[2];
-    simdgroup_float8x8 c_res[8];
-    for (int i = 0; i < 8; i++){
-        c_res[i] = make_filled_simdgroup_matrix<float, 8>(0.f);
-    }
-
-    short il = (tiitg % THREAD_PER_ROW);
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    uint   offset0 = (i12/r2)*nb02 + (i13/r3)*(nb02*ne02);
-    ushort offset1 = il/nl;
-
-    device const block_q * x = (device const block_q *)(src0 + (r0 * BLOCK_SIZE_M + thread_row) * nb01 + offset0) + offset1;
-    device const float   * y = (device const float   *)(src1
-        + nb12 * im
-        + nb11 * (r1 * BLOCK_SIZE_N + thread_col)
-        + nb10 * (BLOCK_SIZE_K / THREAD_PER_COL * (tiitg % THREAD_PER_COL)));
-
-    for (int loop_k = 0; loop_k < ne00; loop_k += BLOCK_SIZE_K) {
-        // load data and store to threadgroup memory
-        half4x4 temp_a;
-        dequantize_func(x, il, temp_a);
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        #pragma unroll(16)
-        for (int i = 0; i < 16; i++) {
-            *(sa + SG_MAT_SIZE * ((tiitg / THREAD_PER_ROW / 8) \
-            +                     (tiitg % THREAD_PER_ROW) * 16 + (i / 8) * 8) \
-            +                     (tiitg / THREAD_PER_ROW) % 8  + (i & 7) * 8) = temp_a[i/4][i%4];
-        }
-
-        *(threadgroup float2x4 *)(sb + (tiitg % THREAD_PER_COL) * 8 * 32 + 8 * (tiitg / THREAD_PER_COL)) = *((device float2x4 *)y);
-
-        il = (il + 2 < nl) ? il + 2 : il % 2;
-        x  = (il < 2) ? x + (2+nl-1)/nl : x;
-        y += BLOCK_SIZE_K;
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        // load matrices from threadgroup memory and conduct outer products
-        threadgroup half  * lsma = (sa + THREAD_MAT_M * SG_MAT_SIZE * (sgitg % 2));
-        threadgroup float * lsmb = (sb + THREAD_MAT_N * SG_MAT_SIZE * (sgitg / 2));
-
-        #pragma unroll(4)
-        for (int ik = 0; ik < BLOCK_SIZE_K / 8; ik++) {
-            #pragma unroll(4)
-            for (int i = 0; i < 4; i++) {
-                simdgroup_load(ma[i],lsma + SG_MAT_SIZE * i);
-            }
-            simdgroup_barrier(mem_flags::mem_none);
-            #pragma unroll(2)
-            for (int i = 0; i < 2; i++) {
-                simdgroup_load(mb[i],lsmb + SG_MAT_SIZE * i);
-            }
-
-            lsma += BLOCK_SIZE_M / SG_MAT_ROW * SG_MAT_SIZE;
-            lsmb += BLOCK_SIZE_N / SG_MAT_ROW * SG_MAT_SIZE;
-
-            #pragma unroll(8)
-            for (int i = 0; i < 8; i++){
-                simdgroup_multiply_accumulate(c_res[i], mb[i/4], ma[i%4], c_res[i]);
-            }
-        }
-    }
-
-    if ((r0 + 1) * BLOCK_SIZE_M <= ne0 && (r1 + 1) * BLOCK_SIZE_N <= ne1) {
-        device float * C = dst + (BLOCK_SIZE_M * r0 + 32 * (sgitg &  1)) \
-                               + (BLOCK_SIZE_N * r1 + 16 * (sgitg >> 1)) * ne0 + im*ne1*ne0;
-        for (int i = 0; i < 8; i++) {
-            simdgroup_store(c_res[i], C + 8 * (i%4) + 8 * ne0 * (i/4), ne0);
-        }
-    } else {
-        // block is smaller than 64x32, we should avoid writing data outside of the matrix
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-        threadgroup float * temp_str = ((threadgroup float *)shared_memory) \
-                                      + 32 * (sgitg&1) + (16 * (sgitg>>1)) * BLOCK_SIZE_M;
-        for (int i = 0; i < 8; i++) {
-            simdgroup_store(c_res[i], temp_str + 8 * (i%4) + 8 * BLOCK_SIZE_M * (i/4), BLOCK_SIZE_M);
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        device float * C = dst + (BLOCK_SIZE_M * r0) + (BLOCK_SIZE_N * r1) * ne0 + im*ne1*ne0;
-        if (sgitg == 0) {
-            for (int i = 0; i < n_rows; i++) {
-                for (int j = tiitg; j < n_cols; j += BLOCK_SIZE_N) {
-                    *(C + i + j * ne0) = *(temp_str + i + j * BLOCK_SIZE_M);
-                }
-            }
-        }
-    }
-}
-
-// same as kernel_mul_mm_impl, but src1 and dst are accessed via indices stored in src1ids
-template<typename block_q, short nl, void (*dequantize_func)(device const block_q *, short, thread half4x4 &)>
-void kernel_mul_mm_id_impl(
-        device const  uchar * src0,
-        device const  uchar * src1,
-        thread        short * src1ids,
-        device        float * dst,
-        constant    int64_t & ne00,
-        constant    int64_t & ne02,
-        constant   uint64_t & nb01,
-        constant   uint64_t & nb02,
-        constant    int64_t & ne12,
-        constant   uint64_t & nb10,
-        constant   uint64_t & nb11,
-        constant   uint64_t & nb12,
-        constant    int64_t & ne0,
-                    int64_t   ne1,
-        constant       uint & r2,
-        constant       uint & r3,
-        threadgroup   uchar * shared_memory,
-        uint3                 tgpig[[threadgroup_position_in_grid]],
-        uint                  tiitg[[thread_index_in_threadgroup]],
-        uint                  sgitg[[simdgroup_index_in_threadgroup]]) {
-
-    threadgroup half  * sa = (threadgroup half  *)(shared_memory);
-    threadgroup float * sb = (threadgroup float *)(shared_memory + 4096);
-
-    const uint r0 = tgpig.y;
-    const uint r1 = tgpig.x;
-    const uint im = tgpig.z;
-
-    if (r1 * BLOCK_SIZE_N >= ne1) return;
-
-    // if this block is of 64x32 shape or smaller
-    short n_rows = (ne0 - r0 * BLOCK_SIZE_M < BLOCK_SIZE_M) ? (ne0 - r0 * BLOCK_SIZE_M) : BLOCK_SIZE_M;
-    short n_cols = (ne1 - r1 * BLOCK_SIZE_N < BLOCK_SIZE_N) ? (ne1 - r1 * BLOCK_SIZE_N) : BLOCK_SIZE_N;
-
-    // a thread shouldn't load data outside of the matrix
-    short thread_row = ((short)tiitg/THREAD_PER_ROW) < n_rows ? ((short)tiitg/THREAD_PER_ROW) : n_rows - 1;
-    short thread_col = ((short)tiitg/THREAD_PER_COL) < n_cols ? ((short)tiitg/THREAD_PER_COL) : n_cols - 1;
-
-    simdgroup_half8x8  ma[4];
-    simdgroup_float8x8 mb[2];
-    simdgroup_float8x8 c_res[8];
-    for (int i = 0; i < 8; i++){
-        c_res[i] = make_filled_simdgroup_matrix<float, 8>(0.f);
-    }
-
-    short il = (tiitg % THREAD_PER_ROW);
-
-    const uint i12 = im%ne12;
-    const uint i13 = im/ne12;
-
-    uint   offset0 = (i12/r2)*nb02 + (i13/r3)*(nb02*ne02);
-    ushort offset1 = il/nl;
-
-    device const block_q * x = (device const block_q *)(src0 + (r0 * BLOCK_SIZE_M + thread_row) * nb01 + offset0) + offset1;
-    device const float   * y = (device const float   *)(src1
-        + nb12 * im
-        + nb11 * src1ids[r1 * BLOCK_SIZE_N + thread_col]
-        + nb10 * (BLOCK_SIZE_K / THREAD_PER_COL * (tiitg % THREAD_PER_COL)));
-
-    for (int loop_k = 0; loop_k < ne00; loop_k += BLOCK_SIZE_K) {
-        // load data and store to threadgroup memory
-        half4x4 temp_a;
-        dequantize_func(x, il, temp_a);
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        for (int i = 0; i < 16; i++) {
-            *(sa + SG_MAT_SIZE * ((tiitg / THREAD_PER_ROW / 8) \
-            +                     (tiitg % THREAD_PER_ROW) * 16 + (i / 8) * 8) \
-            +                     (tiitg / THREAD_PER_ROW) % 8  + (i & 7) * 8) = temp_a[i/4][i%4];
-        }
-
-        *(threadgroup float2x4 *)(sb + (tiitg % THREAD_PER_COL) * 8 * 32 + 8 * (tiitg / THREAD_PER_COL)) = *((device float2x4 *)y);
-
-        il = (il + 2 < nl) ? il + 2 : il % 2;
-        x  = (il < 2) ? x + (2+nl-1)/nl : x;
-        y += BLOCK_SIZE_K;
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        // load matrices from threadgroup memory and conduct outer products
-        threadgroup half  * lsma = (sa + THREAD_MAT_M * SG_MAT_SIZE * (sgitg % 2));
-        threadgroup float * lsmb = (sb + THREAD_MAT_N * SG_MAT_SIZE * (sgitg / 2));
-
-        for (int ik = 0; ik < BLOCK_SIZE_K / 8; ik++) {
-            for (int i = 0; i < 4; i++) {
-                simdgroup_load(ma[i],lsma + SG_MAT_SIZE * i);
-            }
-            simdgroup_barrier(mem_flags::mem_none);
-            for (int i = 0; i < 2; i++) {
-                simdgroup_load(mb[i],lsmb + SG_MAT_SIZE * i);
-            }
-
-            lsma += BLOCK_SIZE_M / SG_MAT_ROW * SG_MAT_SIZE;
-            lsmb += BLOCK_SIZE_N / SG_MAT_ROW * SG_MAT_SIZE;
-
-            for (int i = 0; i < 8; i++){
-                simdgroup_multiply_accumulate(c_res[i], mb[i/4], ma[i%4], c_res[i]);
-            }
-        }
-    }
-
-    {
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-        threadgroup float * temp_str = ((threadgroup float *)shared_memory) \
-                                      + 32 * (sgitg&1) + (16 * (sgitg>>1)) * BLOCK_SIZE_M;
-        for (int i = 0; i < 8; i++) {
-            simdgroup_store(c_res[i], temp_str + 8 * (i%4) + 8 * BLOCK_SIZE_M * (i/4), BLOCK_SIZE_M);
-        }
-
-        threadgroup_barrier(mem_flags::mem_threadgroup);
-
-        device float * C = dst + (BLOCK_SIZE_M * r0) + im*ne1*ne0;
-        if (sgitg == 0) {
-            for (int i = 0; i < n_rows; i++) {
-                for (int j = tiitg; j < n_cols; j += BLOCK_SIZE_N) {
-                    *(C + i + src1ids[j + r1*BLOCK_SIZE_N] * ne0) = *(temp_str + i + j * BLOCK_SIZE_M);
-                }
-            }
-        }
-    }
-}
-
-template<typename block_q, short nl, void (*dequantize_func)(device const block_q *, short, thread half4x4 &)>
-kernel void kernel_mul_mm(device const  uchar * src0,
-                          device const  uchar * src1,
-                          device        float * dst,
-                          constant    int64_t & ne00,
-                          constant    int64_t & ne02,
-                          constant   uint64_t & nb01,
-                          constant   uint64_t & nb02,
-                          constant    int64_t & ne12,
-                          constant   uint64_t & nb10,
-                          constant   uint64_t & nb11,
-                          constant   uint64_t & nb12,
-                          constant    int64_t & ne0,
-                          constant    int64_t & ne1,
-                          constant       uint & r2,
-                          constant       uint & r3,
-                          threadgroup   uchar * shared_memory [[threadgroup(0)]],
-                          uint3                 tgpig[[threadgroup_position_in_grid]],
-                          uint                  tiitg[[thread_index_in_threadgroup]],
-                          uint                  sgitg[[simdgroup_index_in_threadgroup]]) {
-    kernel_mul_mm_impl<block_q, nl, dequantize_func>(
-        src0,
-        src1,
-        dst,
-        ne00,
-        ne02,
-        nb01,
-        nb02,
-        ne12,
-        nb10,
-        nb11,
-        nb12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        shared_memory,
-        tgpig,
-        tiitg,
-        sgitg);
-}
-
-template<typename block_q, short nl, void (*dequantize_func)(device const block_q *, short, thread half4x4 &)>
-kernel void kernel_mul_mm_id(
-        device const   uchar * ids,
-        device const   uchar * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const   uchar * src00,
-        device const   uchar * src01,
-        device const   uchar * src02,
-        device const   uchar * src03,
-        device const   uchar * src04,
-        device const   uchar * src05,
-        device const   uchar * src06,
-        device const   uchar * src07,
-        threadgroup    uchar * shared_memory [[threadgroup(0)]],
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const uchar * src0s[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    // expert id
-    const int32_t id = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    // row indices of src1 for expert id
-    int64_t _ne1 = 0;
-    short src1ids[512];
-
-    for (int64_t i1 = 0; i1 < ne1; i1++) {
-        if (((device int32_t *) (ids + i1*nbi1))[idx] == id) {
-            src1ids[_ne1++] = i1;
-        }
-    }
-
-    kernel_mul_mm_id_impl<block_q, nl, dequantize_func>(
-        src0s[id],
-        src1,
-        src1ids,
-        dst,
-        ne00,
-        ne02,
-        nb01,
-        nb02,
-        ne12,
-        nb10,
-        nb11,
-        nb12,
-        ne0,
-        _ne1,
-        r2,
-        r3,
-        shared_memory,
-        tgpig,
-        tiitg,
-        sgitg);
-}
-
-#if QK_K == 256
-#define QK_NL 16
-#else
-#define QK_NL 4
-#endif
-
-//
-// get rows
-//
-
-typedef void (get_rows_t)(
-        device const void * src0,
-        device const char * src1,
-        device      float * dst,
-        constant  int64_t & ne00,
-        constant uint64_t & nb01,
-        constant uint64_t & nb02,
-        constant  int64_t & ne10,
-        constant uint64_t & nb10,
-        constant uint64_t & nb11,
-        constant uint64_t & nb1,
-        constant uint64_t & nb2,
-        uint3, uint, uint3);
-
-//template [[host_name("kernel_get_rows_f32")]]  kernel get_rows_t kernel_get_rows<float4x4,   1, dequantize_f32>;
-//template [[host_name("kernel_get_rows_f16")]]  kernel get_rows_t kernel_get_rows<half4x4,    1, dequantize_f16>;
-template [[host_name("kernel_get_rows_q4_0")]] kernel get_rows_t kernel_get_rows<block_q4_0, 2, dequantize_q4_0>;
-template [[host_name("kernel_get_rows_q4_1")]] kernel get_rows_t kernel_get_rows<block_q4_1, 2, dequantize_q4_1>;
-template [[host_name("kernel_get_rows_q5_0")]] kernel get_rows_t kernel_get_rows<block_q5_0, 2, dequantize_q5_0>;
-template [[host_name("kernel_get_rows_q5_1")]] kernel get_rows_t kernel_get_rows<block_q5_1, 2, dequantize_q5_1>;
-template [[host_name("kernel_get_rows_q8_0")]] kernel get_rows_t kernel_get_rows<block_q8_0, 2, dequantize_q8_0>;
-template [[host_name("kernel_get_rows_q2_K")]] kernel get_rows_t kernel_get_rows<block_q2_K, QK_NL, dequantize_q2_K>;
-template [[host_name("kernel_get_rows_q3_K")]] kernel get_rows_t kernel_get_rows<block_q3_K, QK_NL, dequantize_q3_K>;
-template [[host_name("kernel_get_rows_q4_K")]] kernel get_rows_t kernel_get_rows<block_q4_K, QK_NL, dequantize_q4_K>;
-template [[host_name("kernel_get_rows_q5_K")]] kernel get_rows_t kernel_get_rows<block_q5_K, QK_NL, dequantize_q5_K>;
-template [[host_name("kernel_get_rows_q6_K")]] kernel get_rows_t kernel_get_rows<block_q6_K, QK_NL, dequantize_q6_K>;
-
-//
-// matrix-matrix multiplication
-//
-
-typedef void (mat_mm_t)(
-        device const  uchar * src0,
-        device const  uchar * src1,
-        device        float * dst,
-        constant    int64_t & ne00,
-        constant    int64_t & ne02,
-        constant   uint64_t & nb01,
-        constant   uint64_t & nb02,
-        constant    int64_t & ne12,
-        constant   uint64_t & nb10,
-        constant   uint64_t & nb11,
-        constant   uint64_t & nb12,
-        constant    int64_t & ne0,
-        constant    int64_t & ne1,
-        constant       uint & r2,
-        constant       uint & r3,
-        threadgroup   uchar *,
-        uint3, uint, uint);
-
-template [[host_name("kernel_mul_mm_f32_f32")]]  kernel mat_mm_t kernel_mul_mm<float4x4,   1,     dequantize_f32>;
-template [[host_name("kernel_mul_mm_f16_f32")]]  kernel mat_mm_t kernel_mul_mm<half4x4,    1,     dequantize_f16>;
-template [[host_name("kernel_mul_mm_q4_0_f32")]] kernel mat_mm_t kernel_mul_mm<block_q4_0, 2,     dequantize_q4_0>;
-template [[host_name("kernel_mul_mm_q4_1_f32")]] kernel mat_mm_t kernel_mul_mm<block_q4_1, 2,     dequantize_q4_1>;
-template [[host_name("kernel_mul_mm_q5_0_f32")]] kernel mat_mm_t kernel_mul_mm<block_q5_0, 2,     dequantize_q5_0>;
-template [[host_name("kernel_mul_mm_q5_1_f32")]] kernel mat_mm_t kernel_mul_mm<block_q5_1, 2,     dequantize_q5_1>;
-template [[host_name("kernel_mul_mm_q8_0_f32")]] kernel mat_mm_t kernel_mul_mm<block_q8_0, 2,     dequantize_q8_0>;
-template [[host_name("kernel_mul_mm_q2_K_f32")]] kernel mat_mm_t kernel_mul_mm<block_q2_K, QK_NL, dequantize_q2_K>;
-template [[host_name("kernel_mul_mm_q3_K_f32")]] kernel mat_mm_t kernel_mul_mm<block_q3_K, QK_NL, dequantize_q3_K>;
-template [[host_name("kernel_mul_mm_q4_K_f32")]] kernel mat_mm_t kernel_mul_mm<block_q4_K, QK_NL, dequantize_q4_K>;
-template [[host_name("kernel_mul_mm_q5_K_f32")]] kernel mat_mm_t kernel_mul_mm<block_q5_K, QK_NL, dequantize_q5_K>;
-template [[host_name("kernel_mul_mm_q6_K_f32")]] kernel mat_mm_t kernel_mul_mm<block_q6_K, QK_NL, dequantize_q6_K>;
-
-//
-// indirect matrix-matrix multiplication
-//
-
-typedef void (mat_mm_id_t)(
-        device const   uchar * ids,
-        device const   uchar * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const   uchar * src00,
-        device const   uchar * src01,
-        device const   uchar * src02,
-        device const   uchar * src03,
-        device const   uchar * src04,
-        device const   uchar * src05,
-        device const   uchar * src06,
-        device const   uchar * src07,
-        threadgroup    uchar *,
-        uint3, uint, uint);
-
-template [[host_name("kernel_mul_mm_id_f32_f32")]]  kernel mat_mm_id_t kernel_mul_mm_id<float4x4,   1,     dequantize_f32>;
-template [[host_name("kernel_mul_mm_id_f16_f32")]]  kernel mat_mm_id_t kernel_mul_mm_id<half4x4,    1,     dequantize_f16>;
-template [[host_name("kernel_mul_mm_id_q4_0_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q4_0, 2,     dequantize_q4_0>;
-template [[host_name("kernel_mul_mm_id_q4_1_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q4_1, 2,     dequantize_q4_1>;
-template [[host_name("kernel_mul_mm_id_q5_0_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q5_0, 2,     dequantize_q5_0>;
-template [[host_name("kernel_mul_mm_id_q5_1_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q5_1, 2,     dequantize_q5_1>;
-template [[host_name("kernel_mul_mm_id_q8_0_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q8_0, 2,     dequantize_q8_0>;
-template [[host_name("kernel_mul_mm_id_q2_K_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q2_K, QK_NL, dequantize_q2_K>;
-template [[host_name("kernel_mul_mm_id_q3_K_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q3_K, QK_NL, dequantize_q3_K>;
-template [[host_name("kernel_mul_mm_id_q4_K_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q4_K, QK_NL, dequantize_q4_K>;
-template [[host_name("kernel_mul_mm_id_q5_K_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q5_K, QK_NL, dequantize_q5_K>;
-template [[host_name("kernel_mul_mm_id_q6_K_f32")]] kernel mat_mm_id_t kernel_mul_mm_id<block_q6_K, QK_NL, dequantize_q6_K>;
-
-//
-// matrix-vector multiplication
-//
-
-[[host_name("kernel_mul_mv_id_f32_f32")]]
-kernel void kernel_mul_mv_id_f32_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_f32_f32_impl(
-        src0[id],
-        src1 + bid*nb11,
-        dst  + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        nb00,
-        nb01,
-        nb02,
-        ne10,
-        ne11,
-        ne12,
-        nb10,
-        nb11,
-        nb12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg);
-}
-
-[[host_name("kernel_mul_mv_id_f16_f32")]]
-kernel void kernel_mul_mv_id_f16_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_f16_f32_impl(
-        src0[id],
-        src1 + bid*nb11,
-        dst  + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        nb00,
-        nb01,
-        nb02,
-        ne10,
-        ne11,
-        ne12,
-        nb10,
-        nb11,
-        nb12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg);
-}
-
-[[host_name("kernel_mul_mv_id_q8_0_f32")]]
-kernel void kernel_mul_mv_id_q8_0_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q8_0_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q4_0_f32")]]
-kernel void kernel_mul_mv_id_q4_0_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    mul_vec_q_n_f32_impl<block_q4_0, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q4_1_f32")]]
-kernel void kernel_mul_mv_id_q4_1_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    mul_vec_q_n_f32_impl<block_q4_1, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q5_0_f32")]]
-kernel void kernel_mul_mv_id_q5_0_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    mul_vec_q_n_f32_impl<block_q5_0, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q5_1_f32")]]
-kernel void kernel_mul_mv_id_q5_1_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    mul_vec_q_n_f32_impl<block_q5_1, N_DST, N_SIMDGROUP, N_SIMDWIDTH>(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q2_K_f32")]]
-kernel void kernel_mul_mv_id_q2_K_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q2_K_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q3_K_f32")]]
-kernel void kernel_mul_mv_id_q3_K_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q3_K_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q4_K_f32")]]
-kernel void kernel_mul_mv_id_q4_K_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q4_K_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q5_K_f32")]]
-kernel void kernel_mul_mv_id_q5_K_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q5_K_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
-
-[[host_name("kernel_mul_mv_id_q6_K_f32")]]
-kernel void kernel_mul_mv_id_q6_K_f32(
-        device const    char * ids,
-        device const    char * src1,
-        device         float * dst,
-        constant    uint64_t & nbi1,
-        constant     int64_t & ne00,
-        constant     int64_t & ne01,
-        constant     int64_t & ne02,
-        constant    uint64_t & nb00,
-        constant    uint64_t & nb01,
-        constant    uint64_t & nb02,
-        constant     int64_t & ne10,
-        constant     int64_t & ne11,
-        constant     int64_t & ne12,
-        constant     int64_t & ne13,
-        constant    uint64_t & nb10,
-        constant    uint64_t & nb11,
-        constant    uint64_t & nb12,
-        constant     int64_t & ne0,
-        constant     int64_t & ne1,
-        constant    uint64_t & nb1,
-        constant        uint & r2,
-        constant        uint & r3,
-        constant         int & idx,
-        device const    char * src00,
-        device const    char * src01,
-        device const    char * src02,
-        device const    char * src03,
-        device const    char * src04,
-        device const    char * src05,
-        device const    char * src06,
-        device const    char * src07,
-        uint3                  tgpig[[threadgroup_position_in_grid]],
-        uint                   tiitg[[thread_index_in_threadgroup]],
-        uint                   tiisg[[thread_index_in_simdgroup]],
-        uint                   sgitg[[simdgroup_index_in_threadgroup]]) {
-    device const char * src0[8] = {src00, src01, src02, src03, src04, src05, src06, src07};
-
-    const int64_t bid = tgpig.z/(ne12*ne13);
-
-    tgpig.z = tgpig.z%(ne12*ne13);
-
-    const int32_t id = ((device int32_t *) (ids + bid*nbi1))[idx];
-
-    kernel_mul_mv_q6_K_f32_impl(
-        src0[id],
-        (device const float *) (src1 + bid*nb11),
-        dst + bid*ne0,
-        ne00,
-        ne01,
-        ne02,
-        ne10,
-        ne12,
-        ne0,
-        ne1,
-        r2,
-        r3,
-        tgpig,
-        tiisg,
-        sgitg);
-}
diff --git a/src-tauri/src/main.rs b/src-tauri/src/main.rs
index 7fea8fd..d752ed4 100644
--- a/src-tauri/src/main.rs
+++ b/src-tauri/src/main.rs
@@ -5,17 +5,12 @@
 
 use tauri::{
     http::{HttpRange, ResponseBuilder},
-    Manager, State, Window,
+    AppHandle, Manager, State, Window,
 };
 use tauri_plugin_sql::{Migration, MigrationKind};
 
 use std::{
-    cmp::min,
-    env,
-    io::{Read, Seek, SeekFrom},
-    path::PathBuf,
-    str::FromStr,
-    sync::{Arc, Mutex},
+    cmp::min, env, io::{Read, Seek, SeekFrom}, path::PathBuf, str::FromStr, sync::{Arc, Mutex}
 };
 
 use crossbeam_channel::{unbounded, Sender};
@@ -28,66 +23,132 @@ use module::{
     deleter::NoteDeleter,
     device::{self, Device},
     downloader::{
-        fugumt::FugumtModelDownloader, honyaku13b::Honyaku13BModelDownloader,
-        vosk::VoskModelDownloader, whisper::WhisperModelDownloader,
+        model_dir::ModelDirDownloader, sbv2::StyleBertVits2ModelDownloader,
+        sbv2_voice::StyleBertVits2VoiceModelDownloader, vosk::VoskModelDownloader,
+        whisper::WhisperModelDownloader,
     },
+    model_type_sbv2::ModelTypeStyleBertVits2,
     model_type_vosk::ModelTypeVosk,
     model_type_whisper::ModelTypeWhisper,
     permissions,
     record::Record,
     record_desktop::RecordDesktop,
     screenshot::{self, AppWindow},
+    synthesizer::{self, Synthesizer},
     transcription::{TraceCompletion, Transcription},
     transcription_amivoice::TranscriptionAmivoice,
     transcription_online::TranscriptionOnline,
+    translation_en::TranslationEn,
     translation_ja::TranslationJa,
     translation_ja_high::TranslationJaHigh,
 };
 
 struct RecordState(Arc<Mutex<Option<Sender<()>>>>);
+struct SynthesizeState(Arc<Mutex<Option<Synthesizer>>>);
 
 const BUNDLE_IDENTIFIER: &str = "blog.aota.Lycoris";
 
 #[tauri::command]
-fn delete_note_command(window: Window, note_id: u64) {
+fn list_synthesize_models_command(app_handle: AppHandle) -> Vec<String> {
+    synthesizer::list_models(app_handle)
+}
+
+#[tauri::command]
+async fn synthesize_init_command(
+    state: State<'_, SynthesizeState>,
+    app_handle: AppHandle,
+    model: String,
+) -> Result<bool, ()> {
+    // Construct first, then lock: the mutex is held only while the slot is overwritten.
+    let fresh = Synthesizer::new(app_handle, model);
+    // Overwriting the slot drops whichever synthesizer was stored before.
+    *state.0.lock().unwrap() = Some(fresh);
+    Ok(true)
+}
+
+#[tauri::command]
+fn synthesize_finalize_command(state: State<'_, SynthesizeState>) -> bool {
+    // Emptying the slot drops the stored synthesizer, if any; the command always returns true.
+    *state.0.lock().unwrap() = None;
+    true
+}
+
+#[tauri::command]
+async fn synthesize_command(
+    state: State<'_, SynthesizeState>,
+    text: String,
+    sdp_ratio: f32,
+    length_scale: f32,
+) -> Result<Vec<u8>, String> {
+    // Return Err instead of panicking when no synthesizer is stored.
+    let mut lock = state.0.lock().unwrap();
+    lock.as_mut().ok_or("synthesizer not initialized")?.synthesize(text, sdp_ratio, length_scale)
+}
+
+#[tauri::command]
+fn delete_note_command(app_handle: AppHandle, note_id: u64) {
     std::thread::spawn(move || {
-        let deleter = NoteDeleter::new(window.app_handle().clone());
+        let deleter = NoteDeleter::new(app_handle);
         deleter.delete(note_id)
     });
 }
 
 #[tauri::command]
-fn download_whisper_model_command(window: Window, model: String) {
+fn download_whisper_model_command(app_handle: AppHandle, model: String) {
     std::thread::spawn(move || {
-        let dl = WhisperModelDownloader::new(window.app_handle().clone());
+        let dl = WhisperModelDownloader::new(app_handle);
         dl.download(ModelTypeWhisper::from_str(&model).unwrap())
     });
 }
 
 #[tauri::command]
-fn download_vosk_model_command(window: Window, model: String) {
+fn download_vosk_model_command(app_handle: AppHandle, model: String) {
     std::thread::spawn(move || {
-        let dl = VoskModelDownloader::new(window.app_handle().clone());
+        let dl = VoskModelDownloader::new(app_handle);
         dl.download(ModelTypeVosk::from_str(&model).unwrap())
     });
 }
 
 #[tauri::command]
-fn download_fugumt_model_command(window: Window) {
+fn download_fugumt_enja_model_command(app_handle: AppHandle) {
     std::thread::spawn(move || {
-        let dl = FugumtModelDownloader::new(window.app_handle().clone());
-        dl.download()
+        let dl = ModelDirDownloader::new(app_handle);
+        dl.download("fugumt-en-ja", "downloadFugumtEnJaProgress")
     });
 }
 
 #[tauri::command]
-fn download_honyaku13b_model_command(window: Window) {
+fn download_fugumt_jaen_model_command(app_handle: AppHandle) {
     std::thread::spawn(move || {
-        let dl = Honyaku13BModelDownloader::new(window.app_handle().clone());
+        let dl = ModelDirDownloader::new(app_handle);
+        dl.download("fugumt-ja-en", "downloadFugumtJaEnProgress")
+    });
+}
+
+#[tauri::command]
+fn download_honyaku13b_model_command(app_handle: AppHandle) {
+    // Detached worker thread; progress is emitted as "downloadHonyaku13BProgress" events.
+    std::thread::spawn(move || {
+        ModelDirDownloader::new(app_handle).download("honyaku-13b", "downloadHonyaku13BProgress")
+    });
+}
+
+#[tauri::command]
+fn download_sbv2_command(app_handle: AppHandle) {
+    std::thread::spawn(move || {
+        let dl = StyleBertVits2ModelDownloader::new(app_handle);
         dl.download()
     });
 }
 
+#[tauri::command]
+fn download_sbv2_model_command(app_handle: AppHandle, model: String) {
+    std::thread::spawn(move || {
+        let dl = StyleBertVits2VoiceModelDownloader::new(app_handle);
+        dl.download(ModelTypeStyleBertVits2::from_str(&model).unwrap())
+    });
+}
+
 #[tauri::command]
 fn list_devices_command() -> Vec<Device> {
     device::list_devices()
@@ -104,8 +165,9 @@ fn list_app_windows_command(app_name: String) -> Vec<AppWindow> {
 }
 
 #[tauri::command]
-fn screenshot_command(window: Window, window_id: u32, note_id: u64) -> bool {
-    screenshot::screenshot(window_id, note_id, window.app_handle().clone())
+async fn screenshot_command(app_handle: AppHandle, window_id: u32, note_id: u64) -> Result<bool, ()> {
+    let result = screenshot::screenshot(window_id, note_id, app_handle);
+    Ok(result)
 }
 
 #[tauri::command]
@@ -124,9 +186,9 @@ fn has_microphone_permission_command(window: Window) -> bool {
 }
 
 #[tauri::command]
-fn execute_action_command(window: Window, note_id: u64) {
+fn execute_action_command(app_handle: AppHandle, note_id: u64) {
     std::thread::spawn(move || {
-        if action::initialize_action(window.app_handle().clone(), note_id) {
+        if action::initialize_action(app_handle, note_id) {
             let mut lock = action::SINGLETON_INSTANCE.lock().unwrap();
             if let Some(singleton) = lock.as_mut() {
                 singleton.execute();
@@ -141,7 +203,7 @@ fn execute_action_command(window: Window, note_id: u64) {
 #[tauri::command]
 fn start_command(
     state: State<'_, RecordState>,
-    window: Window,
+    app_handle: AppHandle,
     device_label: String,
     speaker_language: String,
     transcription_accuracy: String,
@@ -153,7 +215,7 @@ fn start_command(
     *lock = Some(stop_record_tx);
     std::thread::spawn(move || {
         if device_type == "microphone" {
-            let record = Record::new(window.app_handle().clone());
+            let record = Record::new(app_handle);
             record.start(
                 device_label,
                 speaker_language,
@@ -162,7 +224,7 @@ fn start_command(
                 stop_record_rx,
             );
         } else if device_type == "desktop" {
-            let record_desktop = RecordDesktop::new(window.app_handle().clone());
+            let record_desktop = RecordDesktop::new(app_handle);
             record_desktop.start(
                 speaker_language,
                 transcription_accuracy,
@@ -171,8 +233,8 @@ fn start_command(
                 None,
             );
         } else {
-            let record = Record::new(window.app_handle().clone());
-            let record_desktop = RecordDesktop::new(window.app_handle().clone());
+            let record = Record::new(app_handle.clone());
+            let record_desktop = RecordDesktop::new(app_handle);
 
             let (stop_record_clone_tx, stop_record_clone_rx) = unbounded();
             let speaker_language_clone = speaker_language.clone();
@@ -209,7 +271,7 @@ fn stop_command(state: State<'_, RecordState>) {
 #[tauri::command]
 fn start_trace_command(
     state: State<'_, RecordState>,
-    window: tauri::Window,
+    app_handle: AppHandle,
     speaker_language: String,
     transcription_accuracy: String,
     note_id: u64,
@@ -221,30 +283,31 @@ fn start_trace_command(
     std::thread::spawn(move || {
         if transcription_accuracy.starts_with("online-transcript") {
             let mut transcription_online = TranscriptionOnline::new(
-                window.app_handle(),
+                app_handle,
                 transcription_accuracy,
                 speaker_language,
                 note_id,
             );
             transcription_online.start(stop_convert_rx, true);
         } else if transcription_accuracy.starts_with("online-amivoice") {
-            let mut transcription_amivoice =
-                TranscriptionAmivoice::new(window.app_handle(), note_id);
+            let mut transcription_amivoice = TranscriptionAmivoice::new(app_handle, note_id);
             transcription_amivoice.start(stop_convert_rx, true);
         } else if transcription_accuracy.starts_with("online-chat") {
-            let mut chat_online = ChatOnline::new(window.app_handle(), speaker_language, note_id);
+            let mut chat_online = ChatOnline::new(app_handle, speaker_language, note_id);
             chat_online.start(stop_convert_rx, true);
         } else if transcription_accuracy.starts_with("fugumt-en-ja") {
-            let mut translation_ja =
-                TranslationJa::new(window.app_handle(), speaker_language, note_id);
+            let mut translation_ja = TranslationJa::new(app_handle, speaker_language, note_id);
             translation_ja.start(stop_convert_rx, true);
-        } else if transcription_accuracy.starts_with("honyaku13b-q4-0") {
+        } else if transcription_accuracy.starts_with("fugumt-ja-en") {
+            let mut translation_en = TranslationEn::new(app_handle, note_id);
+            translation_en.start(stop_convert_rx, true);
+        } else if transcription_accuracy.starts_with("honyaku-13b") {
             let mut translation_ja_high =
-                TranslationJaHigh::new(window.app_handle(), speaker_language, note_id);
+                TranslationJaHigh::new(app_handle, speaker_language, note_id);
             translation_ja_high.start(stop_convert_rx, true);
         } else {
             let mut transcription = Transcription::new(
-                window.app_handle(),
+                app_handle,
                 transcription_accuracy,
                 speaker_language,
                 note_id,
@@ -255,40 +318,18 @@ fn start_trace_command(
 }
 
 #[tauri::command]
-fn stop_trace_command(state: State<'_, RecordState>, window: tauri::Window) {
+fn stop_trace_command(state: State<'_, RecordState>, app_handle: AppHandle) {
     let mut lock = state.0.lock().unwrap();
     if let Some(stop_convert_tx) = lock.take() {
         stop_convert_tx.send(()).unwrap_or_else(|_| {
-            window
-                .app_handle()
+            app_handle
                 .emit_all("traceCompletion", TraceCompletion {})
                 .unwrap();
         })
     }
 }
 
-fn set_whisper_metal_lib_path(relative_path: &str) {
-    if let Ok(exe_path) = env::current_exe() {
-        if let Some(exe_dir) = exe_path.parent() {
-            let absolute_path = exe_dir.join(relative_path);
-            if let Some(absolute_path_str) = absolute_path.to_str() {
-                println!("Setting GGML_METAL_PATH_RESOURCES to {}", absolute_path_str);
-                env::set_var("GGML_METAL_PATH_RESOURCES", absolute_path_str);
-            }
-        } else {
-            eprintln!("GGML_METAL_PATH_RESOURCES cloud not be set: Failed to get the executable directory.");
-        }
-    } else {
-        eprintln!("GGML_METAL_PATH_RESOURCES cloud not be set: Failed to get the executable path.");
-    }
-}
-
 fn main() {
-    #[cfg(not(debug_assertions))]
-    set_whisper_metal_lib_path("../Resources/resources/whisper");
-    #[cfg(debug_assertions)]
-    set_whisper_metal_lib_path("../../resources/whisper");
-
     tauri::Builder::default()
         .register_uri_scheme_protocol("stream", move |_app, request| {
             let raw_path = request.uri().replace("stream://localhost", "");
@@ -347,12 +388,20 @@ fn main() {
                 .build(),
         )
         .manage(RecordState(Default::default()))
+        .manage(SynthesizeState(Default::default()))
         .invoke_handler(tauri::generate_handler![
+            list_synthesize_models_command,
+            synthesize_init_command,
+            synthesize_finalize_command,
+            synthesize_command,
             delete_note_command,
             download_whisper_model_command,
             download_vosk_model_command,
-            download_fugumt_model_command,
+            download_fugumt_enja_model_command,
+            download_fugumt_jaen_model_command,
             download_honyaku13b_model_command,
+            download_sbv2_command,
+            download_sbv2_model_command,
             list_devices_command,
             list_apps_command,
             list_app_windows_command,
diff --git a/src-tauri/src/module/action.rs b/src-tauri/src/module/action.rs
index 1af89bb..a3fcfc3 100644
--- a/src-tauri/src/module/action.rs
+++ b/src-tauri/src/module/action.rs
@@ -8,8 +8,10 @@ use serde_json::{json, Value};
 use tauri::{AppHandle, Manager};
 
 use super::sqlite::{Content, Sqlite};
+use tokio::runtime::Runtime;
 
 pub struct Action {
+    runtime: Runtime,
     app_handle: AppHandle,
     sqlite: Sqlite,
     note_id: u64,
@@ -19,12 +21,14 @@ pub struct Action {
 
 impl Action {
     pub fn new(app_handle: AppHandle, note_id: u64) -> Self {
+        let runtime = Runtime::new().expect("Failed to create Tokio runtime");
         let sqlite = Sqlite::new();
         let token = sqlite.select_whisper_token().unwrap();
         let model = sqlite
             .select_ai_model()
             .unwrap_or_else(|_| "gpt-4o-mini".to_string());
         Self {
+            runtime,
             app_handle,
             sqlite,
             note_id,
@@ -33,7 +37,6 @@ impl Action {
         }
     }
 
-    #[tokio::main]
     async fn request_gpt(
         model: String,
         question: String,
@@ -90,17 +93,25 @@ impl Action {
                             .push_str(&format!(":::{}\n{}\n:::\n", current_type, current_content));
                         current_content.clear();
                     }
-                    prompt.push_str(&format!(
-                        ":::assistant\n[query]\n{}\n[answer]\n{}\n:::\n",
-                        content.content, content.content_2
-                    ));
+                    if content.action_type == "suggest" {
+                        prompt.push_str(&format!(
+                                ":::assistant\n[query]\n次の発言者のための3つの発話サジェストとその理由を生成してください。\n[answer] {}\n{}\n:::\n",
+                                content.content, content.content_2
+                            ));
+                    } else {
+                        prompt.push_str(&format!(
+                            ":::assistant\n[query]\n{}\n[answer]\n{}\n:::\n",
+                            content.content, content.content_2
+                        ));
+                    }
                 }
                 "speech" | _ => {
                     let speech_type = if content.speech_type == "speech" {
                         "transcription"
                     } else if content.speech_type == "memo" {
                         "note"
-                    } else { // "screenshot"
+                    } else {
+                        // "screenshot"
                         "note"
                     };
                     if speech_type != current_type && !current_content.is_empty() {
@@ -160,6 +171,176 @@ impl Action {
         Ok(response_text)
     }
 
+    async fn request_gpt_suggest(
+        contents: Vec<Content>,
+        token: String,
+    ) -> Result<String, Box<dyn std::error::Error>> {
+        let url = "https://api.openai.com/v1/chat/completions";
+        let temperature = 0.7;
+
+        let client = Client::new();
+
+        let mut headers = HeaderMap::new();
+        headers.insert(
+            AUTHORIZATION,
+            HeaderValue::from_str(&format!("Bearer {}", token))?,
+        );
+        headers.insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
+
+        let mut messages: Vec<Value> = Vec::new();
+        let mut prompt = "あなたは高度な会話分析・発話提案AIアシスタントです。提供される情報を分析し、次の発言者に対して適切な発話サジェストを生成することがあなたの役割です。以下の手順に従って処理を行ってください：
+
+1. 情報の分析：
+   a) 文字起こし (:::transcription で囲まれた部分)：直近の会話の内容と流れを詳細に把握します。
+   b) メモ (:::note で囲まれた部分)：会話の背景や補足情報として扱います。
+   c) 過去のAIとのQ&A (:::assistant で囲まれた部分)：関連する追加情報として考慮します。ただし直近の発話サジェストは、今回の発話サジェストが同一性を持たないように考慮します。
+
+2. 会話の状況把握：
+   - 誰が最後に発言したか、どのような内容だったかを特定します。
+   - 発話サジェストを受ける人が直前で聞き手だったことを前提とします。
+
+3. 発話サジェストの生成：
+   会話の流れ、文脈、および背景情報を考慮し、以下の3種類の発言提案を生成します：
+   a) 中立的な発言：会話を自然に進行させる発言
+   b) ポジティブな発言：質問、共感、あるいは会話を前向きな方向に導く発言。
+   c) ネガティブな発言：懸念や問題点を指摘する発言
+
+4. 各発言提案の理由付け：
+   それぞれの発言提案について、なぜその発言が適切か、どのような効果が期待できるかを簡潔に説明します。理由付けの詳細さは、必要に応じて調整します。
+
+5. 発話サジェストの調整：
+   - 会話の雰囲気や目的に応じて、各提案の内容や調子を調整します。
+   - 文化的背景や社会的文脈を考慮し、適切な表現を選択します。
+
+以下に提供される情報を上記の手順に従って分析し、中立的、ポジティブ（質問・共感を含む）、ネガティブな3つの発話サジェストとその理由を生成してください。各サジェストは自然で、会話の流れに沿ったものにしてください：
+
+".to_string();
+        let mut current_type = String::new();
+        let mut current_content = String::new();
+
+        for content in contents.iter() {
+            match content.speech_type.as_str() {
+                "action" => {
+                    if !current_content.is_empty() {
+                        prompt
+                            .push_str(&format!(":::{}\n{}\n:::\n", current_type, current_content));
+                        current_content.clear();
+                    }
+                    if content.action_type == "suggest" {
+                        prompt.push_str(&format!(
+                                ":::assistant\n[query]\n次の発言者のための3つの発話サジェストとその理由を生成してください。\n[answer] {}\n{}\n:::\n",
+                                content.content, content.content_2
+                            ));
+                    } else {
+                        prompt.push_str(&format!(
+                            ":::assistant\n[query]\n{}\n[answer]\n{}\n:::\n",
+                            content.content, content.content_2
+                        ));
+                    }
+                }
+                "speech" | _ => {
+                    let speech_type = if content.speech_type == "speech" {
+                        "transcription"
+                    } else if content.speech_type == "memo" {
+                        "note"
+                    } else {
+                        // "screenshot"
+                        "note"
+                    };
+                    if speech_type != current_type && !current_content.is_empty() {
+                        prompt
+                            .push_str(&format!(":::{}\n{}\n:::\n", current_type, current_content));
+                        current_content.clear();
+                    }
+                    current_type = speech_type.to_string();
+                    current_content.push_str(&content.content);
+                    current_content.push('\n');
+                }
+            }
+        }
+
+        if !current_content.is_empty() {
+            prompt.push_str(&format!(":::{}\n{}\n:::\n", current_type, current_content));
+        }
+
+        messages.push(json!({
+            "role": "system",
+            "content": prompt
+        }));
+        messages.push(json!({
+            "role": "user",
+            "content": "上記の情報を基に、次の発言者のための3つの発話サジェストとその理由を生成してください。"
+        }));
+
+        // for debugging
+        // println!("messages: {:?}", messages);
+
+        let response_format = json!({
+            "type": "json_schema",
+            "json_schema": {
+                "name": "generate_speech_suggestions",
+                "description": "提供されたコンテキストに基づいて、ニュートラル、ポジティブ、ネガティブな発言の提案とその理由を生成します。",
+                "strict": true,
+                "schema": {
+                    "type": "object",
+                    "properties": {
+                        "neutral": { "$ref": "#/$defs/suggestion" },
+                        "positive": { "$ref": "#/$defs/suggestion" },
+                        "negative": { "$ref": "#/$defs/suggestion" }
+                    },
+                    "required": ["neutral", "positive", "negative"],
+                    "additionalProperties": false,
+                    "$defs": {
+                        "suggestion": {
+                            "type": "object",
+                            "description": "発言の提案とその理由",
+                            "properties": {
+                                "content": {
+                                    "type": "string",
+                                    "description": "提案される発言内容"
+                                },
+                                "reason": {
+                                    "type": "string",
+                                    "description": "その発言を提案する理由"
+                                }
+                            },
+                            "required": ["content", "reason"],
+                            "additionalProperties": false
+                        }
+                    }
+                }
+            }
+        });
+
+        let post_body = json!({
+          "model": "gpt-4o-2024-08-06",
+          "temperature": temperature,
+          "messages": messages,
+          "response_format": response_format
+        });
+
+        let response = client
+            .post(url)
+            .headers(headers)
+            .json(&post_body)
+            .send()
+            .await?;
+
+        let status = response.status();
+        let json_response: Value = response.json().await?;
+
+        let response_text = if status == 200 {
+            json_response["choices"][0]["message"]["content"]
+                .as_str()
+                .unwrap_or("choices[0].message.content field not found")
+                .to_string()
+        } else {
+            json_response.to_string()
+        };
+
+        Ok(response_text)
+    }
+
     pub fn execute(&mut self) {
         if self.token == "" {
             println!("whisper token is empty, so skipping...");
@@ -168,62 +349,112 @@ impl Action {
         let mut is_executing = IS_EXECUTING.lock().unwrap();
         *is_executing = true;
 
-        while let Ok(action) = self.sqlite.select_first_unexecuted_action(self.note_id) {
-            match self
-                .sqlite
-                .select_has_no_permission_of_execute_action(self.note_id, action.id)
-            {
-                Ok(permissions) => {
-                    if permissions.is_empty() || permissions.iter().any(|p| p.model == "whisper") {
-                        match self.sqlite.select_contents_by(self.note_id, action.id) {
-                            Ok(contents) => {
-                                match Self::request_gpt(
-                                    self.model.clone(),
-                                    action.content,
-                                    contents,
-                                    self.token.clone(),
-                                ) {
-                                    Ok(answer) => {
-                                        match self
-                                            .sqlite
-                                            .update_action_content_2(action.id, answer.clone())
+        self.runtime.block_on(async {
+            while let Ok(action) = self.sqlite.select_first_unexecuted_action(self.note_id) {
+                match self
+                    .sqlite
+                    .select_has_no_permission_of_execute_action(self.note_id, action.id)
+                {
+                    Ok(permissions) => {
+                        if permissions.is_empty()
+                            || permissions.iter().any(|p| p.model == "whisper")
+                        {
+                            match self.sqlite.select_contents_by(self.note_id, action.id) {
+                                Ok(contents) => match action.action_type.as_str() {
+                                    "chat" => {
+                                        match Self::request_gpt(
+                                            self.model.clone(),
+                                            action.content,
+                                            contents,
+                                            self.token.clone(),
+                                        )
+                                        .await
                                         {
-                                            Ok(result) => {
-                                                let _ = self
-                                                    .app_handle
-                                                    .emit_all("actionExecuted", result);
+                                            Ok(answer) => {
+                                                match self.sqlite.update_action_content_2(
+                                                    action.id,
+                                                    answer.clone(),
+                                                ) {
+                                                    Ok(result) => {
+                                                        let _ = self
+                                                            .app_handle
+                                                            .emit_all("actionExecuted", result);
+                                                    }
+                                                    Err(e) => {
+                                                        println!(
+                                                            "Error updating action content_2: {:?}",
+                                                            e
+                                                        );
+                                                        break;
+                                                    }
+                                                }
                                             }
-                                            Err(e) => {
+                                            Err(_) => {
                                                 println!(
-                                                    "Error updating action content_2: {:?}",
-                                                    e
+                                                    "gpt api is temporarily failed, so skipping..."
                                                 );
                                                 break;
                                             }
                                         }
                                     }
-                                    Err(_) => {
-                                        println!("gpt api is temporarily failed, so skipping...");
+                                    "suggest" => {
+                                        match Self::request_gpt_suggest(
+                                            contents,
+                                            self.token.clone(),
+                                        )
+                                        .await
+                                        {
+                                            Ok(answer) => {
+                                                match self.sqlite.update_action_content_2(
+                                                    action.id,
+                                                    answer.clone(),
+                                                ) {
+                                                    Ok(result) => {
+                                                        let _ = self
+                                                            .app_handle
+                                                            .emit_all("actionExecuted", result);
+                                                    }
+                                                    Err(e) => {
+                                                        println!(
+                                                            "Error updating action content_2: {:?}",
+                                                            e
+                                                        );
+                                                        break;
+                                                    }
+                                                }
+                                            }
+                                            Err(_) => {
+                                                println!(
+                                                    "gpt api is temporarily failed, so skipping..."
+                                                );
+                                                break;
+                                            }
+                                        }
+                                    }
+                                    &_ => {
+                                        println!("Unsupported action type, so skipping...");
                                         break;
                                     }
+                                },
+                                Err(e) => {
+                                    println!("Error selecting contents: {:?}", e);
+                                    break;
                                 }
                             }
-                            Err(e) => {
-                                println!("Error selecting contents: {:?}", e);
-                                break;
-                            }
+                        } else {
+                            println!(
+                                "has_no_permission_of_execute_action is false, so skipping..."
+                            );
+                            break;
                         }
-                    } else {
-                        println!("has_no_permission_of_execute_action is false, so skipping...");
+                    }
+                    Err(e) => {
+                        println!("Error checking permissions: {:?}", e);
                         break;
                     }
                 }
-                Err(e) => {
-                    println!("Error checking permissions: {:?}", e);
-                    break;
-                }
             }
-        }
+        });
 
         *is_executing = false;
     }
diff --git a/src-tauri/src/module/device.rs b/src-tauri/src/module/device.rs
index 3f79f3a..2ea95c7 100644
--- a/src-tauri/src/module/device.rs
+++ b/src-tauri/src/module/device.rs
@@ -12,7 +12,7 @@ pub fn list_devices() -> Vec<Device> {
         .input_devices()
         .unwrap()
         .filter_map(|device| {
-            if device.name().is_ok() && device.name().unwrap().contains("ZoomAudioDevice") {
+            if device.name().is_ok() && (device.name().unwrap().contains("ZoomAudioDevice") || device.name().unwrap().contains("Microsoft Teams Audio")) {
                 None
             } else {
                 Some(Device {
diff --git a/src-tauri/src/module/downloader/mod.rs b/src-tauri/src/module/downloader/mod.rs
index 618e3ca..3a42ae9 100644
--- a/src-tauri/src/module/downloader/mod.rs
+++ b/src-tauri/src/module/downloader/mod.rs
@@ -1,4 +1,5 @@
-pub mod whisper;
+pub mod model_dir;
+pub mod sbv2;
+pub mod sbv2_voice;
 pub mod vosk;
-pub mod fugumt;
-pub mod honyaku13b;
\ No newline at end of file
+pub mod whisper;
diff --git a/src-tauri/src/module/downloader/honyaku13b.rs b/src-tauri/src/module/downloader/model_dir.rs
similarity index 85%
rename from src-tauri/src/module/downloader/honyaku13b.rs
rename to src-tauri/src/module/downloader/model_dir.rs
index 5cd5b52..415b73e 100644
--- a/src-tauri/src/module/downloader/honyaku13b.rs
+++ b/src-tauri/src/module/downloader/model_dir.rs
@@ -14,33 +14,32 @@ pub struct Progress {
     pub is_progress: bool,
 }
 
-pub struct Honyaku13BModelDownloader {
+pub struct ModelDirDownloader {
     app_handle: AppHandle,
 }
-impl Honyaku13BModelDownloader {
+impl ModelDirDownloader {
     pub fn new(app_handle: AppHandle) -> Self {
         Self { app_handle }
     }
 
     #[tokio::main]
-    pub async fn download(&self) {
-        let model_type = "honyaku13b-q4-0";
+    pub async fn download(&self, model_type: &str, progress_identifier: &str) {
         let path: &str = &self
             .app_handle
             .path_resolver()
-            .resolve_resource("resources/honyaku13b-q4-0.zip")
+            .resolve_resource(format!("resources/{}.zip", model_type))
             .unwrap()
             .to_string_lossy()
             .to_string();
-        let url = "https://object-storage.tyo1.conoha.io/v1/nc_b22de95e3cf1434da07499038766e2b7/lycoris/honyaku13b-q4-0.zip";
-        let res = reqwest::get(url).await.unwrap();
+        let url = format!("https://lycoris-storage.wktk.dev/{}.zip", model_type);
+        let res = reqwest::get(url.clone()).await.unwrap();
         let total_size = res
             .content_length()
             .ok_or(format!("Failed to get content length from '{}'", url))
             .unwrap();
 
         let _ = &self.app_handle.emit_all(
-            "downloadHonyaku13BProgress",
+            progress_identifier,
             Progress {
                 model_type: model_type.to_string(),
                 rate: 0.0,
@@ -76,7 +75,7 @@ impl Honyaku13BModelDownloader {
             let current_rate = ((new as f64 * 100.0) / total_size as f64).round();
             if rate != current_rate {
                 let _ = &self.app_handle.emit_all(
-                    "downloadHonyaku13BProgress",
+                    progress_identifier,
                     Progress {
                         model_type: model_type.to_string(),
                         rate: current_rate,
@@ -108,7 +107,7 @@ impl Honyaku13BModelDownloader {
         let _ = Sqlite::new().update_model_is_downloaded(model_type.to_string(), 1);
 
         let _ = &self.app_handle.emit_all(
-            "downloadHonyaku13BProgress",
+            progress_identifier,
             Progress {
                 model_type: model_type.to_string(),
                 rate: 0.0,
diff --git a/src-tauri/src/module/downloader/fugumt.rs b/src-tauri/src/module/downloader/sbv2.rs
similarity index 86%
rename from src-tauri/src/module/downloader/fugumt.rs
rename to src-tauri/src/module/downloader/sbv2.rs
index 5df67aa..d8c299e 100644
--- a/src-tauri/src/module/downloader/fugumt.rs
+++ b/src-tauri/src/module/downloader/sbv2.rs
@@ -14,25 +14,25 @@ pub struct Progress {
     pub is_progress: bool,
 }
 
-pub struct FugumtModelDownloader {
+pub struct StyleBertVits2ModelDownloader {
     app_handle: AppHandle,
 }
-impl FugumtModelDownloader {
+impl StyleBertVits2ModelDownloader {
     pub fn new(app_handle: AppHandle) -> Self {
         Self { app_handle }
     }
 
     #[tokio::main]
     pub async fn download(&self) {
-        let model_type = "fugumt-en-ja";
+        let model_type = "style-bert-vits2";
         let path: &str = &self
             .app_handle
             .path_resolver()
-            .resolve_resource("resources/fugumt-en-ja.zip")
+            .resolve_resource("resources/style-bert-vits/style-bert-vits.zip")
             .unwrap()
             .to_string_lossy()
             .to_string();
-        let url = "https://object-storage.tyo1.conoha.io/v1/nc_b22de95e3cf1434da07499038766e2b7/lycoris/fugumt-en-ja.zip";
+        let url = "https://lycoris-storage.wktk.dev/style-bert-vits.zip";
         let res = reqwest::get(url).await.unwrap();
         let total_size = res
             .content_length()
@@ -40,7 +40,7 @@ impl FugumtModelDownloader {
             .unwrap();
 
         let _ = &self.app_handle.emit_all(
-            "downloadFugumtProgress",
+            "downloadStyleBertVits2Progress",
             Progress {
                 model_type: model_type.to_string(),
                 rate: 0.0,
@@ -76,7 +76,7 @@ impl FugumtModelDownloader {
             let current_rate = ((new as f64 * 100.0) / total_size as f64).round();
             if rate != current_rate {
                 let _ = &self.app_handle.emit_all(
-                    "downloadFugumtProgress",
+                    "downloadStyleBertVits2Progress",
                     Progress {
                         model_type: model_type.to_string(),
                         rate: current_rate,
@@ -90,7 +90,7 @@ impl FugumtModelDownloader {
         let dir: &str = &self
             .app_handle
             .path_resolver()
-            .resolve_resource("resources")
+            .resolve_resource("resources/style-bert-vits")
             .unwrap()
             .to_string_lossy()
             .to_string();
@@ -108,7 +108,7 @@ impl FugumtModelDownloader {
         let _ = Sqlite::new().update_model_is_downloaded(model_type.to_string(), 1);
 
         let _ = &self.app_handle.emit_all(
-            "downloadFugumtProgress",
+            "downloadStyleBertVits2Progress",
             Progress {
                 model_type: model_type.to_string(),
                 rate: 0.0,
diff --git a/src-tauri/src/module/downloader/sbv2_voice.rs b/src-tauri/src/module/downloader/sbv2_voice.rs
new file mode 100644
index 0000000..e711431
--- /dev/null
+++ b/src-tauri/src/module/downloader/sbv2_voice.rs
@@ -0,0 +1,123 @@
+use tauri::{AppHandle, Manager};
+
+use futures_util::StreamExt;
+use std::cmp::min;
+use std::fs::File;
+use std::io::Write;
+
+use crate::module::model_type_sbv2::ModelTypeStyleBertVits2;
+use crate::module::sqlite::Sqlite;
+
+/// Payload of the `downloadStyleBertVits2VoiceProgress` event.
+#[derive(Debug, Clone, serde::Serialize)]
+pub struct Progress {
+    /// Identifier of the voice model being downloaded.
+    pub model_type: String,
+    /// Completed share of the download as a rounded percentage.
+    pub rate: f64,
+    /// `true` while the transfer is running, `false` in the final event.
+    pub is_progress: bool,
+}
+
+/// Downloads one Style-Bert-VITS2 voice model (`.sbv2` file) into the
+/// application's resources.
+pub struct StyleBertVits2VoiceModelDownloader {
+    app_handle: AppHandle,
+}
+impl StyleBertVits2VoiceModelDownloader {
+    /// Creates a downloader that resolves paths and emits events via `app_handle`.
+    pub fn new(app_handle: AppHandle) -> Self {
+        Self { app_handle }
+    }
+
+    /// Streams `<model>.sbv2` from the model storage server to
+    /// `resources/style-bert-vits/models/<model>.sbv2`, replacing any existing
+    /// file, and then marks the model as downloaded in the database.
+    ///
+    /// Progress is reported through `downloadStyleBertVits2VoiceProgress`
+    /// events: one at the start, one whenever the rounded percentage changes,
+    /// and a final one with `is_progress: false`.
+    ///
+    /// Panics if the resource path cannot be resolved, the request fails, the
+    /// response has no content length, or the file cannot be created or written.
+    #[tokio::main]
+    pub async fn download(&self, model_type: ModelTypeStyleBertVits2) {
+        let model_path: &str = &format!("resources/style-bert-vits/models/{}.sbv2", model_type.as_str());
+        let path: &str = &self
+            .app_handle
+            .path_resolver()
+            .resolve_resource(model_path)
+            .unwrap()
+            .to_string_lossy()
+            .to_string();
+        let url: &str = &format!(
+            "https://lycoris-storage.wktk.dev/{}.sbv2",
+            model_type.as_str()
+        );
+        let res = reqwest::get(url).await.unwrap();
+        let total_size = res
+            .content_length()
+            .ok_or(format!("Failed to get content length from '{}'", url))
+            .unwrap();
+
+        let _ = &self.app_handle.emit_all(
+            "downloadStyleBertVits2VoiceProgress",
+            Progress {
+                model_type: model_type.as_str().to_string(),
+                rate: 0.0,
+                is_progress: true,
+            },
+        );
+
+        let mut downloaded: u64 = 0;
+        let mut stream = res.bytes_stream();
+
+        println!("Seeking in file.");
+        if std::path::Path::new(&path).exists() {
+            println!("File exists. Removig...");
+            let _ = std::fs::remove_file(&path);
+        }
+        let mut file = File::create(&path)
+            .or(Err(format!("Failed to create file '{}'", &path)))
+            .unwrap();
+
+        println!("Commencing transfer");
+        let mut rate = 0.0;
+        while let Some(item) = stream.next().await {
+            let chunk = item
+                .or(Err(format!("Error while downloading file")))
+                .unwrap();
+            // `write` may stop after a partial write; `write_all` keeps going
+            // until the whole chunk has been written, so no bytes are dropped.
+            file.write_all(&chunk)
+                .or(Err(format!("Error while writing to file")))
+                .unwrap();
+            let new = min(downloaded + (chunk.len() as u64), total_size);
+            downloaded = new;
+
+            let current_rate = ((new as f64 * 100.0) / total_size as f64).round();
+            if rate != current_rate {
+                let _ = &self.app_handle.emit_all(
+                    "downloadStyleBertVits2VoiceProgress",
+                    Progress {
+                        model_type: model_type.as_str().to_string(),
+                        rate: current_rate,
+                        is_progress: true,
+                    },
+                );
+                rate = current_rate
+            }
+        }
+
+        let _ = Sqlite::new().update_model_is_downloaded(model_type.as_str().to_string(), 1);
+
+        let _ = &self.app_handle.emit_all(
+            "downloadStyleBertVits2VoiceProgress",
+            Progress {
+                model_type: model_type.as_str().to_string(),
+                rate,
+                is_progress: false,
+            },
+        );
+    }
+}
diff --git a/src-tauri/src/module/downloader/vosk.rs b/src-tauri/src/module/downloader/vosk.rs
index 8fbcf07..de0678d 100644
--- a/src-tauri/src/module/downloader/vosk.rs
+++ b/src-tauri/src/module/downloader/vosk.rs
@@ -34,7 +34,7 @@ impl VoskModelDownloader {
             .to_string_lossy()
             .to_string();
         let url: &str = &format!(
-            "https://object-storage.tyo1.conoha.io/v1/nc_b22de95e3cf1434da07499038766e2b7/lycoris/vosk-model-{}.zip",
+            "https://lycoris-storage.wktk.dev/vosk-model-{}.zip",
             model_type.as_str()
         );
         let res = reqwest::get(url).await.unwrap();
diff --git a/src-tauri/src/module/downloader/whisper.rs b/src-tauri/src/module/downloader/whisper.rs
index 943846d..e283ff0 100644
--- a/src-tauri/src/module/downloader/whisper.rs
+++ b/src-tauri/src/module/downloader/whisper.rs
@@ -34,7 +34,7 @@ impl WhisperModelDownloader {
             .to_string_lossy()
             .to_string();
         let url: &str = &format!(
-            "https://object-storage.tyo1.conoha.io/v1/nc_b22de95e3cf1434da07499038766e2b7/lycoris/ggml-{}.zip",
+            "https://lycoris-storage.wktk.dev/ggml-{}.zip",
             model_type.as_str()
         );
         let res = reqwest::get(url).await.unwrap();
diff --git a/src-tauri/src/module/mod.rs b/src-tauri/src/module/mod.rs
index 7f3de43..c4434b9 100644
--- a/src-tauri/src/module/mod.rs
+++ b/src-tauri/src/module/mod.rs
@@ -1,20 +1,23 @@
+pub mod action;
 pub mod chat_online;
 pub mod deleter;
 pub mod device;
 pub mod downloader;
+pub mod model_type_sbv2;
 pub mod model_type_vosk;
 pub mod model_type_whisper;
 pub mod permissions;
 mod recognizer;
 pub mod record;
 pub mod record_desktop;
+pub mod screenshot;
 mod sqlite;
+pub mod synthesizer;
 mod transcriber;
 pub mod transcription;
 pub mod transcription_amivoice;
 pub mod transcription_online;
+pub mod translation_en;
 pub mod translation_ja;
 pub mod translation_ja_high;
 mod writer;
-pub mod screenshot;
-pub mod action;
diff --git a/src-tauri/src/module/model_type_sbv2.rs b/src-tauri/src/module/model_type_sbv2.rs
new file mode 100644
index 0000000..ef6ed1e
--- /dev/null
+++ b/src-tauri/src/module/model_type_sbv2.rs
@@ -0,0 +1,47 @@
+use std::str::FromStr;
+
+/// Identifiers of the Style-Bert-VITS2 voice models known to the application.
+pub enum ModelTypeStyleBertVits2 {
+    TsukuyomiChan,
+    KoharuneAmi,
+    Amitaro,
+    JvnvF1Jp,
+    JvnvF2Jp,
+    JvnvM1Jp,
+    JvnvM2Jp,
+}
+
+impl ModelTypeStyleBertVits2 {
+    /// Returns the model's string identifier; `from_str` accepts the same strings.
+    pub fn as_str(&self) -> &'static str {
+        match self {
+            Self::TsukuyomiChan => "tsukuyomi-chan",
+            Self::KoharuneAmi => "koharune-ami",
+            Self::Amitaro => "amitaro",
+            Self::JvnvF1Jp => "jvnv-F1-jp",
+            Self::JvnvF2Jp => "jvnv-F2-jp",
+            Self::JvnvM1Jp => "jvnv-M1-jp",
+            Self::JvnvM2Jp => "jvnv-M2-jp",
+        }
+    }
+}
+
+impl FromStr for ModelTypeStyleBertVits2 {
+    /// An unrecognized identifier carries no further detail.
+    type Err = ();
+
+    /// Parses an identifier as produced by `as_str`; matching is case-sensitive.
+    fn from_str(input: &str) -> Result<Self, Self::Err> {
+        let model = match input {
+            "tsukuyomi-chan" => Self::TsukuyomiChan,
+            "koharune-ami" => Self::KoharuneAmi,
+            "amitaro" => Self::Amitaro,
+            "jvnv-F1-jp" => Self::JvnvF1Jp,
+            "jvnv-F2-jp" => Self::JvnvF2Jp,
+            "jvnv-M1-jp" => Self::JvnvM1Jp,
+            "jvnv-M2-jp" => Self::JvnvM2Jp,
+            _ => return Err(()),
+        };
+        Ok(model)
+    }
+}
diff --git a/src-tauri/src/module/model_type_whisper.rs b/src-tauri/src/module/model_type_whisper.rs
index 7c1d3ad..c7e73c7 100644
--- a/src-tauri/src/module/model_type_whisper.rs
+++ b/src-tauri/src/module/model_type_whisper.rs
@@ -4,8 +4,10 @@ pub enum ModelTypeWhisper {
     Base,
     BaseEn,
     Large,
+    LargeTurbo,
     LargeDistilEn,
     LargeDistilJa,
+    LargeDistilBilingual,
     Medium,
     MediumEn,
     Small,
@@ -20,8 +22,10 @@ impl ModelTypeWhisper {
             ModelTypeWhisper::Base => "base",
             ModelTypeWhisper::BaseEn => "base.en",
             ModelTypeWhisper::Large => "large",
+            ModelTypeWhisper::LargeTurbo => "large-turbo",
             ModelTypeWhisper::LargeDistilEn => "large-distil.en",
             ModelTypeWhisper::LargeDistilJa => "large-distil.ja",
+            ModelTypeWhisper::LargeDistilBilingual => "large-distil.bilingual",
             ModelTypeWhisper::Medium => "medium",
             ModelTypeWhisper::MediumEn => "medium.en",
             ModelTypeWhisper::Small => "small",
@@ -40,8 +44,10 @@ impl FromStr for ModelTypeWhisper {
             "base" => Ok(ModelTypeWhisper::Base),
             "base.en" => Ok(ModelTypeWhisper::BaseEn),
             "large" => Ok(ModelTypeWhisper::Large),
+            "large-turbo" => Ok(ModelTypeWhisper::LargeTurbo),
             "large-distil.en" => Ok(ModelTypeWhisper::LargeDistilEn),
             "large-distil.ja" => Ok(ModelTypeWhisper::LargeDistilJa),
+            "large-distil.bilingual" => Ok(ModelTypeWhisper::LargeDistilBilingual),
             "medium" => Ok(ModelTypeWhisper::Medium),
             "medium.en" => Ok(ModelTypeWhisper::MediumEn),
             "small" => Ok(ModelTypeWhisper::Small),
diff --git a/src-tauri/src/module/record.rs b/src-tauri/src/module/record.rs
index cd88920..037ed1f 100644
--- a/src-tauri/src/module/record.rs
+++ b/src-tauri/src/module/record.rs
@@ -24,7 +24,7 @@ use tauri::{api::path::data_dir, AppHandle, Manager};
 
 use super::{
     chat_online, recognizer::MyRecognizer, sqlite::Sqlite, transcription, transcription_amivoice,
-    transcription_online, translation_ja, translation_ja_high, writer::Writer,
+    transcription_online, translation_en, translation_ja, translation_ja_high, writer::Writer,
 };
 
 pub struct Record {
@@ -228,7 +228,16 @@ impl Record {
                                 if let Some(singleton) = lock.as_mut() {
                                     singleton.start(stop_convert_rx_clone, false);
                                 }
-                            } else if transcription_accuracy_clone.starts_with("honyaku13b-q4-0") {
+                            } else if transcription_accuracy_clone.starts_with("fugumt-ja-en") {
+                                translation_en::initialize_translation_en(
+                                    app_handle_clone,
+                                    note_id,
+                                );
+                                let mut lock = translation_en::SINGLETON_INSTANCE.lock().unwrap();
+                                if let Some(singleton) = lock.as_mut() {
+                                    singleton.start(stop_convert_rx_clone, false);
+                                }
+                            } else if transcription_accuracy_clone.starts_with("honyaku-13b") {
                                 translation_ja_high::initialize_translation_ja_high(
                                     app_handle_clone,
                                     speaker_language_clone,
@@ -275,6 +284,7 @@ impl Record {
         if !is_no_transcription {
             stop_convert_tx.send(()).unwrap();
             transcription::drop_transcription();
+            translation_en::drop_translation_en();
             translation_ja::drop_translation_ja();
             translation_ja_high::drop_translation_ja_high();
             transcription_online::drop_transcription_online();
diff --git a/src-tauri/src/module/record_desktop.rs b/src-tauri/src/module/record_desktop.rs
index 005926a..c94cd25 100644
--- a/src-tauri/src/module/record_desktop.rs
+++ b/src-tauri/src/module/record_desktop.rs
@@ -39,7 +39,7 @@ use vosk::Recognizer;
 
 use super::{
     chat_online, recognizer::MyRecognizer, sqlite::Sqlite, transcription, transcription_amivoice,
-    transcription_online, translation_ja, translation_ja_high, writer::Writer,
+    transcription_online, translation_en, translation_ja, translation_ja_high, writer::Writer,
 };
 
 pub struct RecordDesktop {
@@ -260,7 +260,16 @@ impl RecordDesktop {
                                 if let Some(singleton) = lock.as_mut() {
                                     singleton.start(stop_convert_rx_clone, false);
                                 }
-                            } else if transcription_accuracy_clone.starts_with("honyaku13b-q4-0") {
+                            } else if transcription_accuracy_clone.starts_with("fugumt-ja-en") {
+                                translation_en::initialize_translation_en(
+                                    app_handle_clone,
+                                    note_id,
+                                );
+                                let mut lock = translation_en::SINGLETON_INSTANCE.lock().unwrap();
+                                if let Some(singleton) = lock.as_mut() {
+                                    singleton.start(stop_convert_rx_clone, false);
+                                }
+                            } else if transcription_accuracy_clone.starts_with("honyaku-13b") {
                                 translation_ja_high::initialize_translation_ja_high(
                                     app_handle_clone,
                                     speaker_language_clone,
@@ -311,6 +320,7 @@ impl RecordDesktop {
         if !is_no_transcription {
             stop_convert_tx.send(()).unwrap();
             transcription::drop_transcription();
+            translation_en::drop_translation_en();
             translation_ja::drop_translation_ja();
             translation_ja_high::drop_translation_ja_high();
             transcription_online::drop_transcription_online();
diff --git a/src-tauri/src/module/sqlite.rs b/src-tauri/src/module/sqlite.rs
index 3aac31c..a57701e 100644
--- a/src-tauri/src/module/sqlite.rs
+++ b/src-tauri/src/module/sqlite.rs
@@ -29,12 +29,14 @@ pub struct Updated {
 #[derive(Debug, Clone, serde::Serialize)]
 pub struct UnexecutedAction {
     pub id: u16,
+    pub action_type: String,
     pub content: String,
 }
 
 #[derive(Debug, Clone, serde::Serialize)]
 pub struct Content {
     pub speech_type: String,
+    pub action_type: String,
     pub content: String,
     pub content_2: String,
 }
@@ -195,13 +197,14 @@ impl Sqlite {
         note_id: u64,
         id: u16,
     ) -> Result<Vec<Content>, rusqlite::Error> {
-        let mut stmt = self.conn.prepare("SELECT speech_type,content,content_2 FROM speeches WHERE note_id = ?1 AND id < ?2 ORDER BY created_at_unixtime ASC").unwrap();
+        let mut stmt = self.conn.prepare("SELECT speech_type,action_type,content,content_2 FROM speeches WHERE note_id = ?1 AND id < ?2 ORDER BY created_at_unixtime ASC").unwrap();
         let results = stmt
             .query_map(params![note_id, id], |row| {
                 Ok(Content {
                     speech_type: row.get_unwrap(0),
-                    content: row.get_unwrap(1),
-                    content_2: row.get(2).unwrap_or_default(),
+                    action_type: row.get(1).unwrap_or_default(),
+                    content: row.get_unwrap(2),
+                    content_2: row.get(3).unwrap_or_default(),
                 })
             })
             .unwrap()
@@ -213,9 +216,9 @@ impl Sqlite {
         &self,
         note_id: u64,
     ) -> Result<UnexecutedAction, rusqlite::Error> {
-        return self.conn.query_row("SELECT id, content FROM speeches WHERE speech_type = \"action\" AND content_2 IS NULL AND note_id = ?1 ORDER BY created_at_unixtime ASC LIMIT 1",
+        return self.conn.query_row("SELECT id, action_type, content FROM speeches WHERE speech_type = \"action\" AND content_2 IS NULL AND note_id = ?1 ORDER BY created_at_unixtime ASC LIMIT 1",
             params![note_id],
-            |row| Ok(UnexecutedAction{id: row.get_unwrap(0), content: row.get_unwrap(1)}),
+            |row| Ok(UnexecutedAction{id: row.get_unwrap(0), action_type: row.get_unwrap(1), content: row.get_unwrap(2)}),
         );
     }
 
diff --git a/src-tauri/src/module/synthesizer.rs b/src-tauri/src/module/synthesizer.rs
new file mode 100644
index 0000000..51fcfbb
--- /dev/null
+++ b/src-tauri/src/module/synthesizer.rs
@@ -0,0 +1,106 @@
+use std::fs;
+
+use sbv2_core::tts::TTSModelHolder;
+use tauri::AppHandle;
+
+/// Resolves `relative` through the app's path resolver and returns it as a
+/// (lossily converted) string. Panics if the path cannot be resolved.
+fn resolve_resource_path(app_handle: &AppHandle, relative: &str) -> String {
+    app_handle
+        .path_resolver()
+        .resolve_resource(relative)
+        .unwrap()
+        .to_string_lossy()
+        .to_string()
+}
+
+/// Lists the voice models found in `resources/style-bert-vits/models`.
+///
+/// Every `*.sbv2` file contributes its file name without the extension.
+/// Panics if the directory or one of its entries cannot be read.
+pub fn list_models(app_handle: AppHandle) -> Vec<String> {
+    let models_path = resolve_resource_path(&app_handle, "resources/style-bert-vits/models");
+
+    fs::read_dir(models_path)
+        .unwrap()
+        .filter_map(|entry| {
+            let name = entry.unwrap().file_name().to_string_lossy().to_string();
+            name.strip_suffix(".sbv2").map(str::to_string)
+        })
+        .collect()
+}
+
+/// Text-to-speech wrapper around a `TTSModelHolder` with one voice model loaded.
+pub struct Synthesizer {
+    /// Name under which the voice model is registered in `tts_model`.
+    ident: String,
+    tts_model: TTSModelHolder,
+}
+
+impl Synthesizer {
+    /// Builds the model holder from `deberta.onnx` and `tokenizer.json`, then
+    /// loads the voice model `resources/style-bert-vits/models/<model>.sbv2`.
+    ///
+    /// Panics if a path cannot be resolved, a file cannot be read, or the
+    /// model holder cannot be created. A failure to load the voice model is
+    /// logged rather than discarded; `synthesize` is then expected to fail.
+    pub fn new(app_handle: AppHandle, model: String) -> Self {
+        let bert_model_path =
+            resolve_resource_path(&app_handle, "resources/style-bert-vits/deberta.onnx");
+        let tokenizer_path =
+            resolve_resource_path(&app_handle, "resources/style-bert-vits/tokenizer.json");
+        let models_path = resolve_resource_path(&app_handle, "resources/style-bert-vits/models");
+
+        let mut tts_model = TTSModelHolder::new(
+            &fs::read(bert_model_path).unwrap(),
+            &fs::read(tokenizer_path).unwrap(),
+        )
+        .unwrap();
+
+        let sbv2_bytes = fs::read(format!("{models_path}/{model}.sbv2")).unwrap();
+        if let Err(e) = tts_model.load_sbv2file(model.clone(), sbv2_bytes) {
+            println!("Failed to load voice model '{}': {:?}", model, e);
+        }
+
+        Self {
+            ident: model,
+            tts_model,
+        }
+    }
+
+    /// Synthesizes `text` with the loaded voice model and returns the bytes
+    /// produced by the underlying model holder.
+    ///
+    /// `sdp_ratio` and `length_scale` are forwarded unchanged. A failure while
+    /// parsing the text, fetching the style vector, or synthesizing is returned
+    /// as `Err` holding the error's debug representation instead of panicking.
+    pub fn synthesize(
+        &mut self,
+        text: String,
+        sdp_ratio: f32,
+        length_scale: f32,
+    ) -> Result<Vec<u8>, String> {
+        let (bert_ori, phones, tones, lang_ids) = self
+            .tts_model
+            .parse_text(&text)
+            .map_err(|e| format!("{:?}", e))?;
+
+        let style_vector = self
+            .tts_model
+            .get_style_vector(self.ident.clone(), 0, 1.0)
+            .map_err(|e| format!("{:?}", e))?;
+
+        self.tts_model
+            .synthesize(
+                self.ident.clone(),
+                bert_ori.to_owned(),
+                phones,
+                tones,
+                lang_ids,
+                style_vector,
+                sdp_ratio,
+                length_scale,
+            )
+            .map_err(|e| format!("{:?}", e))
+    }
+}
diff --git a/src-tauri/src/module/transcriber.rs b/src-tauri/src/module/transcriber.rs
index c0c11e1..1b245a9 100644
--- a/src-tauri/src/module/transcriber.rs
+++ b/src-tauri/src/module/transcriber.rs
@@ -16,6 +16,10 @@ impl Transcriber {
             model_type = "large-distil.en"
         } else if transcription_accuracy.starts_with("large-distil.ja") {
             model_type = "large-distil.ja"
+        } else if transcription_accuracy.starts_with("large-distil.bilingual") {
+            model_type = "large-distil.bilingual"
+        } else if transcription_accuracy.starts_with("large-turbo") {
+            model_type = "large-turbo"
         } else if transcription_accuracy.starts_with("large") {
             model_type = "large"
         }
@@ -26,8 +30,14 @@ impl Transcriber {
             .to_string_lossy()
             .to_string();
 
-        return WhisperContext::new_with_params(&model_path, WhisperContextParameters::default())
-            .expect("failed to load whisper model");
+        return WhisperContext::new_with_params(
+            &model_path,
+            WhisperContextParameters {
+                flash_attn: true,
+                ..WhisperContextParameters::default()
+            },
+        )
+        .expect("failed to load whisper model");
     }
 
     pub fn build_params(
@@ -85,12 +95,64 @@ impl Transcriber {
         );
         println!("working on {} threads.", hardware_concurrency);
         params.set_n_threads(hardware_concurrency);
-        if transcription_accuracy.ends_with("en") {
+
+        if transcription_accuracy.starts_with("large-distil.bilingual") {
             params.set_translate(true);
+            if language == "en" {
+                params.set_initial_prompt("こんにちは、私の講義へようこそ。");
+                params.set_language(Some("ja"));
+            } else if language == "ja" {
+                params.set_initial_prompt("Hello, welcome to my lecture.");
+                params.set_language(Some("en"));
+            }
         } else {
-            params.set_translate(false);
+            params.set_language(Some(language));
+            if transcription_accuracy.ends_with("en") {
+                params.set_translate(true);
+                params.set_initial_prompt("Hello, welcome to my lecture.");
+            } else {
+                params.set_translate(false);
+                if language == "en" {
+                    params.set_initial_prompt("Hello, welcome to my lecture.");
+                } else if language == "zh" {
+                    params.set_initial_prompt("你好，欢迎来到我的讲座。");
+                } else if language == "ko" {
+                    params.set_initial_prompt("안녕하세요, 제 강의에 오신 것을 환영합니다.");
+                } else if language == "fr" {
+                    params.set_initial_prompt("Bonjour, bienvenue à mon cours.");
+                } else if language == "de" {
+                    params.set_initial_prompt("Hallo, willkommen zu meiner Vorlesung.");
+                } else if language == "ru" {
+                    params.set_initial_prompt("Привет, добро пожаловать на мою лекцию.");
+                } else if language == "es" {
+                    params.set_initial_prompt("Hola, bienvenido a mi conferencia.");
+                } else if language == "pt" {
+                    params.set_initial_prompt("Olá, bem-vindo à minha palestra.");
+                } else if language == "tr" {
+                    params.set_initial_prompt("Merhaba, dersime hoş geldiniz.");
+                } else if language == "vi" {
+                    params.set_initial_prompt("Xin chào, chào mừng bạn đến với bài giảng của tôi.");
+                } else if language == "it" {
+                    params.set_initial_prompt("Ciao, benvenuto alla mia conferenza.");
+                } else if language == "nl" {
+                    params.set_initial_prompt("Hallo, welkom bij mijn lezing.");
+                } else if language == "ca" {
+                    params.set_initial_prompt("Hola, benvingut a la meva conferència.");
+                } else if language == "uk" {
+                    params.set_initial_prompt("Привіт, ласкаво просимо на мою лекцію.");
+                } else if language == "sv" {
+                    params.set_initial_prompt("Hej, välkommen till min föreläsning.");
+                } else if language == "hi" {
+                    params.set_initial_prompt("नमस्ते, मेरे व्याख्यान में आपका स्वागत है।");
+                } else if language == "cs" {
+                    params.set_initial_prompt("Ahoj, vítejte na mé přednášce.");
+                } else if language == "pl" {
+                    params.set_initial_prompt("Cześć, witaj na mojej wykładzie.");
+                } else if language == "ja" {
+                    params.set_initial_prompt("こんにちは、私の講義へようこそ。");
+                }
+            }
         }
-        params.set_language(Some(language));
         params.set_print_special(false);
         params.set_print_progress(false);
         params.set_print_realtime(false);
diff --git a/src-tauri/src/module/transcription_online.rs b/src-tauri/src/module/transcription_online.rs
index 4ba0b3c..1b80fb0 100644
--- a/src-tauri/src/module/transcription_online.rs
+++ b/src-tauri/src/module/transcription_online.rs
@@ -146,16 +146,64 @@ impl TranscriptionOnline {
             "ja"
         };
         let part_language = multipart::Part::text(language);
+        let prompt = if is_translate {
+            "Hello, welcome to my lecture."
+        } else {
+            if language == "en" {
+                "Hello, welcome to my lecture."
+            } else if language == "zh" {
+                "你好，欢迎来到我的讲座。"
+            } else if language == "ko" {
+                "안녕하세요, 제 강의에 오신 것을 환영합니다."
+            } else if language == "fr" {
+                "Bonjour, bienvenue à mon cours."
+            } else if language == "de" {
+                "Hallo, willkommen zu meiner Vorlesung."
+            } else if language == "ru" {
+                "Привет, добро пожаловать на мою лекцию."
+            } else if language == "es" {
+                "Hola, bienvenido a mi conferencia."
+            } else if language == "pt" {
+                "Olá, bem-vindo à minha palestra."
+            } else if language == "tr" {
+                "Merhaba, dersime hoş geldiniz."
+            } else if language == "vi" {
+                "Xin chào, chào mừng bạn đến với bài giảng của tôi."
+            } else if language == "it" {
+                "Ciao, benvenuto alla mia conferenza."
+            } else if language == "nl" {
+                "Hallo, welkom bij mijn lezing."
+            } else if language == "ca" {
+                "Hola, benvingut a la meva conferència."
+            } else if language == "uk" {
+                "Привіт, ласкаво просимо на мою лекцію."
+            } else if language == "sv" {
+                "Hej, välkommen till min föreläsning."
+            } else if language == "hi" {
+                "नमस्ते, मेरे व्याख्यान में आपका स्वागत है।"
+            } else if language == "cs" {
+                "Ahoj, vítejte na mé přednášce."
+            } else if language == "pl" {
+                "Cześć, witaj na mojej wykładzie."
+            } else if language == "ja" {
+                "こんにちは、私の講義へようこそ。"
+            } else {
+                "Hello, welcome to my lecture."
+            }
+        };
+        let part_prompt = multipart::Part::text(prompt);
 
         let form = if is_translate {
             multipart::Form::new()
                 .part("file", part_file)
                 .part("model", part_model)
+                .part("prompt", part_prompt)
         } else {
             multipart::Form::new()
                 .part("file", part_file)
                 .part("model", part_model)
                 .part("language", part_language)
+                .part("prompt", part_prompt)
         };
 
         let response = client
diff --git a/src-tauri/src/module/translation_en.rs b/src-tauri/src/module/translation_en.rs
new file mode 100644
index 0000000..8865e1d
--- /dev/null
+++ b/src-tauri/src/module/translation_en.rs
@@ -0,0 +1,190 @@
+use super::{sqlite::Sqlite, transcriber::Transcriber};
+
+use crossbeam_channel::Receiver;
+use ct2rs::{tokenizers::auto::Tokenizer, Config, TranslationOptions, Translator};
+use hound::SampleFormat;
+use samplerate_rs::{convert, ConverterType};
+use std::sync::Mutex;
+use tauri::{AppHandle, Manager};
+use whisper_rs::WhisperContext;
+
+#[derive(Debug, Clone, serde::Serialize)]
+pub struct TraceCompletion {} // empty payload sent with the `traceCompletion` / `traceUnCompletion` events
+
+pub struct TranslationEn { // state used by `start` / `convert` for one note
+    app_handle: AppHandle, // used to emit events with `emit_all`
+    sqlite: Sqlite, // read via `select_vosk`, written via `update_model_vosk_to_whisper`
+    ctx: WhisperContext, // built in `new` by `Transcriber::build` with "large"
+    translator: Translator<Tokenizer>, // loaded in `new` from `resources/fugumt-ja-en`
+    note_id: u64, // passed to `select_vosk` on every lookup
+}
+
+impl TranslationEn {
+    /// Builds the whisper context via `Transcriber::build(.., "large")` and loads the
+    /// ct2rs translator from the bundled `resources/fugumt-ja-en` directory.
+    ///
+    /// Panics if the resource path cannot be resolved or the translator fails to load.
+    pub fn new(app_handle: AppHandle, note_id: u64) -> Self {
+        let model_path = app_handle
+            .path_resolver()
+            .resolve_resource("resources/fugumt-ja-en")
+            .expect("failed to resolve resources/fugumt-ja-en")
+            .to_string_lossy()
+            .to_string();
+
+        TranslationEn {
+            // Clone before `app_handle` itself is moved into the struct just below.
+            ctx: Transcriber::build(app_handle.clone(), "large".to_string()),
+            app_handle,
+            sqlite: Sqlite::new(),
+            translator: Translator::new(&model_path, &Config::default()).unwrap(),
+            note_id,
+        }
+    }
+
+    /// Runs `convert` repeatedly until it fails or a stop condition is met.
+    ///
+    /// * `stop_convert_rx` - polled without blocking after each conversion; a message
+    ///   ends the loop, emitting `traceCompletion` if `select_vosk` then returns an
+    ///   error and `traceUnCompletion` otherwise.
+    /// * `is_continuous` - when true, the loop also ends with `traceCompletion` as soon
+    ///   as `select_vosk` returns an error after a conversion.
+    pub fn start(&mut self, stop_convert_rx: Receiver<()>, is_continuous: bool) {
+        while self.convert().is_ok() {
+            if is_continuous && self.sqlite.select_vosk(self.note_id).is_err() {
+                self.emit_trace("traceCompletion");
+                break;
+            }
+            if stop_convert_rx.try_recv().is_ok() {
+                let event = if self.sqlite.select_vosk(self.note_id).is_err() {
+                    "traceCompletion"
+                } else {
+                    "traceUnCompletion"
+                };
+                self.emit_trace(event);
+                break;
+            }
+        }
+    }
+
+    /// Emits an empty `TraceCompletion` payload through `emit_all` under `event`.
+    fn emit_trace(&self, event: &str) {
+        self.app_handle
+            .emit_all(event, TraceCompletion {})
+            .unwrap();
+    }
+
+    /// Transcribes the speech row returned by `select_vosk` with whisper (language
+    /// `ja`), translates the text line by line with the ct2rs translator, stores it via
+    /// `update_model_vosk_to_whisper` and emits `finalTextConverted` if it is non-empty.
+    ///
+    /// Returns the `select_vosk` error when no row can be fetched. A failed whisper run
+    /// is only logged and still yields `Ok(())`. Unreadable or unsupported WAV input and
+    /// resampling, translation or update failures panic.
+    fn convert(&mut self) -> Result<(), rusqlite::Error> {
+        let speech = self.sqlite.select_vosk(self.note_id)?;
+        let mut reader = hound::WavReader::open(speech.wav).unwrap();
+
+        let spec = reader.spec();
+        let mut data =
+            Vec::with_capacity((spec.channels as usize) * (reader.duration() as usize));
+        // Integer PCM is divided by the largest positive value of its bit depth.
+        match (spec.bits_per_sample, spec.sample_format) {
+            (16, SampleFormat::Int) => {
+                for sample in reader.samples::<i16>() {
+                    data.push((sample.unwrap() as f32) / (0x7fffi32 as f32));
+                }
+            }
+            (24, SampleFormat::Int) => {
+                // 24-bit samples arrive sign-extended in an i32, so full scale is
+                // 0x7f_ffff (2^23 - 1); dividing by 0xff_ffff would halve the level.
+                for sample in reader.samples::<i32>() {
+                    data.push((sample.unwrap() as f32) / (0x007f_ffffi32 as f32));
+                }
+            }
+            (32, SampleFormat::Int) => {
+                for sample in reader.samples::<i32>() {
+                    data.push((sample.unwrap() as f32) / (0x7fff_ffffi32 as f32));
+                }
+            }
+            (32, SampleFormat::Float) => {
+                for sample in reader.samples::<f32>() {
+                    data.push(sample.unwrap());
+                }
+            }
+            _ => panic!(
+                "Tried to read file but there was a problem: {:?}",
+                hound::Error::Unsupported
+            ),
+        }
+        let data = if spec.channels != 1 {
+            whisper_rs::convert_stereo_to_mono_audio(&data).unwrap()
+        } else {
+            data
+        };
+        // Resample the mono signal to 16 kHz before handing it to whisper.
+        let audio_data = convert(
+            spec.sample_rate,
+            16000,
+            1,
+            ConverterType::SincBestQuality,
+            &data,
+        )
+        .unwrap();
+
+        let mut state = self.ctx.create_state().expect("failed to create state");
+        let params = Transcriber::build_params("ja".to_string(), "large".to_string());
+        if state.full(params, &audio_data[..]).is_err() {
+            println!("whisper is temporarily failed, so skipping...");
+            return Ok(());
+        }
+
+        let num_segments = state
+            .full_n_segments()
+            .expect("failed to get number of segments");
+        // Segments whose text cannot be read are skipped.
+        let result_on_whisper: String = (0..num_segments)
+            .filter_map(|i| state.full_get_segment_text(i).ok())
+            .collect();
+
+        let sources: Vec<String> = result_on_whisper.lines().map(String::from).collect();
+        let res: Vec<(String, Option<f32>)> = self
+            .translator
+            .translate_batch(
+                &sources,
+                &TranslationOptions {
+                    beam_size: 5,
+                    ..Default::default()
+                },
+                None,
+            )
+            .unwrap();
+        let translated: String = res.into_iter().map(|(text, _)| text).collect();
+
+        let updated = self
+            .sqlite
+            .update_model_vosk_to_whisper(speech.id, translated)
+            .unwrap();
+        if !updated.content.is_empty() {
+            self.app_handle
+                .emit_all("finalTextConverted", updated)
+                .unwrap();
+        }
+
+        Ok(())
+    }
+}
+
+/// Process-wide slot for the single `TranslationEn`; `None` until initialized.
+pub static SINGLETON_INSTANCE: Mutex<Option<TranslationEn>> = Mutex::new(None);
+
+/// Fills the slot on first call; later calls leave the existing instance untouched.
+pub fn initialize_translation_en(app_handle: AppHandle, note_id: u64) {
+    let mut slot = SINGLETON_INSTANCE.lock().unwrap();
+    slot.get_or_insert_with(|| TranslationEn::new(app_handle, note_id));
+}
+
+/// Empties the shared slot, dropping the `TranslationEn` it held (if any).
+pub fn drop_translation_en() {
+    drop(SINGLETON_INSTANCE.lock().unwrap().take());
+}
diff --git a/src-tauri/src/module/translation_ja.rs b/src-tauri/src/module/translation_ja.rs
index aebaa57..15b0b35 100644
--- a/src-tauri/src/module/translation_ja.rs
+++ b/src-tauri/src/module/translation_ja.rs
@@ -1,7 +1,7 @@
 use super::{sqlite::Sqlite, transcriber::Transcriber};
 
 use crossbeam_channel::Receiver;
-use ct2rs::{config::Config, sentencepiece::Tokenizer, TranslationOptions, Translator};
+use ct2rs::{tokenizers::auto::Tokenizer, Config, TranslationOptions, Translator};
 use hound::SampleFormat;
 use samplerate_rs::{convert, ConverterType};
 use std::sync::Mutex;
@@ -36,7 +36,6 @@ impl TranslationJa {
             ctx: Transcriber::build(app_handle_clone, "large-translate-to-en".to_string()),
             translator: Translator::new(
                 &model_path,
-                Tokenizer::new(&model_path).unwrap(),
                 &Config::default(),
             )
             .unwrap(),
@@ -154,6 +153,7 @@ impl TranslationJa {
                             beam_size: 5,
                             ..Default::default()
                         },
+                        None
                     )
                     .unwrap();
                 let mut translated: Vec<String> = vec!["".to_string()];
diff --git a/src-tauri/src/module/translation_ja_high.rs b/src-tauri/src/module/translation_ja_high.rs
index 1f13d4d..fe112c1 100644
--- a/src-tauri/src/module/translation_ja_high.rs
+++ b/src-tauri/src/module/translation_ja_high.rs
@@ -3,12 +3,15 @@ use super::{sqlite::Sqlite, transcriber::Transcriber};
 use crossbeam_channel::Receiver;
 use hound::SampleFormat;
 use mistralrs::{
-    Constraint, DefaultSchedulerMethod, Device, DeviceMapMetadata, GGUFLoaderBuilder,
-    GGUFSpecificConfig, MistralRs, MistralRsBuilder, ModelDType, NormalRequest, Request,
-    RequestMessage, ResponseOk, SamplingParams, SchedulerConfig, TokenSource,
+    Constraint, DefaultSchedulerMethod, Device, DeviceMapMetadata, MistralRs, MistralRsBuilder,
+    ModelDType, NormalLoaderBuilder, NormalLoaderType, NormalRequest, NormalSpecificConfig,
+    Request, RequestMessage, ResponseOk, SamplingParams, SchedulerConfig, TokenSource,
 };
 use samplerate_rs::{convert, ConverterType};
-use std::sync::{Arc, Mutex};
+use std::{
+    path::PathBuf,
+    sync::{Arc, Mutex},
+};
 use tauri::{AppHandle, Manager};
 use tokio::sync::mpsc::channel;
 use whisper_rs::WhisperContext;
@@ -30,24 +33,30 @@ impl TranslationJaHigh {
         let app_handle_clone = app_handle.clone();
         let model_path = app_handle
             .path_resolver()
-            .resolve_resource(format!("resources/honyaku13b-q4-0"))
+            .resolve_resource(format!("resources/honyaku-13b"))
             .unwrap()
             .to_string_lossy()
             .to_string();
-        let loader = GGUFLoaderBuilder::new(
-            Some(format!("{}/chat_templates_llama2.json", model_path)),
-            None,
-            model_path,
-            vec!["aixsatoshi-Honyaku-13b-Q4_0.gguf".to_string()],
-            // vec!["aixsatoshi-Honyaku-13b-IQ4_XS.gguf".to_string()],
-            GGUFSpecificConfig {
+        let loader = NormalLoaderBuilder::new(
+            NormalSpecificConfig {
+                use_flash_attn: false,
                 prompt_batchsize: None,
                 topology: None,
+                organization: Default::default(),
+                write_uqff: None,
+                from_uqff: Some(PathBuf::from(format!(
+                    "{}/Honyaku-13b-q4_0.uqff",
+                    model_path
+                ))),
             },
+            None,
+            None,
+            Some(model_path),
         )
-        .build();
-        let pipeline = tokio::task::block_in_place(|| {
-            loader.load_model_from_hf(
+        .build(Some(NormalLoaderType::Llama))
+        .unwrap();
+        let pipeline = loader
+            .load_model_from_hf(
                 None,
                 TokenSource::None,
                 &ModelDType::Auto,
@@ -57,8 +66,7 @@ impl TranslationJaHigh {
                 None,
                 None,
             )
-        })
-        .unwrap();
+            .unwrap();
 
         TranslationJaHigh {
             app_handle,
@@ -70,6 +78,7 @@ impl TranslationJaHigh {
                     method: DefaultSchedulerMethod::Fixed(5.try_into().unwrap()),
                 },
             )
+            .with_no_prefix_cache(true)
             .build(),
             speaker_language,
             note_id,
@@ -177,14 +186,14 @@ impl TranslationJaHigh {
 
                 let result_on_whisper = converted.join("");
                 let prompt = format!("<english>: {} <NL>\n\n<japanese>: ", result_on_whisper);
-                let (tx, mut rx) = channel(10_000);
+                let (tx, mut rx) = channel(1);
                 let request = Request::Normal(NormalRequest {
                     messages: RequestMessage::Completion {
                         text: prompt,
                         echo_prompt: false,
                         best_of: 1,
                     },
-                    sampling_params: SamplingParams::default(),
+                    sampling_params: SamplingParams::deterministic(),
                     response: tx,
                     return_logprobs: false,
                     is_streaming: false,
diff --git a/src-tauri/tauri.conf.json b/src-tauri/tauri.conf.json
index 2a64283..6af6636 100644
--- a/src-tauri/tauri.conf.json
+++ b/src-tauri/tauri.conf.json
@@ -8,7 +8,7 @@
   },
   "package": {
     "productName": "Lycoris",
-    "version": "0.9.21"
+    "version": "0.9.22"
   },
   "tauri": {
     "allowlist": {
@@ -60,9 +60,9 @@
     "windows": [
       {
         "fullscreen": false,
-        "width": 1024,
+        "width": 1180,
         "height": 768,
-        "minWidth": 1024,
+        "minWidth": 1180,
         "minHeight": 384,
         "resizable": true,
         "title": "Lycoris"
diff --git a/src/components/Header.tsx b/src/components/Header.tsx
index 1944202..e632ddd 100644
--- a/src/components/Header.tsx
+++ b/src/components/Header.tsx
@@ -1,4 +1,4 @@
-import { useSetRecoilState } from "recoil"
+import { useRecoilValue, useSetRecoilState } from "recoil"
 import { getVersion } from '@tauri-apps/api/app';
 import { featureState } from "../store/atoms/featureState"
 import { selectedNoteState } from "../store/atoms/selectedNoteState"
@@ -6,6 +6,8 @@ import { AudioDevices } from "./molecules/AudioDevice"
 import { SpeakerLanguage } from "./molecules/SpeakerLanguage"
 import { TranscriptionAccuracy } from "./molecules/TranscriptionAccuracy"
 import { useEffect, useState } from "react";
+import { SmartVoice } from "./molecules/SmartVoice";
+import { modelStyleBertVits2DownloadedState } from "../store/atoms/modelStyleBertVits2DownloadedState";
 
 const Header = (): JSX.Element => {
     const setFeature = useSetRecoilState(featureState)
@@ -19,15 +21,20 @@ const Header = (): JSX.Element => {
         fetchVersion();
     }, []);
 
+    const downloadedBaseModels = useRecoilValue(modelStyleBertVits2DownloadedState);
+    const is_base_downloaded = downloadedBaseModels.filter(m => m === "style-bert-vits2").length > 0
+
     return (
         <header className="sticky top-0 z-10" style={{ minWidth: "770px", height: "64px" }}>
             <div className="navbar bg-base-200">
                 <div className="flex flex-1 items-baseline select-none">
-                    <a className="ml-2 font-bold text-xl text-primary mr-1" href="https://github.com/solaoi/lycoris" target="_blank">Lycoris</a>
-                    <p className="text-xs text-slate-500 cursor-default">v{appVersion}</p>
+                    <div className="flex flex-col items-end">
+                        <a className="ml-2 font-bold text-xl text-primary" href="https://github.com/solaoi/lycoris" target="_blank">Lycoris</a>
+                        <p className="text-xs text-slate-500 cursor-default">v{appVersion}</p>
+                    </div>
                 </div>
                 <div className="flex-none mr-1">
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
                         <path d="M7.75 2.75a.75.75 0 00-1.5 0v1.258a32.987 32.987 0 00-3.599.278.75.75 0 10.198 1.487A31.545 31.545 0 018.7 5.545 19.381 19.381 0 017 9.56a19.418 19.418 0 01-1.002-2.05.75.75 0 00-1.384.577 20.935 20.935 0 001.492 2.91 19.613 19.613 0 01-3.828 4.154.75.75 0 10.945 1.164A21.116 21.116 0 007 12.331c.095.132.192.262.29.391a.75.75 0 001.194-.91c-.204-.266-.4-.538-.59-.815a20.888 20.888 0 002.333-5.332c.31.031.618.068.924.108a.75.75 0 00.198-1.487 32.832 32.832 0 00-3.599-.278V2.75z" />
                         <path fillRule="evenodd" d="M13 8a.75.75 0 01.671.415l4.25 8.5a.75.75 0 11-1.342.67L15.787 16h-5.573l-.793 1.585a.75.75 0 11-1.342-.67l4.25-8.5A.75.75 0 0113 8zm2.037 6.5L13 10.427 10.964 14.5h4.073z" clipRule="evenodd" />
                     </svg>
@@ -36,7 +43,7 @@ const Header = (): JSX.Element => {
                     <SpeakerLanguage />
                 </div>
                 <div className="flex-none mr-1">
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
                         <path d="M15.98 1.804a1 1 0 00-1.96 0l-.24 1.192a1 1 0 01-.784.785l-1.192.238a1 1 0 000 1.962l1.192.238a1 1 0 01.785.785l.238 1.192a1 1 0 001.962 0l.238-1.192a1 1 0 01.785-.785l1.192-.238a1 1 0 000-1.962l-1.192-.238a1 1 0 01-.785-.785l-.238-1.192zM6.949 5.684a1 1 0 00-1.898 0l-.683 2.051a1 1 0 01-.633.633l-2.051.683a1 1 0 000 1.898l2.051.684a1 1 0 01.633.632l.683 2.051a1 1 0 001.898 0l.683-2.051a1 1 0 01.633-.633l2.051-.683a1 1 0 000-1.898l-2.051-.683a1 1 0 01-.633-.633L6.95 5.684zM13.949 13.684a1 1 0 00-1.898 0l-.184.551a1 1 0 01-.632.633l-.551.183a1 1 0 000 1.898l.551.183a1 1 0 01.633.633l.183.551a1 1 0 001.898 0l.184-.551a1 1 0 01.632-.633l.551-.183a1 1 0 000-1.898l-.551-.184a1 1 0 01-.633-.632l-.183-.551z" />
                     </svg>
                 </div>
@@ -44,14 +51,30 @@ const Header = (): JSX.Element => {
                     <TranscriptionAccuracy />
                 </div>
                 <div className="flex-none mr-1">
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
                         <path d="M7 4a3 3 0 016 0v6a3 3 0 11-6 0V4z" />
                         <path d="M5.5 9.643a.75.75 0 00-1.5 0V10c0 3.06 2.29 5.585 5.25 5.954V17.5h-1.5a.75.75 0 000 1.5h4.5a.75.75 0 000-1.5h-1.5v-1.546A6.001 6.001 0 0016 10v-.357a.75.75 0 00-1.5 0V10a4.5 4.5 0 01-9 0v-.357z" />
                     </svg>
                 </div>
-                <div className="flex-none mr-4">
-                    <AudioDevices />
-                </div>
+                {is_base_downloaded ?
+                    <>
+                        <div className="flex-none mr-2">
+                            <AudioDevices />
+                        </div>
+                        <div className="flex-none mr-1">
+                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                <path d="M13.92 3.845a19.362 19.362 0 0 1-6.3 1.98C6.765 5.942 5.89 6 5 6a4 4 0 0 0-.504 7.969 15.97 15.97 0 0 0 1.271 3.34c.397.771 1.342 1 2.05.59l.867-.5c.726-.419.94-1.32.588-2.02-.166-.331-.315-.666-.448-1.004 1.8.357 3.511.963 5.096 1.78A17.964 17.964 0 0 0 15 10c0-2.162-.381-4.235-1.08-6.155ZM15.243 3.097A19.456 19.456 0 0 1 16.5 10c0 2.43-.445 4.758-1.257 6.904l-.03.077a.75.75 0 0 0 1.401.537 20.903 20.903 0 0 0 1.312-5.745 2 2 0 0 0 0-3.546 20.902 20.902 0 0 0-1.312-5.745.75.75 0 0 0-1.4.537l.029.078Z" />
+                            </svg>
+                        </div>
+                        <div className="flex-none mr-4">
+                            <SmartVoice />
+                        </div>
+                    </>
+                    :
+                    <div className="flex-none mr-4">
+                        <AudioDevices />
+                    </div>
+                }
                 <div className="group cursor-pointer select-none flex-none mr-2" onClick={() => { setFeature("settings"); setSelectedNote(null); }}>
                     <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth={1.5} stroke="currentColor" className="w-6 h-6 hover:animate-spin-slow">
                         <path strokeLinecap="round" strokeLinejoin="round" d="M9.594 3.94c.09-.542.56-.94 1.11-.94h2.593c.55 0 1.02.398 1.11.94l.213 1.281c.063.374.313.686.645.87.074.04.147.083.22.127.324.196.72.257 1.075.124l1.217-.456a1.125 1.125 0 011.37.49l1.296 2.247a1.125 1.125 0 01-.26 1.431l-1.003.827c-.293.24-.438.613-.431.992a6.759 6.759 0 010 .255c-.007.378.138.75.43.99l1.005.828c.424.35.534.954.26 1.43l-1.298 2.247a1.125 1.125 0 01-1.369.491l-1.217-.456c-.355-.133-.75-.072-1.076.124a6.57 6.57 0 01-.22.128c-.331.183-.581.495-.644.869l-.213 1.28c-.09.543-.56.941-1.11.941h-2.594c-.55 0-1.02-.398-1.11-.94l-.213-1.281c-.062-.374-.312-.686-.644-.87a6.52 6.52 0 01-.22-.127c-.325-.196-.72-.257-1.076-.124l-1.217.456a1.125 1.125 0 01-1.369-.49l-1.297-2.247a1.125 1.125 0 01.26-1.431l1.004-.827c.292-.24.437-.613.43-.992a6.932 6.932 0 010-.255c.007-.378-.138-.75-.43-.99l-1.004-.828a1.125 1.125 0 01-.26-1.43l1.297-2.247a1.125 1.125 0 011.37-.491l1.216.456c.356.133.751.072 1.076-.124.072-.044.146-.087.22-.128.332-.183.582-.495.644-.869l.214-1.281z" />
diff --git a/src/components/molecules/ActionSet.tsx b/src/components/molecules/ActionSet.tsx
index fc0ab52..fea59bc 100644
--- a/src/components/molecules/ActionSet.tsx
+++ b/src/components/molecules/ActionSet.tsx
@@ -1,10 +1,12 @@
 import { useRef, useState } from "react"
+import { useRecoilState } from "recoil"
+import { actionState } from "../../store/atoms/actionState"
 
 const ActionSet = (): JSX.Element => {
     const dropdownRef = useRef<HTMLLabelElement>(null)
 
-    const [targetAction, setTargetAction] = useState<string | null>("チャット")
-    const actions = ["チャット"]
+    const [targetAction, setTargetAction] = useRecoilState(actionState)
+    const actions = ["チャット", "発話サジェスト"]
     const [toggle, setToggle] = useState(false)
 
     const change = (actionName: string) => {
diff --git a/src/components/molecules/AppWindow.tsx b/src/components/molecules/AppWindow.tsx
index 54f4056..a275c31 100644
--- a/src/components/molecules/AppWindow.tsx
+++ b/src/components/molecules/AppWindow.tsx
@@ -5,6 +5,8 @@ import { AppWindowType } from "../../type/AppWindow.type"
 import { appWindowState } from "../../store/atoms/appWindowState"
 import { useHasPermissionScreenCapture } from "../../hooks/useHasPermissionScreenCapture"
 import { ScreenShotButton } from "./ScreenshotButton"
+import { appSelectedState } from "../../store/atoms/appSelectedState"
+import { appWindowsState } from "../../store/atoms/appWindowsState"
 
 const AppWindow = (): JSX.Element => {
     const [isDesktopAudioToggled, setIsDesktopAudioToggled] = useState<boolean | null>(null)
@@ -12,25 +14,27 @@ const AppWindow = (): JSX.Element => {
 
     const dropdownRef = useRef<HTMLLabelElement>(null)
 
-    const [targetApp, setTargetApp] = useState<string | null>(null)
-    const [apps, setApps] = useState<string[]>([])
+    const [targetApp, setTargetApp] = useRecoilState(appSelectedState)
+    const [apps, setApps] = useState([] as string[])
     const [toggle, setToggle] = useState(false)
     useEffect(() => {
         invoke('list_apps_command').then(apps => setApps(apps as string[]))
     }, [toggle])
 
     const [targetWindow, setTargetWindow] = useRecoilState(appWindowState)
-    const [appWindows, setAppWindows] = useState<AppWindowType[]>([])
-    const change = (e: ChangeEvent<HTMLInputElement>) => {
+    const [appWindows, setAppWindows] = useRecoilState(appWindowsState)
+    const change = (appWindowId: number) => {
         dropdownRef.current?.focus();
-        if (e.target.checked) {
-            const appWindowId = e.target.value
-            const targetAppWindow = appWindows.filter(({ id }) => id === parseInt(appWindowId))[0]
-            setTargetWindow(targetAppWindow)
+        const targetAppWindows = appWindows.filter(({ id }) => id === appWindowId)
+        if (targetAppWindows.length > 1) {
+            setTargetWindow(null)
+        } else {
+            setTargetWindow(targetAppWindows[0])
         }
     }
     const click = (appName: string) => {
         setTargetApp(appName)
+        setTargetWindow(null)
         invoke('list_app_windows_command', { appName })
             .then(windows => setAppWindows(windows as AppWindowType[]))
     }
@@ -42,48 +46,50 @@ const AppWindow = (): JSX.Element => {
         }
     }
 
-    return (<>
-        <div className="dropdown dropdown-top" onClick={() =>
-            setIsDesktopAudioToggled(!isDesktopAudioToggled)
-        }>
-            <label ref={dropdownRef} onMouseDown={e => checkAndCloseDropDown(e.currentTarget)} tabIndex={0} className="group normal-case btn w-52 flex justify-between" style={{ color: "inherit", backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
-            >
-                <div className="w-36 text-left overflow-x-hidden whitespace-nowrap text-ellipsis">{(targetApp === null || targetWindow === null) ? "撮影する画面を選択" : `${targetApp} / ${targetWindow.title}`}</div>
-                <div>
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
-                        <path fillRule="evenodd" d="M9.47 6.47a.75.75 0 0 1 1.06 0l4.25 4.25a.75.75 0 1 1-1.06 1.06L10 8.06l-3.72 3.72a.75.75 0 0 1-1.06-1.06l4.25-4.25Z" clipRule="evenodd" />
-                    </svg>
-                </div>
-                <div className="opacity-0 w-24 invisible rounded text-[12px] 
+    return (
+        <>
+            <div className="dropdown dropdown-top" onClick={() =>
+                setIsDesktopAudioToggled(!isDesktopAudioToggled)
+            }>
+                <label ref={dropdownRef} onMouseDown={e => checkAndCloseDropDown(e.currentTarget)} tabIndex={0} className="group normal-case btn w-52 flex justify-between" style={{ color: "inherit", backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
+                >
+                    <div className="w-36 text-left overflow-x-hidden whitespace-nowrap text-ellipsis">{(targetApp === null || targetWindow === null) ? "撮影する画面を選択" : `${targetApp} / ${targetWindow.title}`}</div>
+                    <div>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                            <path fillRule="evenodd" d="M9.47 6.47a.75.75 0 0 1 1.06 0l4.25 4.25a.75.75 0 1 1-1.06 1.06L10 8.06l-3.72 3.72a.75.75 0 0 1-1.06-1.06l4.25-4.25Z" clipRule="evenodd" />
+                        </svg>
+                    </div>
+                    <div className="opacity-0 w-24 invisible rounded text-[12px] 
                     font-bold text-white py-1 bg-slate-600 top-[-1.25rem] left-4 z-10
                     group-hover:visible opacity-100 absolute">撮影する画面
-                </div>
-            </label>
-            {hasPermissionScreenCapture && <div tabIndex={0} className="p-0 dropdown-content menu rounded-box w-[15.5rem] bg-white join join-vertical"
-                style={{ backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
-            >
-                <div className="max-h-80 overflow-y-scroll rounded-box scrollbar-transparent w-full">
-                    {apps.map((app, i) => (
-                        <div key={"app_" + i} className={"collapse collapse-arrow join-item" + (app === targetApp ? " bg-base-200" : "")}>
-                            <input className="w-full" type="radio" name={"app-window_" + i} checked={app === targetApp} value={app} onChange={() => click(app)} />
-                            <div className="collapse-title font-medium w-[15.5rem]" style={{ overflowWrap: "anywhere" }}>
-                                {app}
+                    </div>
+                </label>
+                {hasPermissionScreenCapture && <div tabIndex={0} className="p-0 dropdown-content menu rounded-box w-[15.5rem] bg-white join join-vertical"
+                    style={{ backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
+                >
+                    <div className="max-h-80 overflow-y-scroll rounded-box scrollbar-transparent w-full">
+                        {apps.map((app, i) => (
+                            <div key={"app_" + i} className={"collapse collapse-arrow join-item" + (app === targetApp ? " bg-base-200" : "")}>
+                                <input className="w-full" type="radio" name={"app-window_" + i} checked={app === targetApp} value={app} onChange={() => click(app)} />
+                                <div className="collapse-title font-medium w-[15.5rem]" style={{ overflowWrap: "anywhere" }}>
+                                    {app}
+                                </div>
+                                <div className="collapse-content flex flex-col w-[15.5rem]" style={{ overflowWrap: "anywhere" }}>
+                                    {appWindows.map(({ id, title }) => (
+                                        <label key={"appWindow_" + id} className="label inline-flex active:!bg-inherit cursor-pointer">
+                                            <input type="radio" name="app-window-option" className={"radio radio-accent mr-2" + (id === targetWindow?.id ? " checked" : "")} onChange={() => change(id)} value={id} defaultChecked={id === targetWindow?.id} />
+                                            <a className="grow">{title}</a>
+                                        </label>
+                                    ))}
+                                </div>
                             </div>
-                            <div className="collapse-content flex flex-col w-[15.5rem]" style={{ overflowWrap: "anywhere" }}>
-                                {appWindows.map(({ id, title }) => (
-                                    <label key={"appWindow_" + id} className="label inline-flex active:!bg-inherit cursor-pointer">
-                                        <input type="radio" name="app-window-option" className="radio radio-accent mr-2" onChange={change} value={id} defaultChecked={id === targetWindow?.id} />
-                                        <a className="grow">{title}</a>
-                                    </label>
-                                ))}
-                            </div>
-                        </div>
-                    ))}
-                </div>
-            </div>}
-        </div>
-        <div className="h-2"></div>
-        <ScreenShotButton hasPermissionScreenCapture={hasPermissionScreenCapture} /></>
+                        ))}
+                    </div>
+                </div>}
+            </div>
+            <div className="h-2"></div>
+            <ScreenShotButton hasPermissionScreenCapture={hasPermissionScreenCapture} />
+        </>
     )
 }
 
diff --git a/src/components/molecules/ModelDownloadFugumtEnJaButton.tsx b/src/components/molecules/ModelDownloadFugumtEnJaButton.tsx
new file mode 100644
index 0000000..81261e4
--- /dev/null
+++ b/src/components/molecules/ModelDownloadFugumtEnJaButton.tsx
@@ -0,0 +1,44 @@
+import { invoke } from '@tauri-apps/api/tauri'
+import { useRecoilState, useRecoilValue } from 'recoil'
+import { modelFugumtEnJaDownloadingState } from '../../store/atoms/modelFugumtEnJaDownloadingState'
+import { modelFugumtEnJaDownloadedState } from '../../store/atoms/modelFugumtEnJaDownloadedState'
+import { modelWhisperDownloadedState } from '../../store/atoms/modelWhisperDownloadedState'
+
+/**
+ * Download button for the "fugumt-en-ja" model.
+ *
+ * Disabled while the model is downloading, after it has been downloaded, and
+ * until "large" is present in `modelWhisperDownloadedState` (the base model).
+ */
+const ModelDownloadFugumtEnJaButton = (): JSX.Element => {
+    const modelType = "fugumt-en-ja"
+    const downloadedModels = useRecoilValue(modelFugumtEnJaDownloadedState)
+    const downloadedBaseModels = useRecoilValue(modelWhisperDownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtEnJaDownloadingState)
+
+    const is_downloaded = downloadedModels.some(m => m === modelType)
+    const is_downloading = downloadingModels.some(m => m === modelType)
+    const is_base_downloaded = downloadedBaseModels.some(m => m === "large")
+
+    const click = () => {
+        // Functional update: keeps entries written after this render and never adds a duplicate.
+        setDownloadingModels(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+        invoke('download_fugumt_enja_model_command').catch(err => {
+            // The command was rejected: undo the "downloading" mark so the button is not stuck disabled.
+            console.error(err)
+            setDownloadingModels(prev => prev.filter(m => m !== modelType))
+        })
+    }
+
+    // Label: "Download" / "Downloaded", or "Requires: general-purpose pack" when the base model is missing.
+    return (
+        <button className="btn gap-2 glass border border-solid border-neutral-300 text-secondary select-none" onClick={click} disabled={is_downloaded || is_downloading || !is_base_downloaded}>
+            <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth="1.5" stroke="currentColor" className="w-6 h-6">
+                <path strokeLinecap="round" strokeLinejoin="round" d="M9 12.75l3 3m0 0l3-3m-3 3v-7.5M21 12a9 9 0 11-18 0 9 9 0 0118 0z" />
+            </svg>
+            {is_base_downloaded ? "ダウンロード" + (is_downloaded ? "済" : "") : "要：汎用パック"}
+        </button>
+    )
+}
+
+export { ModelDownloadFugumtEnJaButton }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadFugumtProgress.tsx b/src/components/molecules/ModelDownloadFugumtEnJaProgress.tsx
similarity index 73%
rename from src/components/molecules/ModelDownloadFugumtProgress.tsx
rename to src/components/molecules/ModelDownloadFugumtEnJaProgress.tsx
index 33ca420..86c7742 100644
--- a/src/components/molecules/ModelDownloadFugumtProgress.tsx
+++ b/src/components/molecules/ModelDownloadFugumtEnJaProgress.tsx
@@ -1,21 +1,21 @@
 import { useRecoilState, useSetRecoilState } from 'recoil'
-import { modelFugumtDownloadingState } from '../../store/atoms/modelFugumtDownloadingState'
+import { modelFugumtEnJaDownloadingState } from '../../store/atoms/modelFugumtEnJaDownloadingState'
 import { listen } from '@tauri-apps/api/event'
 import { useEffect, useState } from 'react'
 import { ProgressType } from '../../type/progress.type'
-import { modelFugumtDownloadedState } from '../../store/atoms/modelFugumtDownloadedState'
+import { modelFugumtEnJaDownloadedState } from '../../store/atoms/modelFugumtEnJaDownloadedState'
 
-const ModelDownloadFugumtProgress = (): JSX.Element => {
+const ModelDownloadFugumtEnJaProgress = (): JSX.Element => {
     const modelType = "fugumt-en-ja"
-    const setDownloadedModel = useSetRecoilState(modelFugumtDownloadedState)
-    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtDownloadingState)
+    const setDownloadedModel = useSetRecoilState(modelFugumtEnJaDownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtEnJaDownloadingState)
     const [progress, setProgress] = useState<ProgressType>({
         model_type: modelType,
         rate: 0,
         is_progress: false
     })
     useEffect(() => {
-        const unlisten = listen('downloadFugumtProgress', event => {
+        const unlisten = listen('downloadFugumtEnJaProgress', event => {
             const p = event.payload as ProgressType
             if (p.model_type === modelType) {
                 setProgress(p)
@@ -39,4 +39,4 @@ const ModelDownloadFugumtProgress = (): JSX.Element => {
     return (<></>)
 }
 
-export { ModelDownloadFugumtProgress }
\ No newline at end of file
+export { ModelDownloadFugumtEnJaProgress }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadFugumtJaEnButton.tsx b/src/components/molecules/ModelDownloadFugumtJaEnButton.tsx
new file mode 100644
index 0000000..a1a7f6f
--- /dev/null
+++ b/src/components/molecules/ModelDownloadFugumtJaEnButton.tsx
@@ -0,0 +1,44 @@
+import { invoke } from '@tauri-apps/api/tauri'
+import { useRecoilState, useRecoilValue } from 'recoil'
+import { modelFugumtJaEnDownloadingState } from '../../store/atoms/modelFugumtJaEnDownloadingState'
+import { modelFugumtJaEnDownloadedState } from '../../store/atoms/modelFugumtJaEnDownloadedState'
+import { modelWhisperDownloadedState } from '../../store/atoms/modelWhisperDownloadedState'
+
+/**
+ * Download button for the "fugumt-ja-en" model.
+ *
+ * Disabled while the model is downloading, after it has been downloaded, and
+ * until "large" is present in `modelWhisperDownloadedState` (the base model).
+ */
+const ModelDownloadFugumtJaEnButton = (): JSX.Element => {
+    const modelType = "fugumt-ja-en"
+    const downloadedModels = useRecoilValue(modelFugumtJaEnDownloadedState)
+    const downloadedBaseModels = useRecoilValue(modelWhisperDownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtJaEnDownloadingState)
+
+    const is_downloaded = downloadedModels.some(m => m === modelType)
+    const is_downloading = downloadingModels.some(m => m === modelType)
+    const is_base_downloaded = downloadedBaseModels.some(m => m === "large")
+
+    const click = () => {
+        // Functional update: keeps entries written after this render and never adds a duplicate.
+        setDownloadingModels(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+        invoke('download_fugumt_jaen_model_command').catch(err => {
+            // The command was rejected: undo the "downloading" mark so the button is not stuck disabled.
+            console.error(err)
+            setDownloadingModels(prev => prev.filter(m => m !== modelType))
+        })
+    }
+
+    // Label: "Download" / "Downloaded", or "Requires: general-purpose pack" when the base model is missing.
+    return (
+        <button className="btn gap-2 glass border border-solid border-neutral-300 text-secondary select-none" onClick={click} disabled={is_downloaded || is_downloading || !is_base_downloaded}>
+            <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth="1.5" stroke="currentColor" className="w-6 h-6">
+                <path strokeLinecap="round" strokeLinejoin="round" d="M9 12.75l3 3m0 0l3-3m-3 3v-7.5M21 12a9 9 0 11-18 0 9 9 0 0118 0z" />
+            </svg>
+            {is_base_downloaded ? "ダウンロード" + (is_downloaded ? "済" : "") : "要：汎用パック"}
+        </button>
+    )
+}
+
+export { ModelDownloadFugumtJaEnButton }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadFugumtJaEnProgress.tsx b/src/components/molecules/ModelDownloadFugumtJaEnProgress.tsx
new file mode 100644
index 0000000..8984eb7
--- /dev/null
+++ b/src/components/molecules/ModelDownloadFugumtJaEnProgress.tsx
@@ -0,0 +1,51 @@
+import { useRecoilState, useSetRecoilState } from 'recoil'
+import { modelFugumtJaEnDownloadingState } from '../../store/atoms/modelFugumtJaEnDownloadingState'
+import { listen } from '@tauri-apps/api/event'
+import { useEffect, useState } from 'react'
+import { ProgressType } from '../../type/progress.type'
+import { modelFugumtJaEnDownloadedState } from '../../store/atoms/modelFugumtJaEnDownloadedState'
+
+/**
+ * Progress bar for the "fugumt-ja-en" model download.
+ *
+ * Listens for `downloadFugumtJaEnProgress` events and renders a bar while the
+ * model is listed in `modelFugumtJaEnDownloadingState`; renders nothing otherwise.
+ */
+const ModelDownloadFugumtJaEnProgress = (): JSX.Element => {
+    const modelType = "fugumt-ja-en"
+    const setDownloadedModel = useSetRecoilState(modelFugumtJaEnDownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtJaEnDownloadingState)
+    const [progress, setProgress] = useState<ProgressType>({
+        model_type: modelType,
+        rate: 0,
+        is_progress: false
+    })
+    useEffect(() => {
+        const unlisten = listen('downloadFugumtJaEnProgress', event => {
+            const p = event.payload as ProgressType
+            if (p.model_type !== modelType) return
+            setProgress(p)
+            if (!p.is_progress) {
+                // `is_progress === false` is treated as the end of the download: leave the "downloading" list...
+                setDownloadingModels(prev => prev.filter(m => m !== modelType))
+                // ...and join the "downloaded" list, without duplicating the entry if the event repeats.
+                setDownloadedModel(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+            }
+        })
+        return () => {
+            // `listen` resolves to the unlisten function; call it once it is available.
+            unlisten.then(f => f());
+        }
+    }, [])
+    if (!downloadingModels.some(m => m === modelType)) {
+        return (<></>)
+    }
+    // At 100% the label switches to "解凍中" (extracting) instead of the percentage.
+    return (
+        <div className="w-full bg-gray-200 rounded-full dark:bg-gray-700">
+            <div className="bg-blue-600 text-xs font-medium text-blue-100 text-center p-0.5 leading-none rounded-full" style={{ width: `${progress.rate}%` }}>{progress.rate === 100 ? "解凍中" : `${progress.rate}%`}</div>
+        </div>
+    )
+}
+
+export { ModelDownloadFugumtJaEnProgress }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadHonyaku13BButton.tsx b/src/components/molecules/ModelDownloadHonyaku13BButton.tsx
index ddce6d1..89dbcd7 100644
--- a/src/components/molecules/ModelDownloadHonyaku13BButton.tsx
+++ b/src/components/molecules/ModelDownloadHonyaku13BButton.tsx
@@ -2,10 +2,12 @@ import { invoke } from '@tauri-apps/api/tauri'
 import { useRecoilState, useRecoilValue } from 'recoil'
 import { modelHonyaku13BDownloadingState } from '../../store/atoms/modelHonyaku13BDownloadingState'
 import { modelHonyaku13BDownloadedState } from '../../store/atoms/modelHonyaku13BDownloadedState'
+import { modelWhisperDownloadedState } from '../../store/atoms/modelWhisperDownloadedState'
 
 const ModelDownloadHonyaku13BButton = (): JSX.Element => {
-    const modelType = "honyaku13b-q4-0"
+    const modelType = "honyaku-13b"
     const downloadedModels = useRecoilValue(modelHonyaku13BDownloadedState)
+    const downloadedBaseModels = useRecoilValue(modelWhisperDownloadedState)
     const [downloadingModels, setDownloadingModels] = useRecoilState(modelHonyaku13BDownloadingState)
     const click = () => {
         setDownloadingModels([...downloadingModels, modelType])
@@ -13,13 +15,14 @@ const ModelDownloadHonyaku13BButton = (): JSX.Element => {
     }
     const is_downloaded = downloadedModels.filter(m => m === modelType).length > 0
     const is_downloading = downloadingModels.filter(m => m === modelType).length > 0
+    const is_base_downloaded = downloadedBaseModels.filter(m => m === "large").length > 0
 
     return (
-        <button className="btn gap-2 glass border border-solid border-neutral-300 text-secondary select-none" onClick={click} disabled={is_downloaded || is_downloading}>
+        <button className="btn gap-2 glass border border-solid border-neutral-300 text-secondary select-none" onClick={click} disabled={is_downloaded || is_downloading || !is_base_downloaded}>
             <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth="1.5" stroke="currentColor" className="w-6 h-6">
                 <path strokeLinecap="round" strokeLinejoin="round" d="M9 12.75l3 3m0 0l3-3m-3 3v-7.5M21 12a9 9 0 11-18 0 9 9 0 0118 0z" />
             </svg>
-            ダウンロード{is_downloaded && "済"}
+            {is_base_downloaded ? "ダウンロード" + (is_downloaded ? "済" : "") : "要：汎用パック"}
         </button>
     )
 }
diff --git a/src/components/molecules/ModelDownloadHonyaku13BProgress.tsx b/src/components/molecules/ModelDownloadHonyaku13BProgress.tsx
index 54f6523..c1f2b98 100644
--- a/src/components/molecules/ModelDownloadHonyaku13BProgress.tsx
+++ b/src/components/molecules/ModelDownloadHonyaku13BProgress.tsx
@@ -6,7 +6,7 @@ import { ProgressType } from '../../type/progress.type'
 import { modelHonyaku13BDownloadedState } from '../../store/atoms/modelHonyaku13BDownloadedState'
 
 const ModelDownloadHonyaku13BProgress = (): JSX.Element => {
-    const modelType = "honyaku13b-q4-0"
+    const modelType = "honyaku-13b"
     const setDownloadedModel = useSetRecoilState(modelHonyaku13BDownloadedState)
     const [downloadingModels, setDownloadingModels] = useRecoilState(modelHonyaku13BDownloadingState)
     const [progress, setProgress] = useState<ProgressType>({
diff --git a/src/components/molecules/ModelDownloadFugumtButton.tsx b/src/components/molecules/ModelDownloadStyleBertVits2Button.tsx
similarity index 65%
rename from src/components/molecules/ModelDownloadFugumtButton.tsx
rename to src/components/molecules/ModelDownloadStyleBertVits2Button.tsx
index 50bc0b2..17ea18a 100644
--- a/src/components/molecules/ModelDownloadFugumtButton.tsx
+++ b/src/components/molecules/ModelDownloadStyleBertVits2Button.tsx
@@ -1,15 +1,15 @@
 import { invoke } from '@tauri-apps/api/tauri'
 import { useRecoilState, useRecoilValue } from 'recoil'
-import { modelFugumtDownloadingState } from '../../store/atoms/modelFugumtDownloadingState'
-import { modelFugumtDownloadedState } from '../../store/atoms/modelFugumtDownloadedState'
+import { modelStyleBertVits2DownloadingState } from '../../store/atoms/modelStyleBertVits2DownloadingState'
+import { modelStyleBertVits2DownloadedState } from '../../store/atoms/modelStyleBertVits2DownloadedState'
 
-const ModelDownloadFugumtButton = (): JSX.Element => {
-    const modelType = "fugumt-en-ja"
-    const downloadedModels = useRecoilValue(modelFugumtDownloadedState)
-    const [downloadingModels, setDownloadingModels] = useRecoilState(modelFugumtDownloadingState)
+const ModelDownloadStyleBertVits2Button = (): JSX.Element => {
+    const modelType = "style-bert-vits2"
+    const downloadedModels = useRecoilValue(modelStyleBertVits2DownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelStyleBertVits2DownloadingState)
     const click = () => {
         setDownloadingModels([...downloadingModels, modelType])
-        invoke('download_fugumt_model_command')
+        invoke('download_sbv2_command')
     }
     const is_downloaded = downloadedModels.filter(m => m === modelType).length > 0
     const is_downloading = downloadingModels.filter(m => m === modelType).length > 0
@@ -24,4 +24,4 @@ const ModelDownloadFugumtButton = (): JSX.Element => {
     )
 }
 
-export { ModelDownloadFugumtButton }
\ No newline at end of file
+export { ModelDownloadStyleBertVits2Button }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadStyleBertVits2Progress.tsx b/src/components/molecules/ModelDownloadStyleBertVits2Progress.tsx
new file mode 100644
index 0000000..3e43361
--- /dev/null
+++ b/src/components/molecules/ModelDownloadStyleBertVits2Progress.tsx
@@ -0,0 +1,51 @@
+import { useRecoilState, useSetRecoilState } from 'recoil'
+import { modelStyleBertVits2DownloadingState } from '../../store/atoms/modelStyleBertVits2DownloadingState'
+import { listen } from '@tauri-apps/api/event'
+import { useEffect, useState } from 'react'
+import { ProgressType } from '../../type/progress.type'
+import { modelStyleBertVits2DownloadedState } from '../../store/atoms/modelStyleBertVits2DownloadedState'
+
+/**
+ * Progress bar for the "style-bert-vits2" download.
+ *
+ * Listens for `downloadStyleBertVits2Progress` events and renders a bar while the
+ * model is listed in `modelStyleBertVits2DownloadingState`; renders nothing otherwise.
+ */
+const ModelDownloadStyleBertVits2Progress = (): JSX.Element => {
+    const modelType = "style-bert-vits2"
+    const setDownloadedModel = useSetRecoilState(modelStyleBertVits2DownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelStyleBertVits2DownloadingState)
+    const [progress, setProgress] = useState<ProgressType>({
+        model_type: modelType,
+        rate: 0,
+        is_progress: false
+    })
+    useEffect(() => {
+        const unlisten = listen('downloadStyleBertVits2Progress', event => {
+            const p = event.payload as ProgressType
+            if (p.model_type !== modelType) return
+            setProgress(p)
+            if (!p.is_progress) {
+                // `is_progress === false` is treated as the end of the download: leave the "downloading" list...
+                setDownloadingModels(prev => prev.filter(m => m !== modelType))
+                // ...and join the "downloaded" list, without duplicating the entry if the event repeats.
+                setDownloadedModel(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+            }
+        })
+        return () => {
+            // `listen` resolves to the unlisten function; call it once it is available.
+            unlisten.then(f => f());
+        }
+    }, [])
+    if (!downloadingModels.some(m => m === modelType)) {
+        return (<></>)
+    }
+    // At 100% the label switches to "解凍中" (extracting) instead of the percentage.
+    return (
+        <div className="w-full bg-gray-200 rounded-full dark:bg-gray-700">
+            <div className="bg-blue-600 text-xs font-medium text-blue-100 text-center p-0.5 leading-none rounded-full" style={{ width: `${progress.rate}%` }}>{progress.rate === 100 ? "解凍中" : `${progress.rate}%`}</div>
+        </div>
+    )
+}
+
+export { ModelDownloadStyleBertVits2Progress }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadStyleBertVits2VoiceButton.tsx b/src/components/molecules/ModelDownloadStyleBertVits2VoiceButton.tsx
new file mode 100644
index 0000000..9705460
--- /dev/null
+++ b/src/components/molecules/ModelDownloadStyleBertVits2VoiceButton.tsx
@@ -0,0 +1,49 @@
+import { invoke } from '@tauri-apps/api/tauri'
+import { useRecoilState, useRecoilValue } from 'recoil'
+import { modelStyleBertVits2VoiceDownloadingState } from '../../store/atoms/modelStyleBertVits2VoiceDownloadingState'
+import { modelStyleBertVits2VoiceDownloadedState } from '../../store/atoms/modelStyleBertVits2VoiceDownloadedState'
+import { modelStyleBertVits2DownloadedState } from '../../store/atoms/modelStyleBertVits2DownloadedState'
+
+type Props = {
+    /** Voice model name; passed to the backend command as its `model` argument. */
+    modelType: string
+}
+
+/**
+ * Download button for one Style-Bert-VITS2 voice model.
+ *
+ * Disabled while that voice is downloading, after it has been downloaded, and
+ * until "style-bert-vits2" is present in `modelStyleBertVits2DownloadedState`.
+ */
+const ModelDownloadStyleBertVits2VoiceButton = (props: Props): JSX.Element => {
+    const { modelType } = props
+    const downloadedModels = useRecoilValue(modelStyleBertVits2VoiceDownloadedState);
+    const downloadedBaseModels = useRecoilValue(modelStyleBertVits2DownloadedState);
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelStyleBertVits2VoiceDownloadingState)
+
+    const is_downloaded = downloadedModels.some(m => m === modelType)
+    const is_downloading = downloadingModels.some(m => m === modelType)
+    const is_base_downloaded = downloadedBaseModels.some(m => m === "style-bert-vits2")
+
+    const click = () => {
+        // The downloading list is shared by every voice button: update it functionally so entries are never lost.
+        setDownloadingModels(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+        invoke('download_sbv2_model_command', { model: modelType }).catch(err => {
+            // The command was rejected: undo the "downloading" mark so the button is not stuck disabled.
+            console.error(err)
+            setDownloadingModels(prev => prev.filter(m => m !== modelType))
+        })
+    }
+
+    // Label: "Download" / "Downloaded", or "Requires: base engine" when the base engine is missing.
+    return (
+        <button className="btn glass border border-solid border-neutral-300 gap-2 text-secondary select-none" onClick={click} disabled={is_downloaded || is_downloading || !is_base_downloaded}>
+            <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth="1.5" stroke="currentColor" className="w-6 h-6">
+                <path strokeLinecap="round" strokeLinejoin="round" d="M9 12.75l3 3m0 0l3-3m-3 3v-7.5M21 12a9 9 0 11-18 0 9 9 0 0118 0z" />
+            </svg>
+            {is_base_downloaded ? "ダウンロード" + (is_downloaded ? "済" : "") : "要：基本エンジン"}
+        </button>
+    )
+}
+
+export { ModelDownloadStyleBertVits2VoiceButton }
\ No newline at end of file
diff --git a/src/components/molecules/ModelDownloadStyleBertVits2VoiceProgress.tsx b/src/components/molecules/ModelDownloadStyleBertVits2VoiceProgress.tsx
new file mode 100644
index 0000000..ac1615c
--- /dev/null
+++ b/src/components/molecules/ModelDownloadStyleBertVits2VoiceProgress.tsx
@@ -0,0 +1,56 @@
+import { useRecoilState, useSetRecoilState } from 'recoil'
+import { listen } from '@tauri-apps/api/event'
+import { useEffect, useState } from 'react'
+import { ProgressType } from '../../type/progress.type'
+import { modelStyleBertVits2VoiceDownloadingState } from '../../store/atoms/modelStyleBertVits2VoiceDownloadingState'
+import { modelStyleBertVits2VoiceDownloadedState } from '../../store/atoms/modelStyleBertVits2VoiceDownloadedState'
+
+type Props = {
+    /** Voice model name; only progress events whose `model_type` equals it are handled. */
+    modelType: string
+}
+
+/**
+ * Progress bar for one Style-Bert-VITS2 voice model download.
+ *
+ * Listens for `downloadStyleBertVits2VoiceProgress` events and renders a bar while
+ * `modelType` is listed in `modelStyleBertVits2VoiceDownloadingState`; renders nothing otherwise.
+ */
+const ModelDownloadStyleBertVits2VoiceProgress = (props: Props): JSX.Element => {
+    const { modelType } = props
+    const setDownloadedModel = useSetRecoilState(modelStyleBertVits2VoiceDownloadedState)
+    const [downloadingModels, setDownloadingModels] = useRecoilState(modelStyleBertVits2VoiceDownloadingState)
+    const [progress, setProgress] = useState<ProgressType>({
+        model_type: modelType,
+        rate: 0,
+        is_progress: false
+    })
+    useEffect(() => {
+        const unlisten = listen('downloadStyleBertVits2VoiceProgress', event => {
+            const p = event.payload as ProgressType
+            if (p.model_type !== modelType) return
+            setProgress(p)
+            if (!p.is_progress) {
+                // `is_progress === false` is treated as the end of the download: leave the "downloading" list...
+                setDownloadingModels(prev => prev.filter(m => m !== modelType))
+                // ...and join the "downloaded" list, without duplicating the entry if the event repeats.
+                setDownloadedModel(prev => prev.some(m => m === modelType) ? prev : [...prev, modelType])
+            }
+        })
+        return () => {
+            // `listen` resolves to the unlisten function; call it once it is available.
+            unlisten.then(f => f());
+        }
+        // Re-subscribe when the prop changes so the listener never filters on a stale `modelType`.
+    }, [modelType, setDownloadingModels, setDownloadedModel])
+    if (!downloadingModels.some(m => m === modelType)) {
+        return (<></>)
+    }
+    return (
+        <div className="w-full bg-gray-200 rounded-full dark:bg-gray-700">
+            <div className="bg-blue-600 text-xs font-medium text-blue-100 text-center p-0.5 leading-none rounded-full" style={{ width: `${progress.rate}%` }}>{`${progress.rate}%`}</div>
+        </div>
+    )
+}
+
+export { ModelDownloadStyleBertVits2VoiceProgress }
\ No newline at end of file
diff --git a/src/components/molecules/MyMarkdown.tsx b/src/components/molecules/MyMarkdown.tsx
index c6bf412..329c2ae 100644
--- a/src/components/molecules/MyMarkdown.tsx
+++ b/src/components/molecules/MyMarkdown.tsx
@@ -25,6 +25,9 @@ const MyMarkdown = (props: MyMarkdownProps) => {
 
     const [contents, setContents] = useState<string[]>([]);
 
+    const [isTableSelected, setIsTableSelected] = useState(false);
+    const [tableId, setTableId] = useState(0);
+
     const [isTextSelected, setIsTextSelected] = useState(false);
     const [textSelected, setTextSelected] = useState("");
     const handleMouseDown = (e: MouseEvent) => {
@@ -49,18 +52,34 @@ const MyMarkdown = (props: MyMarkdownProps) => {
         clipboard.writeText(contents[elementId]);
     }
     const handleImage = async (type: "copy" | "download") => {
-        const target = rootRef.current?.querySelectorAll("pre code")[elementId] as HTMLElement;
-        const canvas = await html2canvas(target,
-            {
-                backgroundColor: null,
-                onclone: (_, element) => {
-                    element.style.setProperty("overflow-x", "unset");
-                    element.style.setProperty("width", "fit-content");
-                    if (!target.className.includes("mermaid")) {
-                        element.style.backgroundColor = "#1a2638";
-                    }
-                }
-            });
+        const target = (() => {
+            if (isTableSelected) return rootRef.current?.querySelectorAll("table")[tableId] as HTMLElement;
+            return rootRef.current?.querySelectorAll("pre code")[elementId] as HTMLElement;
+        })();
+        const canvas = await (async () => {
+            if (isTableSelected) {
+                return await html2canvas(target,
+                    {
+                        backgroundColor: null,
+                        onclone: (_, element) => {
+                            element.style.setProperty("overflow-x", "unset");
+                            element.style.setProperty("width", "fit-content");
+                        }
+                    });
+            } else {
+                return await html2canvas(target,
+                    {
+                        backgroundColor: null,
+                        onclone: (_, element) => {
+                            element.style.setProperty("overflow-x", "unset");
+                            if (!target.className.includes("mermaid")) {
+                                element.style.backgroundColor = "#1a2638";
+                                element.style.width = "unset";
+                            }
+                        }
+                    });
+            }
+        })();
         if (type === "download") {
             const blob = await new Promise<Blob>((resolve) => {
                 canvas.toBlob((blob) => {
@@ -90,11 +109,13 @@ const MyMarkdown = (props: MyMarkdownProps) => {
                 block.classList.add("hover:border-base-300", "border-2", "border-transparent", "rounded-lg", "cursor-pointer");
             } else {
                 hljs.highlightBlock(block as HTMLElement);
+                block.classList.add("cursor-pointer", "w-full");
             }
 
             const handleContextMenu = (e: MouseEvent) => {
                 e.preventDefault();
                 setAnchorPoint({ x: e.clientX, y: e.clientY });
+                setIsTableSelected(false);
                 setElementId(index);
                 setOpen(true);
             };
@@ -103,6 +124,21 @@ const MyMarkdown = (props: MyMarkdownProps) => {
             listeners.set(block, ['contextmenu', handleContextMenu]);
         });
 
+        rootRef.current?.querySelectorAll('table').forEach(async (block, index) => {
+            block.classList.add("hover:border-base-300", "border-2", "border-transparent", "rounded-lg", "cursor-pointer", "!w-fit");
+
+            const handleContextMenu = (e: MouseEvent) => {
+                e.preventDefault();
+                setAnchorPoint({ x: e.clientX, y: e.clientY });
+                setIsTableSelected(true);
+                setTableId(index);
+                setOpen(true);
+            };
+
+            (block as HTMLElement).addEventListener('contextmenu', handleContextMenu);
+            listeners.set(block, ['contextmenu', handleContextMenu]);
+        });
+
         return () => {
             listeners.forEach(([event, listener], block) => {
                 (block as HTMLElement).removeEventListener(event, listener);
@@ -135,20 +171,31 @@ const MyMarkdown = (props: MyMarkdownProps) => {
                             <p className='pl-2'>コピー</p>
                         </MenuItem>
                     </> :
-                    <>
-                        <MenuItem onClick={handleText}>
-                            <PaperClip />
-                            <p className='pl-2'>全体をコピー</p>
-                        </MenuItem>
-                        <MenuItem onClick={() => handleImage("copy")}>
-                            <PaperClip />
-                            <p className='pl-2'>画像としてコピー</p>
-                        </MenuItem>
-                        <MenuItem onClick={() => handleImage("download")}>
-                            <Download />
-                            <p className='pl-2'>画像としてダウンロード</p>
-                        </MenuItem>
-                    </>}
+                    isTableSelected ?
+                        <>
+                            <MenuItem onClick={() => handleImage("copy")}>
+                                <PaperClip />
+                                <p className='pl-2'>画像としてコピー</p>
+                            </MenuItem>
+                            <MenuItem onClick={() => handleImage("download")}>
+                                <Download />
+                                <p className='pl-2'>画像としてダウンロード</p>
+                            </MenuItem>
+                        </> :
+                        <>
+                            <MenuItem onClick={handleText}>
+                                <PaperClip />
+                                <p className='pl-2'>全体をコピー</p>
+                            </MenuItem>
+                            <MenuItem onClick={() => handleImage("copy")}>
+                                <PaperClip />
+                                <p className='pl-2'>画像としてコピー</p>
+                            </MenuItem>
+                            <MenuItem onClick={() => handleImage("download")}>
+                                <Download />
+                                <p className='pl-2'>画像としてダウンロード</p>
+                            </MenuItem>
+                        </>}
             </ControlledMenu>
         </div>
     )
diff --git a/src/components/molecules/Screenshot.tsx b/src/components/molecules/Screenshot.tsx
index 46d42c0..56c86f1 100644
--- a/src/components/molecules/Screenshot.tsx
+++ b/src/components/molecules/Screenshot.tsx
@@ -14,7 +14,12 @@ const Screenshot = (props: ScreenshotProps): JSX.Element => {
             <div className="w-16 pl-2 flex-none">{date}</div>
             <div className="pr-2 pb-4 ml-5">
                 <Zoom>
-                    <img className="w-2/3" src={convertFileSrc(content)} alt="screenshot" />
+                    <img
+                        alt="screenshot"
+                        src={convertFileSrc(content)}
+                        height="500"
+                        width="500"
+                        />
                 </Zoom>
             </div>
         </div>
diff --git a/src/components/molecules/SettingFCfunctionCall.tsx b/src/components/molecules/SettingFCfunctionCall.tsx
index 36ff534..118fd5d 100644
--- a/src/components/molecules/SettingFCfunctionCall.tsx
+++ b/src/components/molecules/SettingFCfunctionCall.tsx
@@ -14,7 +14,7 @@ const SettingFCfunctionCall = (): JSX.Element => {
             <p className="w-[12rem]">Function Calling<br />(function_call)</p>
             <div className="flex flex-col w-full">
                 <div className="flex flex-col ml-2.5 mb-2">
-                    <p className="font-medium">AIからの返答に利用する関数を選択</p>
+                    <p className="font-medium">アシスタントからの返答に利用する関数を選択</p>
                     <p>無指定では、必要なときのみ関数が実行されます</p>
                     <p>必ず実行する場合は、関数名を指定してください</p>
                 </div>
diff --git a/src/components/molecules/SettingFCfunctions.tsx b/src/components/molecules/SettingFCfunctions.tsx
index 6bb8ecf..287b668 100644
--- a/src/components/molecules/SettingFCfunctions.tsx
+++ b/src/components/molecules/SettingFCfunctions.tsx
@@ -14,7 +14,7 @@ const SettingFCfunctions = (): JSX.Element => {
             <p className="w-[12rem]">Function Calling<br />(functions)</p>
             <div className="flex flex-col w-full">
                 <div className="flex flex-col ml-2.5 mb-2">
-                    <p className="font-medium">AIからの返答に利用する関数一覧</p>
+                    <p className="font-medium">アシスタントからの返答に利用する関数一覧</p>
                 </div>
                 <textarea rows={16} placeholder='[&#13;    {&#13;        "name": "functionA_name",&#13;        "description": "functionA_description",&#13;        "parameters": {&#13;            "type": "object",&#13;            "properties": {&#13;                "sample": {&#13;                    "type": "string",&#13;                    "description": "sample property description"&#13;                }&#13;            },&#13;            "required": ["sample"]&#13;        }&#13;    }&#13;]' className="p-2.5 h-full rounded-2xl input input-bordered focus:outline-none" value={settingKey} onChange={change} />
             </div>
diff --git a/src/components/molecules/SettingHook.tsx b/src/components/molecules/SettingHook.tsx
index a9ffee8..fada233 100644
--- a/src/components/molecules/SettingHook.tsx
+++ b/src/components/molecules/SettingHook.tsx
@@ -14,10 +14,10 @@ const SettingHook = (): JSX.Element => {
             <p className="w-[12rem]">CLI Hook</p>
             <div className="flex flex-col w-full">
                 <div className="flex flex-col ml-2.5 mb-2">
-                    <p className="font-medium mb-2">ターミナルで任意のコマンドを実行（AI実行後）</p>
+                    <p className="font-medium mb-2">ターミナルで任意のコマンドを実行（アシスタント返答後）</p>
                     <p>ユーザーの入力を、{"{{question}}"}</p>
                     <p>CLI Resourceを、{"{{resource}}"}</p>
-                    <p>AIからの返答を、{"{{answer}}"}、として利用可能</p>
+                    <p>アシスタントからの返答を、{"{{answer}}"}、として利用可能</p>
                 </div>
                 <textarea rows={3} placeholder='echo "{{question}} > {{answer}}" > ~/Desktop/sample.txt' className="p-2.5 h-full rounded-2xl input input-bordered focus:outline-none flex-1" value={settingKey} onChange={change} onKeyDown={e => { if (e.key === 'Enter') { e.preventDefault(); } }} />
             </div>
diff --git a/src/components/molecules/SettingProcesses.tsx b/src/components/molecules/SettingProcesses.tsx
index 6eaa38e..e6cde0d 100644
--- a/src/components/molecules/SettingProcesses.tsx
+++ b/src/components/molecules/SettingProcesses.tsx
@@ -3,7 +3,7 @@ import { useRecoilState } from 'recoil';
 import { settingProcessState } from "../../store/atoms/settingProcessState";
 
 const SettingProcesses = (): JSX.Element => {
-    const settingProcesses = ["文字起こし", "翻訳"]
+    const settingProcesses = ["文字起こし（汎用）", "文字起こし（言語特化）", "翻訳（18言語⇒日本語）", "翻訳（日本語⇒英語）", "翻訳（日本語⇔英語）"]
     const [settingProcess, setSettingProcess] = useRecoilState(settingProcessState)
 
     const change = (e: ChangeEvent<HTMLSelectElement>) => {
@@ -12,7 +12,7 @@ const SettingProcesses = (): JSX.Element => {
     }
 
     return (
-        <select className="select focus:outline-none pl-1 pr-0 w-32" name="processes" onChange={change} >
+        <select className="select focus:outline-none pl-1 pr-0 w-44" name="processes" onChange={change} >
             {settingProcesses?.map((process, i) => (
                 <option key={"setting-process" + i} value={process} selected={process === settingProcess}>{process}</option>
             ))}
diff --git a/src/components/molecules/SettingResource.tsx b/src/components/molecules/SettingResource.tsx
index 459ea39..22394e6 100644
--- a/src/components/molecules/SettingResource.tsx
+++ b/src/components/molecules/SettingResource.tsx
@@ -14,7 +14,7 @@ const SettingResource = (): JSX.Element => {
             <p className="w-[12rem]">CLI Resource</p>
             <div className="flex flex-col w-full">
                 <div className="flex flex-col ml-2.5 mb-2">
-                    <p className="font-medium mb-2">ターミナルで任意のコマンドを実行（AI実行前）</p>
+                    <p className="font-medium mb-2">ターミナルで任意のコマンドを実行（アシスタント返答前）</p>
                     <p>ユーザーの入力を、{"{{question}}"}、として利用可能</p>
                 </div>
                 <textarea rows={3} placeholder='curl -s "https://example.com/latest?query={{question}}"' className="p-2.5 h-full rounded-2xl input input-bordered focus:outline-none" value={settingKey} onChange={change} onKeyDown={e => { if (e.key === 'Enter') { e.preventDefault(); } }} />
diff --git a/src/components/molecules/SettingTemplate.tsx b/src/components/molecules/SettingTemplate.tsx
index 2eae29b..d6550fc 100644
--- a/src/components/molecules/SettingTemplate.tsx
+++ b/src/components/molecules/SettingTemplate.tsx
@@ -14,7 +14,7 @@ const SettingTemplate = (): JSX.Element => {
             <p className="w-[12rem]">システム ロール</p>
             <div className="flex flex-col w-full">
                 <div className="flex flex-col ml-2.5 mb-2">
-                    <p className="font-medium mb-2">AIへの役割設定</p>
+                    <p className="font-medium mb-2">アシスタントへの役割設定</p>
                     <p>ユーザーの入力を、{"{{question}}"}</p>
                     <p>CLI Resourceを、{"{{resource}}"}、として利用可能</p>
                 </div>
diff --git a/src/components/molecules/SettingVoices.tsx b/src/components/molecules/SettingVoices.tsx
new file mode 100644
index 0000000..57b9e39
--- /dev/null
+++ b/src/components/molecules/SettingVoices.tsx
@@ -0,0 +1,23 @@
+import { ChangeEvent } from "react";
+import { useRecoilState } from 'recoil';
+import { settingVoiceState } from "../../store/atoms/settingVoiceState";
+
+// Dropdown for choosing one of the voice options; the choice lives in the settingVoiceState Recoil atom.
+const SettingVoices = (): JSX.Element => {
+    const settingVoices = ["JVNV", "つくよみちゃん", "小春音アミ・あみたろ", "カスタマイズ"]
+    const [settingVoice, setSettingVoice] = useRecoilState(settingVoiceState)
+
+    // Store the newly chosen option in the atom.
+    const change = (e: ChangeEvent<HTMLSelectElement>) => setSettingVoice(e.target.value)
+
+    return (
+        // Controlled <select>: React expects `value` on the select rather than `selected` on each <option>.
+        <select className="select focus:outline-none pl-1 pr-0 w-44" name="voices" value={settingVoice} onChange={change} >
+            {settingVoices.map(voice => (
+                <option key={"setting-voice_" + voice} value={voice}>{voice}</option>
+            ))}
+        </select>
+    )
+}
+
+export { SettingVoices }
diff --git a/src/components/molecules/SmartVoice.tsx b/src/components/molecules/SmartVoice.tsx
new file mode 100644
index 0000000..a772b7b
--- /dev/null
+++ b/src/components/molecules/SmartVoice.tsx
@@ -0,0 +1,169 @@
+import { ChangeEvent, useEffect, useRef, useState } from "react";
+import { useRecoilState } from 'recoil';
+import { lengthScaleState } from "../../store/atoms/smartVoices/lengthScaleState";
+import { sdpRatioState } from "../../store/atoms/smartVoices/sdpRatioState";
+import { smartVoiceState } from "../../store/atoms/smartVoices/smartVoiceState";
+import { invoke } from "@tauri-apps/api";
+
+const SmartVoice = (): JSX.Element => {
+    const [models, setModels] = useState([] as string[])
+    const [toggle, setToggle] = useState(false)
+    useEffect(() => {
+        invoke('list_synthesize_models_command').then(models => setModels(models as string[]))
+    }, [toggle])
+    const defaultModels = ["jvnv-F1-jp", "jvnv-F2-jp", "jvnv-M1-jp", "jvnv-M2-jp", "tsukuyomi-chan", "koharune-ami", "amitaro"]
+    const [lengthScale, setLengthScale] = useRecoilState(lengthScaleState)
+    const [sdpRatio, setSdpRatio] = useRecoilState(sdpRatioState)
+    const [selectedModel, setSelectedModel] = useRecoilState(smartVoiceState)
+    const [isLoading, setIsLoading] = useState(false)
+
+    const dropdownRef = useRef<HTMLLabelElement>(null)
+
+    // Radio handler for the model list. "off" invokes synthesize_finalize_command; any other
+    // value invokes synthesize_init_command with that model. The selection is stored only
+    // after the command resolves, and isLoading is raised for the duration of the call.
+    const change = (e: ChangeEvent<HTMLInputElement>) => {
+        dropdownRef.current?.focus();
+        if (!e.target.checked) return;
+
+        const value = e.target.value
+        setIsLoading(true)
+        const request = value === "off"
+            ? invoke('synthesize_finalize_command')
+            : invoke('synthesize_init_command', { model: value })
+        request
+            .then(() => setSelectedModel(value))
+            // Report a failed command instead of leaving an unhandled rejection.
+            .catch(error => console.error('Failed to switch smart voice model:', error))
+            // Always clear the flag: without this a rejected command would leave every
+            // model radio disabled and the loading placeholder on screen.
+            .finally(() => setIsLoading(false))
+    }
+
+    // On label mouse-down: flip `toggle` (re-runs the model-list effect) and blur the label if it is already focused.
+    const checkAndCloseDropDown = (target: EventTarget & HTMLLabelElement) => {
+        setToggle(!toggle)
+        const alreadyFocused = target?.matches(':focus')
+        if (alreadyFocused) setTimeout(() => target.blur(), 0);
+    }
+
+    // Converts a model identifier into the label shown in the dropdown.
+    // Identifiers without an entry in the table are returned unchanged,
+    // so models the table does not know about are listed under their own name.
+    const mapModel = (model: string) => {
+        // A Map rather than a plain object, so only the identifiers listed
+        // here can match (no accidental hits on inherited property names).
+        const labels = new Map<string, string>([
+            ["off", "オフ"],
+            ["jvnv-F1-jp", "女性1"],
+            ["jvnv-F2-jp", "女性2"],
+            ["jvnv-M1-jp", "男性1"],
+            ["jvnv-M2-jp", "男性2"],
+            ["tsukuyomi-chan", "つくよみちゃん"],
+            ["koharune-ami", "小春音アミ"],
+            ["amitaro", "あみたろ"],
+        ])
+        const label = labels.get(model)
+        if (label === undefined) {
+            return model;
+        }
+        return label;
+    }
+
+    return (
+        <div className="dropdown">
+            <label ref={dropdownRef} onMouseDown={e => checkAndCloseDropDown(e.currentTarget)} tabIndex={0} className="group normal-case btn w-52 flex justify-between" style={{ color: "inherit", backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }} >
+                <div className="w-36 text-left overflow-x-hidden whitespace-nowrap text-ellipsis">{selectedModel === null ? "スマート読み上げ" : mapModel(selectedModel)}</div>
+                <div>
+                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                        <path fillRule="evenodd" d="M5.22 8.22a.75.75 0 0 1 1.06 0L10 11.94l3.72-3.72a.75.75 0 1 1 1.06 1.06l-4.25 4.25a.75.75 0 0 1-1.06 0L5.22 9.28a.75.75 0 0 1 0-1.06Z" clipRule="evenodd" />
+                    </svg>
+                </div>
+                <div className="opacity-0 w-28 invisible rounded text-[12px] 
+                        font-bold text-white py-1 bg-slate-600 top-12 left-4
+                        group-hover:visible opacity-100 absolute ">スマート読み上げ
+                </div>
+            </label>
+            <ul tabIndex={0} className="dropdown-content menu rounded-box w-60"
+                style={{ backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
+            >
+                <ul className="max-h-56 overflow-y-scroll rounded-box scrollbar-transparent" style={selectedModel !== "off" || (isLoading && selectedModel === "off") ? { paddingBottom: "0.5rem" } : {}}>
+                    {/* "off" shares the voice-option group name with the model radios so they behave as one radio group. */}
+                    <li key="transcription-accuracy_off">
+                        <label className="label inline-flex active:!bg-inherit">
+                            <input type="radio" name="voice-option" className="radio radio-accent" onChange={change} value="off" checked={selectedModel === "off"} />
+                            <a className="grow">オフ</a>
+                        </label>
+                    </li>
+                    {models.length > 0 && <>
+                        {/* The section heading is rendered outside map() so that every element map() returns is a keyed <li>; */}
+                        {/* wrapping heading + item in a keyless fragment made React report a missing "key" for each entry. */}
+                        {/* Models named in defaultModels, ordered with localeCompare('ja'). */}
+                        {models.some(m => defaultModels.includes(m)) && <>
+                            <hr className="my-2" />
+                            <div className="flex justify-center sticky top-0 z-10 w-full mb-2" style={{ backgroundColor: "hsl(24 33% 97%)" }}>
+                                <p className="text-xs text-gray-400">デフォルト</p>
+                            </div>
+                        </>}
+                        {models
+                            .filter(m => defaultModels.includes(m))
+                            .sort((a, b) => a.localeCompare(b, 'ja'))
+                            .map((model, i) => (
+                                <li key={"smart-voice_" + i}>
+                                    <label className="label inline-flex active:!bg-inherit">
+                                        <input disabled={isLoading} type="radio" name="voice-option" className="radio radio-accent" onChange={change} value={model} checked={model === selectedModel} />
+                                        <a className="grow">{mapModel(model)}</a>
+                                    </label>
+                                </li>
+                            ))
+                        }
+                        {/* Every other model, listed under カスタマイズ with the same ordering. */}
+                        {/* As above, the heading only appears when this group has at least one entry. */}
+                        {models.some(m => !defaultModels.includes(m)) && <>
+                            <hr className="my-2" />
+                            <div className="flex justify-center sticky top-0 z-10 w-full mb-2" style={{ backgroundColor: "hsl(24 33% 97%)" }}>
+                                <p className="text-xs text-gray-400">カスタマイズ</p>
+                            </div>
+                        </>}
+                        {models
+                            .filter(m => !defaultModels.includes(m))
+                            .sort((a, b) => a.localeCompare(b, 'ja'))
+                            .map((model, i) => (
+                                <li key={"smart-voice-custom_" + i}>
+                                    <label className="label inline-flex active:!bg-inherit">
+                                        <input disabled={isLoading} type="radio" name="voice-option" className="radio radio-accent" onChange={change} value={model} checked={model === selectedModel} />
+                                        <a className="grow">{mapModel(model)}</a>
+                                    </label>
+                                </li>
+                            ))
+                        }
+                    </>}
+                </ul>
+                {/* Sliders bound to lengthScale (話速) and sdpRatio (抑揚); hidden while "off" is selected or a switch is loading. */}
+                {selectedModel !== "off" && !isLoading &&
+                    <div className="bg-base-200 rounded-lg h-28 flex flex-col justify-center">
+                        <label className="cursor-pointer label flex-col items-start">
+                            <span className="label-text">話速：{lengthScale === 1 ? "1（デフォルト）" : lengthScale}</span>
+                            <input type="range" min={0.1} max={2.0} step={0.1} value={lengthScale} className="range range-warning range-xs" onChange={e => setLengthScale(parseFloat(e.target.value))} />
+                        </label>
+                        <label className="cursor-pointer label flex-col items-start">
+                            <span className="label-text">抑揚：{sdpRatio === 0.2 ? "0.2（デフォルト）" : sdpRatio}</span>
+                            <input type="range" min={0} max={1.0} step={0.1} value={sdpRatio} className="range range-warning range-xs" onChange={e => setSdpRatio(parseFloat(e.target.value))} />
+                        </label>
+                    </div>
+                }
+                {/* Pulsing placeholder shown in place of the sliders while isLoading is true. */}
+                {isLoading &&
+                    <div className="bg-base-200 rounded-lg h-28 flex flex-col justify-center">
+                        <div className="flex items-center justify-center h-full bg-gray-200 rounded-lg animate-pulse">
+                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-10">
+                                <path d="M10 3.75a2 2 0 1 0-4 0 2 2 0 0 0 4 0ZM17.25 4.5a.75.75 0 0 0 0-1.5h-5.5a.75.75 0 0 0 0 1.5h5.5ZM5 3.75a.75.75 0 0 1-.75.75h-1.5a.75.75 0 0 1 0-1.5h1.5a.75.75 0 0 1 .75.75ZM4.25 17a.75.75 0 0 0 0-1.5h-1.5a.75.75 0 0 0 0 1.5h1.5ZM17.25 17a.75.75 0 0 0 0-1.5h-5.5a.75.75 0 0 0 0 1.5h5.5ZM9 10a.75.75 0 0 1-.75.75h-5.5a.75.75 0 0 1 0-1.5h5.5A.75.75 0 0 1 9 10ZM17.25 10.75a.75.75 0 0 0 0-1.5h-1.5a.75.75 0 0 0 0 1.5h1.5ZM14 10a2 2 0 1 0-4 0 2 2 0 0 0 4 0ZM10 16.25a2 2 0 1 0-4 0 2 2 0 0 0 4 0Z" />
+                            </svg>
+                        </div>
+                    </div>}
+            </ul>
+        </div >
+    )
+}
+
+export { SmartVoice }
diff --git a/src/components/molecules/SpeakerLanguage.tsx b/src/components/molecules/SpeakerLanguage.tsx
index b675611..d4b347c 100644
--- a/src/components/molecules/SpeakerLanguage.tsx
+++ b/src/components/molecules/SpeakerLanguage.tsx
@@ -114,26 +114,43 @@ const SpeakerLanguage = (): JSX.Element => {
             <ul tabIndex={0} className="dropdown-content menu rounded-box w-52"
                 style={{ backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
             >
-                {downloadedModels.length > 0 && <ul className="max-h-56 overflow-y-scroll rounded-box scrollbar-transparent">
-                    {downloadedModels.filter(model => model.startsWith("small")).length > 0 && downloadedModels.filter(model => !model.startsWith("small")).length > 0 && <p className="text-sm ml-2 mb-2">通常</p>}
-                    {downloadedModels.filter(model => !model.startsWith("small")).map((model, i) => (
-                        <li key={"speaker-language_" + i}>
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="language-option" className="radio radio-accent" onChange={change} value={model} checked={model === speakerLanguage} />
-                                <a className="grow">{mapModel(model)}</a>
-                            </label>
-                        </li>
-                    ))}
-                    {downloadedModels.filter(model => model.startsWith("small")).length > 0 && downloadedModels.filter(model => !model.startsWith("small")).length > 0 && <><hr className="mt-2" /><p className="text-sm ml-2 my-2">ライト</p></>}
-                    {downloadedModels.filter(model => model.startsWith("small")).map((model, i) => (
-                        <li key={"speaker-language_" + i}>
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="language-option" className="radio radio-accent" onChange={change} value={model} checked={model === speakerLanguage} />
-                                <a className="grow">{mapModel(model)}</a>
-                            </label>
-                        </li>
-                    ))}
-                </ul>}
+                {downloadedModels.length > 0 &&
+                    <ul className="max-h-56 overflow-y-scroll rounded-box scrollbar-transparent">
+                        {downloadedModels.filter(model => model.startsWith("small")).length > 0 && downloadedModels.filter(model => !model.startsWith("small")).length > 0 &&
+                            <p className="text-sm ml-2 my-2 flex items-center">
+                                <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                    <path fillRule="evenodd" d="M7.487 2.89a.75.75 0 1 0-1.474-.28l-.455 2.388H3.61a.75.75 0 0 0 0 1.5h1.663l-.571 2.998H2.75a.75.75 0 0 0 0 1.5h1.666l-.403 2.114a.75.75 0 0 0 1.474.28l.456-2.394h2.973l-.403 2.114a.75.75 0 0 0 1.474.28l.456-2.394h1.947a.75.75 0 0 0 0-1.5h-1.661l.57-2.998h1.95a.75.75 0 0 0 0-1.5h-1.664l.402-2.108a.75.75 0 0 0-1.474-.28l-.455 2.388H7.085l.402-2.108ZM6.8 6.498l-.571 2.998h2.973l.57-2.998H6.8Z" clipRule="evenodd" />
+                                </svg>
+                                通常
+                            </p>
+                        }
+                        {downloadedModels.filter(model => !model.startsWith("small")).map((model, i) => (
+                            <li key={"speaker-language_" + i}>
+                                <label className="label inline-flex active:!bg-inherit">
+                                    <input type="radio" name="language-option" className="radio radio-accent" onChange={change} value={model} checked={model === speakerLanguage} />
+                                    <a className="grow">{mapModel(model)}</a>
+                                </label>
+                            </li>
+                        ))}
+                        {downloadedModels.filter(model => model.startsWith("small")).length > 0 && downloadedModels.filter(model => !model.startsWith("small")).length > 0 &&
+                            <>
+                                <hr className="mt-2" />
+                                <p className="text-sm ml-2 my-2 flex items-center">
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                        <path fillRule="evenodd" d="M7.487 2.89a.75.75 0 1 0-1.474-.28l-.455 2.388H3.61a.75.75 0 0 0 0 1.5h1.663l-.571 2.998H2.75a.75.75 0 0 0 0 1.5h1.666l-.403 2.114a.75.75 0 0 0 1.474.28l.456-2.394h2.973l-.403 2.114a.75.75 0 0 0 1.474.28l.456-2.394h1.947a.75.75 0 0 0 0-1.5h-1.661l.57-2.998h1.95a.75.75 0 0 0 0-1.5h-1.664l.402-2.108a.75.75 0 0 0-1.474-.28l-.455 2.388H7.085l.402-2.108ZM6.8 6.498l-.571 2.998h2.973l.57-2.998H6.8Z" clipRule="evenodd" />
+                                    </svg>
+                                    ライト
+                                </p>
+                            </>}
+                        {downloadedModels.filter(model => model.startsWith("small")).map((model, i) => (
+                            <li key={"speaker-language_" + i}>
+                                <label className="label inline-flex active:!bg-inherit">
+                                    <input type="radio" name="language-option" className="radio radio-accent" onChange={change} value={model} checked={model === speakerLanguage} />
+                                    <a className="grow">{mapModel(model)}</a>
+                                </label>
+                            </li>
+                        ))}
+                    </ul>}
             </ul>
         </div>
     )
diff --git a/src/components/molecules/SpeechHistory.tsx b/src/components/molecules/SpeechHistory.tsx
index 93f7942..1fb0ff8 100644
--- a/src/components/molecules/SpeechHistory.tsx
+++ b/src/components/molecules/SpeechHistory.tsx
@@ -7,13 +7,16 @@ import { Screenshot } from './Screenshot'
 import { MyMarkdown } from './MyMarkdown'
 import 'zenn-content-css';
 import { selectedNoteState } from '../../store/atoms/selectedNoteState'
+import { useState } from 'react'
+import { SuggestCard } from './SuggestCard'
 
 type SpeechHistoryProps = {
     histories: SpeechHistoryType[]
+    setHistories: (valOrUpdater: SpeechHistoryType[] | ((currVal: SpeechHistoryType[]) => SpeechHistoryType[])) => void
 }
 
 const SpeechHistory = (props: SpeechHistoryProps): JSX.Element => {
-    const { histories = [] } = props
+    const { histories = [], setHistories } = props
     const filterTarget = useRecoilValue(speechFilterState)
     const filterdHistories = histories.filter(
         h => {
@@ -31,6 +34,7 @@ const SpeechHistory = (props: SpeechHistoryProps): JSX.Element => {
         }
     );
     const selectedNote = useRecoilValue(selectedNoteState)
+    const [editMemoId, setEditMemoId] = useState<number | null>(null)
 
     return (
         <div>
@@ -50,8 +54,11 @@ const SpeechHistory = (props: SpeechHistoryProps): JSX.Element => {
                             {c.speech_type === "memo"
                                 && <div className='flex py-1' key={"memo_" + i}>
                                     <div className="w-16 pl-2 flex-none">{date}</div>
-                                    <div className="flex flex-col items-start ml-5" >
-                                        <MyMarkdown content={c.content} title={`${selectedNote?.note_title.trim()}_memo_${i}`} />
+                                    <div className="flex flex-col items-start ml-5 cursor-pointer hover:border-base-300 border-2 border-transparent rounded-lg"
+                                        onDoubleClick={(e) => { e.preventDefault(); setEditMemoId(i); }}>
+                                        {editMemoId === null || editMemoId !== i ?
+                                            <MyMarkdown content={c.content} title={`${selectedNote?.note_title.trim()}_memo_${i}`} />
+                                            : <textarea rows={c.content.split("\n").length} value={c.content} autoFocus onBlur={() => { setEditMemoId(null) }} />}
                                     </div>
                                 </div>}
                             {
@@ -60,20 +67,46 @@ const SpeechHistory = (props: SpeechHistoryProps): JSX.Element => {
                                     <div className="w-16 pl-2 flex-none">{date}</div>
                                     <div className="card w-4/5 bg-base-200 shadow-xl ml-5">
                                         <div className="card-body">
-                                            <div className="chat chat-start">
-                                                <div className="flex chat-bubble bg-white text-slate-500">
-                                                    <MyMarkdown content={c.content} title={`${selectedNote?.note_title.trim()}_action-start_${i}`} />
+                                            {c.action_type === "chat" &&
+                                                <>
+                                                    <div className="chat chat-start">
+                                                        <div className="flex chat-bubble bg-white text-slate-500">
+                                                            <MyMarkdown content={c.content} title={`${selectedNote?.note_title.trim()}_action-start_${i}`} />
+                                                        </div>
+                                                    </div>
+                                                    <div className="chat chat-end">
+                                                        <div className="flex chat-bubble bg-white text-slate-500 py-5 w-full">
+                                                            {c.content_2 ?
+                                                                <MyMarkdown content={c.content_2} title={`${selectedNote?.note_title.trim()}_action-end_${i}`} />
+                                                                :
+                                                                <span className="loading loading-dots loading-sm"></span>
+                                                            }
+                                                        </div>
+                                                    </div>
+                                                </>
+                                            }
+                                            {c.action_type === "suggest" &&
+                                                <div className="chat chat-start">
+                                                    <div className="flex chat-bubble bg-white text-slate-500">
+                                                        {c.content_2 ?
+                                                            <SuggestCard
+                                                                id={c.id!}
+                                                                active={c.content}
+                                                                suggestions={c.content_2}
+                                                                update={
+                                                                    (id, active) => {
+                                                                        setHistories((prev) => {
+                                                                            return prev.map(h => {
+                                                                                if (h.id === id) { return { ...h, content: active } } else { return h }
+                                                                            })
+                                                                        })
+                                                                    }} />
+                                                            :
+                                                            <span className="loading loading-dots loading-sm"></span>
+                                                        }
+                                                    </div>
                                                 </div>
-                                            </div>
-                                            <div className="chat chat-end">
-                                                <div className="flex chat-bubble bg-white text-slate-500 py-5 w-full">
-                                                    {c.content_2 ?
-                                                        <MyMarkdown content={c.content_2} title={`${selectedNote?.note_title.trim()}_action-end_${i}`} />
-                                                        :
-                                                        <span className="loading loading-dots loading-sm"></span>
-                                                    }
-                                                </div>
-                                            </div>
+                                            }
                                         </div>
                                     </div>
                                 </div>
diff --git a/src/components/molecules/SuggestCard.tsx b/src/components/molecules/SuggestCard.tsx
new file mode 100644
index 0000000..4a49a4c
--- /dev/null
+++ b/src/components/molecules/SuggestCard.tsx
@@ -0,0 +1,181 @@
+import { invoke } from "@tauri-apps/api";
+import { useEffect, useRef, useState } from "react";
+import { useRecoilValue } from "recoil";
+import { lengthScaleState } from "../../store/atoms/smartVoices/lengthScaleState";
+import { sdpRatioState } from "../../store/atoms/smartVoices/sdpRatioState";
+import { smartVoiceState } from "../../store/atoms/smartVoices/smartVoiceState";
+
+type SuggestCardProps = {
+    id: number,
+    active: string,
+    suggestions: string,
+    update: (id: number, active: string) => void
+}
+
+const SuggestCard = ({ id, active, suggestions, update }: SuggestCardProps) => {
+    const lengthScale = useRecoilValue(lengthScaleState)
+    const sdpRatio = useRecoilValue(sdpRatioState)
+    const selectedModel = useRecoilValue(smartVoiceState)
+
+    const obj = (() => {
+        try {
+            return JSON.parse(suggestions) as { [key in "neutral" | "positive" | "negative"]: { content: string, reason: string } }
+        } catch (e) {
+            return null;
+        }
+    })();
+    if (obj === null) {
+        return <div>発話サジェストに失敗しました。</div>
+    }
+    const { neutral, positive, negative } = obj;
+
+    const [audio, setAudio] = useState<string | null>(null)
+    const [isLoading, setIsLoading] = useState(false)
+    const audioRef = useRef<HTMLAudioElement>(null)
+    useEffect(() => {
+        return () => {
+            if (audio) {
+                URL.revokeObjectURL(audio);
+            }
+        };
+    }, [])
+    const synthesize = async (text: string) => {
+        if (!text.length) return;
+        setIsLoading(true);
+
+        invoke('synthesize_command', { text, sdpRatio, lengthScale })
+            .then(buffer => {
+                const res = new Blob([new Uint8Array(buffer as ArrayBufferLike)], { type: "audio/wav" });
+                setAudio((prev) => {
+                    if (prev !== null) URL.revokeObjectURL(prev);
+                    setIsLoading(false);
+                    return URL.createObjectURL(res)
+                });
+            });
+    };
+    const playAudio = async (e: React.MouseEvent<HTMLButtonElement>) => {
+        e.stopPropagation();
+        if (audioRef.current) {
+            try {
+                await audioRef.current.play();
+            } catch (error) {
+                console.error('Audio playback failed:', error);
+            }
+        }
+    }
+    type ActiveType = "neutral" | "positive" | "negative";
+    const activateCard = async (a: ActiveType) => {
+        if (active === a) return;
+        update(id, a);
+        if (selectedModel !== "off") {
+            const content =
+                a === "neutral" ? neutral.content :
+                    a === "positive" ? positive.content :
+                        negative.content;
+            await synthesize(content);
+        }
+    }
+    const isAudioLoading = (a: ActiveType) => {
+        return a === active && isLoading;
+    };
+
+    return (
+        <div className="suggest-card flex gap-2 my-3">
+            {audio && <audio className="hidden" controls src={audio} ref={audioRef}></audio>}
+            <div className={"mr-1 cursor-pointer h-full border border-solid border-neutral-300 rounded-md p-5 duration-200 hover:scale-105 hover:shadow hover:bg-white" + (active === "neutral" ? " scale-105 shadow mr-2" : " bg-base-100")}
+                onClick={async () => await activateCard("neutral")}>
+                <div className="flex flex-col gap-1">
+                    <div className="flex items-center justify-between mb-2">
+                        <p className="text-xs font-semibold">ニュートラル</p>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                            <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16ZM7 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S5.448 7 6 7s1 .672 1 1.5Zm5 0c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S10.448 7 11 7s1 .672 1 1.5Zm-6.5 5.5a.75.75 0 0 1 .75-.75h7.5a.75.75 0 0 1 0 1.5h-7.5a.75.75 0 0 1-.75-.75Z" clipRule="evenodd" />
+                        </svg>
+                    </div>
+                    <div>
+                        <p className="text-sm font-semibold">{neutral.content}</p>
+                        {selectedModel !== "off" && <div className="flex justify-center mt-2">
+                            {isAudioLoading("neutral") ?
+                                <span className="loading loading-spinner loading-md"></span>
+                                :
+                                <button className={"btn gap-2 glass border border-solid border-neutral-300 text-primary" + (active === "neutral" ? "" : " btn-disabled")} onClick={playAudio}>
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                        <path d="M6.3 2.84A1.5 1.5 0 0 0 4 4.11v11.78a1.5 1.5 0 0 0 2.3 1.27l9.344-5.891a1.5 1.5 0 0 0 0-2.538L6.3 2.841Z" />
+                                    </svg>
+                                    再生
+                                </button>
+                            }
+                        </div>}
+                        {active === "neutral" && <>
+                            <hr className="mb-4 mt-2" />
+                            <p className="text-xs font-medium">{neutral.reason}</p>
+                        </>}
+                    </div>
+                </div>
+            </div>
+
+            <div className={"mr-1 cursor-pointer h-full border border-solid border-neutral-300 rounded-md p-5 duration-200 hover:scale-105 hover:shadow hover:bg-white" + (active === "positive" ? " scale-105 shadow mr-3 ml-2" : " bg-base-100")}
+                onClick={async () => await activateCard("positive")}>
+                <div className="flex flex-col gap-1">
+                    <div className="flex items-center justify-between text-primary mb-2">
+                        <p className="text-xs font-semibold">ポジティブ</p>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                            <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16Zm3.536-4.464a.75.75 0 1 0-1.061-1.061 3.5 3.5 0 0 1-4.95 0 .75.75 0 0 0-1.06 1.06 5 5 0 0 0 7.07 0ZM9 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S7.448 7 8 7s1 .672 1 1.5Zm3 1.5c.552 0 1-.672 1-1.5S12.552 7 12 7s-1 .672-1 1.5.448 1.5 1 1.5Z" clipRule="evenodd" />
+                        </svg>
+                    </div>
+                    <div>
+                        <p className="text-sm font-semibold">{positive.content}</p>
+                        {selectedModel !== "off" && <div className="flex justify-center mt-2">
+                            {isAudioLoading("positive") ?
+                                <span className="loading loading-spinner loading-md"></span>
+                                :
+                                <button className={"btn gap-2 glass border border-solid border-neutral-300 text-primary" + (active === "positive" ? "" : " btn-disabled")} onClick={playAudio}>
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                        <path d="M6.3 2.84A1.5 1.5 0 0 0 4 4.11v11.78a1.5 1.5 0 0 0 2.3 1.27l9.344-5.891a1.5 1.5 0 0 0 0-2.538L6.3 2.841Z" />
+                                    </svg>
+                                    再生
+                                </button>
+                            }
+                        </div>}
+                        {active === "positive" && <>
+                            <hr className="mb-4 mt-2" />
+                            <p className="text-xs font-medium">{positive.reason}</p>
+                        </>}
+                    </div>
+                </div>
+            </div>
+
+            <div className={"cursor-pointer h-full border border-solid border-neutral-300 rounded-md p-5 duration-200 hover:scale-105 hover:shadow hover:bg-white" + (active === "negative" ? " scale-105 shadow ml-2" : " bg-base-100")}
+                onClick={async () => await activateCard("negative")}>
+                <div className="flex flex-col gap-1">
+                    <div className="flex items-center justify-between text-error mb-2">
+                        <p className="text-xs font-semibold">ネガティブ</p>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                            <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16Zm-3.536-3.475a.75.75 0 0 0 1.061 0 3.5 3.5 0 0 1 4.95 0 .75.75 0 1 0 1.06-1.06 5 5 0 0 0-7.07 0 .75.75 0 0 0 0 1.06ZM9 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S7.448 7 8 7s1 .672 1 1.5Zm3 1.5c.552 0 1-.672 1-1.5S12.552 7 12 7s-1 .672-1 1.5.448 1.5 1 1.5Z" clipRule="evenodd" />
+                        </svg>
+                    </div>
+                    <div>
+                        <p className="text-sm font-semibold">{negative.content}</p>
+                        {selectedModel !== "off" && <div className="flex justify-center mt-2">
+                            {isAudioLoading("negative") ?
+                                <span className="loading loading-spinner loading-md"></span>
+                                :
+                                <button className={"btn gap-2 glass border border-solid border-neutral-300 text-primary" + (active === "negative" ? "" : " btn-disabled")} onClick={playAudio}>
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                        <path d="M6.3 2.84A1.5 1.5 0 0 0 4 4.11v11.78a1.5 1.5 0 0 0 2.3 1.27l9.344-5.891a1.5 1.5 0 0 0 0-2.538L6.3 2.841Z" />
+                                    </svg>
+                                    再生
+                                </button>
+                            }
+                        </div>}
+                        {active === "negative" && <>
+                            <hr className="mb-4 mt-2" />
+                            <p className="text-xs font-medium">{negative.reason}</p>
+                        </>}
+                    </div>
+                </div>
+            </div>
+        </div>
+    )
+}
+
+export { SuggestCard }
diff --git a/src/components/molecules/TranscriptionAccuracy.tsx b/src/components/molecules/TranscriptionAccuracy.tsx
index c6322a9..d11ca5f 100644
--- a/src/components/molecules/TranscriptionAccuracy.tsx
+++ b/src/components/molecules/TranscriptionAccuracy.tsx
@@ -6,12 +6,14 @@ import { recordState } from "../../store/atoms/recordState";
 import { speakerLanguageState } from "../../store/atoms/speakerLanguageState";
 import { settingKeyState } from "../../store/atoms/settingKeyState";
 import { tracingState } from "../../store/atoms/tracingState";
-import { modelFugumtDownloadedState } from "../../store/atoms/modelFugumtDownloadedState";
+import { modelFugumtEnJaDownloadedState } from "../../store/atoms/modelFugumtEnJaDownloadedState";
+import { modelFugumtJaEnDownloadedState } from "../../store/atoms/modelFugumtJaEnDownloadedState";
 import { modelHonyaku13BDownloadedState } from "../../store/atoms/modelHonyaku13BDownloadedState";
 
 const TranscriptionAccuracy = (): JSX.Element => {
     const downloadedModels = useRecoilValue(modelWhisperDownloadedState)
-    const downloadedModelsFugumt = useRecoilValue(modelFugumtDownloadedState)
+    const downloadedModelsFugumtEnJa = useRecoilValue(modelFugumtEnJaDownloadedState)
+    const downloadedModelsFugumtJaEn = useRecoilValue(modelFugumtJaEnDownloadedState)
     const downloadedModelsHonyaku13B = useRecoilValue(modelHonyaku13BDownloadedState)
     const [transcriptionAccuracy, setTranscriptionAccuracy] = useRecoilState(transcriptionAccuracyState)
     const isRecording = useRecoilValue(recordState)
@@ -41,36 +43,47 @@ const TranscriptionAccuracy = (): JSX.Element => {
             case "off":
                 return "オフ";
             case "small":
-                return "文字起こし：低";
+                return "汎用パック（低精度）";
             case "medium":
-                return "文字起こし：中";
+                return "汎用パック（中精度）";
             case "large":
-                return "文字起こし：高";
+                return "汎用パック（高精度）";
+            case "large-turbo":
+                return "汎用パック（速度優先）";
             case "large-distil.en":
+                return "英語パック";
             case "large-distil.ja":
-                return "文字起こし：速度優先";
+                return "日本語パック";
+            case "large-distil.bilingual":
+                return "バイリンガルパック";
             case "online-transcript":
-                return "文字起こし：WhisperAPI";
+                return "Whisper";
             case "online-transcript-to-en":
-                return "翻訳（英）：WhisperAPI";
+                return "Whisper";
             case "online-amivoice":
-                return "文字起こし：AmiVoiceAPI";
+                return "AmiVoice";
             case "online-chat":
-                return "AI：ChatGPT";
+                return "ChatGPT";
             case "small-translate-to-en":
-                return "翻訳（英）：低";
+                return "汎用パック（低精度）";
             case "medium-translate-to-en":
-                return "翻訳（英）：中";
+                return "汎用パック（中精度）";
             case "large-translate-to-en":
-                return "翻訳（英）：高";
+                return "汎用パック（高精度）";
+            case "large-turbo-translate-to-en":
+                return "汎用パック（速度優先）";
             case "fugumt-en-ja":
-                return "翻訳（日）：速度優先";
-            case "honyaku13b-q4-0":
-                return "翻訳（日）：精度優先";
+                return "日本語パック（標準）";
+            case "fugumt-ja-en":
+                return "英語パック（標準）";
+            case "honyaku-13b":
+                return "日本語パック（精度優先）";
             default:
                 throw new Error("unknown modelType: " + model);
         }
     }
+    const transcriptionModels = ["small", "medium", "large", "large-turbo"];
+    const targetedTranscriptionModels = ["large-distil.en", "large-distil.ja"];
 
     return (
         <div className="dropdown">
@@ -80,11 +93,13 @@ const TranscriptionAccuracy = (): JSX.Element => {
                 (downloadedModels.length === 0 &&
                     // 2. WhisperのAPIキーが設定されていない場合
                     settingKeyOpenai === "" &&
-                    // 3. ローカルにWhisperLargeモデルがダウンロードされていない場合 or ローカルにFugumtモデルがダウンロードされていない場合 or ダウンロードされていても、話し手の言語が日本語の場合
-                    !(downloadedModels.includes("large") && downloadedModelsFugumt.length !== 0 && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))) &&
-                    // 4. ローカルにWhisperLargeモデルがダウンロードされていない場合 or ローカルにHonyaku13Bモデルがダウンロードされていない場合 or ダウンロードされていても、話し手の言語が日本語の場合
+                    // 3. ローカルにWhisperLargeモデルがダウンロードされていない場合 or ローカルにFugumtEnJaモデルがダウンロードされていない場合 or ダウンロードされていても、話し手の言語が日本語の場合
+                    !(downloadedModels.includes("large") && downloadedModelsFugumtEnJa.length !== 0 && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))) &&
+                    // 4. ローカルにWhisperLargeモデルがダウンロードされていない場合 or ローカルにFugumtJaEnモデルがダウンロードされていない場合 or ダウンロードされていても、話し手の言語が日本語以外の場合
+                    !(downloadedModels.includes("large") && downloadedModelsFugumtJaEn.length !== 0 && (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))) &&
+                    // 5. ローカルにWhisperLargeモデルがダウンロードされていない場合 or ローカルにHonyaku13Bモデルがダウンロードされていない場合 or ダウンロードされていても、話し手の言語が日本語の場合
                     !(downloadedModels.includes("large") && downloadedModelsHonyaku13B.length !== 0 && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))) &&
-                    // 5. AmiVoiceのAPIキーが設定されていない場合 or 設定されていても、話し手の言語が日本語以外の場合
+                    // 6. AmiVoiceのAPIキーが設定されていない場合 or 設定されていても、話し手の言語が日本語以外の場合
                     !(settingKeyAmivoice !== "" && (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))))) ? <label tabIndex={0} className="group normal-case btn w-52 flex justify-between btn-disabled" style={{ color: "inherit", backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}>
                 <div className="w-36 text-left overflow-x-hidden whitespace-nowrap text-ellipsis">{transcriptionAccuracy === null ? "追っかけ方法を選択" : mapModel(transcriptionAccuracy)}</div>
                 <div>
@@ -109,7 +124,7 @@ const TranscriptionAccuracy = (): JSX.Element => {
                         group-hover:visible opacity-100 absolute ">追っかけ方法
                 </div>
             </label>}
-            <ul tabIndex={0} className="dropdown-content menu rounded-box w-52"
+            <ul tabIndex={0} className="dropdown-content menu rounded-box w-60"
                 style={{ backgroundColor: "hsl(var(--b1) / var(--tw-bg-opacity))", border: "1px solid hsl(var(--bc) / 0.2)" }}
             >
                 <ul className="max-h-56 overflow-y-scroll rounded-box scrollbar-transparent">
@@ -120,78 +135,240 @@ const TranscriptionAccuracy = (): JSX.Element => {
                         </label>
                     </li>
                     {downloadedModels.length > 0 && <>
-                        {downloadedModels?.reduce((a: string[], c) => {
-                            if (c === "large-distil.en") {
-                                if (speakerLanguage?.startsWith("en-us") || speakerLanguage?.startsWith("small-en-us")) {
-                                    return [...a, c]
-                                } else {
-                                    return a
+                        <hr className="my-2" />
+                        <div className="flex justify-center sticky top-0 z-10 w-full" style={{ backgroundColor: "hsl(24 33% 97%)" }}>
+                            <p className="text-xs text-gray-400">オフライン</p>
+                        </div>
+                        {downloadedModels
+                            .filter(m => transcriptionModels.includes(m))
+                            .map((model, i) => (
+                                <>
+                                    {i === 0 ?
+                                        <p className="text-sm ml-2 my-2 flex items-center">
+                                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                                <path d="M13.488 2.513a1.75 1.75 0 0 0-2.475 0L6.75 6.774a2.75 2.75 0 0 0-.596.892l-.848 2.047a.75.75 0 0 0 .98.98l2.047-.848a2.75 2.75 0 0 0 .892-.596l4.261-4.262a1.75 1.75 0 0 0 0-2.474Z" />
+                                                <path d="M4.75 3.5c-.69 0-1.25.56-1.25 1.25v6.5c0 .69.56 1.25 1.25 1.25h6.5c.69 0 1.25-.56 1.25-1.25V9A.75.75 0 0 1 14 9v2.25A2.75 2.75 0 0 1 11.25 14h-6.5A2.75 2.75 0 0 1 2 11.25v-6.5A2.75 2.75 0 0 1 4.75 2H7a.75.75 0 0 1 0 1.5H4.75Z" />
+                                            </svg>
+                                            文字起こし（汎用）
+                                        </p> : ""}
+                                    <li key={"transcription-accuracy_" + i}>
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
+                                            <a className="grow">{mapModel(model)}</a>
+                                        </label>
+                                    </li>
+                                </>
+                            ))
+                        }
+                        {downloadedModels
+                            .filter(m => targetedTranscriptionModels.includes(m))
+                            .reduce((a: string[], c) => {
+                                if (c === "large-distil.en") {
+                                    if (speakerLanguage?.startsWith("en-us") || speakerLanguage?.startsWith("small-en-us")) {
+                                        return [...a, c]
+                                    } else {
+                                        return a
+                                    }
                                 }
-                            }
-                            if (c === "large-distil.ja") {
-                                if (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) {
-                                    return [...a, c]
-                                } else {
-                                    return a
+                                if (c === "large-distil.ja") {
+                                    if (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) {
+                                        return [...a, c]
+                                    } else {
+                                        return a
+                                    }
                                 }
-                            }
-                            if (speakerLanguage?.startsWith("en-us") || speakerLanguage?.startsWith("small-en-us")) {
                                 return [...a, c]
-                            }
-                            return [...a, c, `${c}-translate-to-en`]
-                        }, []).map((model, i) => (
-                            <li key={"transcription-accuracy_" + i}>
+                            }, [])
+                            .map((model, i) => (
+                                <>
+                                    {i === 0 ?
+                                        <p className="text-sm ml-2 my-2 flex items-center">
+                                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                                <path d="M13.488 2.513a1.75 1.75 0 0 0-2.475 0L6.75 6.774a2.75 2.75 0 0 0-.596.892l-.848 2.047a.75.75 0 0 0 .98.98l2.047-.848a2.75 2.75 0 0 0 .892-.596l4.261-4.262a1.75 1.75 0 0 0 0-2.474Z" />
+                                                <path d="M4.75 3.5c-.69 0-1.25.56-1.25 1.25v6.5c0 .69.56 1.25 1.25 1.25h6.5c.69 0 1.25-.56 1.25-1.25V9A.75.75 0 0 1 14 9v2.25A2.75 2.75 0 0 1 11.25 14h-6.5A2.75 2.75 0 0 1 2 11.25v-6.5A2.75 2.75 0 0 1 4.75 2H7a.75.75 0 0 1 0 1.5H4.75Z" />
+                                            </svg>
+                                            文字起こし（言語特化）
+                                        </p> : ""}
+                                    <li key={"transcription-accuracy_" + i}>
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
+                                            <a className="grow">{mapModel(model)}</a>
+                                        </label>
+                                    </li>
+                                </>
+                            ))
+                        }
+                        {(speakerLanguage?.startsWith("en-us") || speakerLanguage?.startsWith("small-en-us")) && downloadedModels
+                            .filter(m => m === "large-distil.bilingual")
+                            .map((model, i) => (
+                                <>
+                                    {i === 0 ?
+                                        <p className="text-sm ml-2 my-2 flex items-center">
+                                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                                <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                                <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                            </svg>
+                                            翻訳（英語⇒日本語）
+                                        </p> : ""}
+                                    <li key={"transcription-accuracy_" + i}>
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
+                                            <a className="grow">{mapModel(model)}</a>
+                                        </label>
+                                    </li>
+                                </>
+                            ))
+                        }
+                        {(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) && downloadedModels
+                            .filter(m => m === "large-distil.bilingual")
+                            .map((model, i) => (
+                                <>
+                                    {i === 0 ?
+                                        <p className="text-sm ml-2 my-2 flex items-center">
+                                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                                <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                                <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                            </svg>
+                                            翻訳（日本語⇒英語）
+                                        </p> : ""}
+                                    <li key={"transcription-accuracy_" + i}>
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
+                                            <a className="grow">{mapModel(model)}</a>
+                                        </label>
+                                    </li>
+                                </>
+                            ))
+                        }
+                        {!(speakerLanguage?.startsWith("en-us") || speakerLanguage?.startsWith("small-en-us")) && downloadedModels
+                            .filter(m => transcriptionModels.includes(m))
+                            .map(m => `${m}-translate-to-en`)
+                            .map((model, i) => (
+                                <>
+                                    {i === 0 ?
+                                        <p className="text-sm ml-2 my-2 flex items-center">
+                                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                                <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                                <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                            </svg>
+                                            翻訳（18言語⇒英語）
+                                        </p> : ""}
+                                    <li key={"transcription-accuracy_" + i}>
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
+                                            <a className="grow">{mapModel(model)}</a>
+                                        </label>
+                                    </li>
+                                </>
+                            ))
+                        }
+                        {downloadedModels.includes("large")
+                            && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))
+                            && (downloadedModelsFugumtEnJa.length > 0 || downloadedModelsHonyaku13B.length > 0) && <>
+                                <p className="text-sm ml-2 my-2 flex items-center">
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                        <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                        <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                    </svg>
+                                    翻訳（18言語⇒日本語）
+                                </p>
+                                {downloadedModelsFugumtEnJa.length > 0 && <>
+                                    <li key="transcription-accuracy_fugumt-en-ja">
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="fugumt-en-ja" checked={"fugumt-en-ja" === transcriptionAccuracy} />
+                                            <a className="grow">日本語パック（標準）</a>
+                                        </label>
+                                    </li>
+                                </>}
+                                {downloadedModelsHonyaku13B.length > 0 && <>
+                                    <li key="transcription-accuracy_honyaku-13b">
+                                        <label className="label inline-flex active:!bg-inherit">
+                                            <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="honyaku-13b" checked={"honyaku-13b" === transcriptionAccuracy} />
+                                            <a className="grow">日本語パック（精度優先）</a>
+                                        </label>
+                                    </li>
+                                </>}
+                            </>
+                        }
+                        {/* Japanese-to-English translation section: shown only when the Whisper "large" model
+                            and the FuguMT ja-en model are downloaded and the speaker language is Japanese. */}
+                        {downloadedModels.includes("large")
+                            && (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja"))
+                            && (downloadedModelsFugumtJaEn.length > 0) && <>
+                                <p className="text-sm ml-2 my-2 flex items-center">
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                        <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                        <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                    </svg>
+                                    翻訳（日本語⇒英語）
+                                </p>
+                                <li key="transcription-accuracy_fugumt-ja-en">
+                                    <label className="label inline-flex active:!bg-inherit">
+                                        <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="fugumt-ja-en" checked={"fugumt-ja-en" === transcriptionAccuracy} />
+                                        <a className="grow">英語パック（標準）</a>
+                                    </label>
+                                </li>
+                            </>
+                        }
+                    </>}
+                    {(settingKeyOpenai || settingKeyAmivoice) && <>
+                        <hr className="my-2" />
+                        <div className="flex justify-center sticky top-0 z-10 w-full" style={{ backgroundColor: "hsl(24 33% 97%)" }}>
+                            <p className="text-xs text-gray-400">オンライン</p>
+                        </div>
+                        <p className="text-sm ml-2 my-2 flex items-center">
+                            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                <path d="M13.488 2.513a1.75 1.75 0 0 0-2.475 0L6.75 6.774a2.75 2.75 0 0 0-.596.892l-.848 2.047a.75.75 0 0 0 .98.98l2.047-.848a2.75 2.75 0 0 0 .892-.596l4.261-4.262a1.75 1.75 0 0 0 0-2.474Z" />
+                                <path d="M4.75 3.5c-.69 0-1.25.56-1.25 1.25v6.5c0 .69.56 1.25 1.25 1.25h6.5c.69 0 1.25-.56 1.25-1.25V9A.75.75 0 0 1 14 9v2.25A2.75 2.75 0 0 1 11.25 14h-6.5A2.75 2.75 0 0 1 2 11.25v-6.5A2.75 2.75 0 0 1 4.75 2H7a.75.75 0 0 1 0 1.5H4.75Z" />
+                            </svg>
+                            文字起こし
+                        </p>
+                        {settingKeyOpenai && <>
+                            <li key="transcription-accuracy_online-transcript">
                                 <label className="label inline-flex active:!bg-inherit">
-                                    <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value={model} checked={model === transcriptionAccuracy} />
-                                    <a className="grow">{mapModel(model)}</a>
+                                    <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-transcript" checked={"online-transcript" === transcriptionAccuracy} />
+                                    <a className="grow">Whisper</a>
                                 </label>
                             </li>
-                        ))}
-                    </>}
-                    {downloadedModels.includes("large") && downloadedModelsFugumt.length > 0 && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) && <>
-                        <li key="transcription-accuracy_fugumt-en-ja">
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="fugumt-en-ja" checked={"fugumt-en-ja" === transcriptionAccuracy} />
-                                <a className="grow">翻訳（日）：速度優先</a>
-                            </label>
-                        </li>
-                    </>}
-                    {downloadedModels.includes("large") && downloadedModelsHonyaku13B.length > 0 && !(speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) && <>
-                        <li key="transcription-accuracy_honyaku13b-q4-0">
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="honyaku13b-q4-0" checked={"honyaku13b-q4-0" === transcriptionAccuracy} />
-                                <a className="grow">翻訳（日）：精度優先</a>
-                            </label>
-                        </li>
-                    </>}
-                    {settingKeyOpenai && <>
-                        <li key="transcription-accuracy_online-transcript">
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-transcript" checked={"online-transcript" === transcriptionAccuracy} />
-                                <a className="grow">文字起こし：WhisperAPI</a>
-                            </label>
-                        </li>
-                        <li key="transcription-accuracy_online-chat">
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-chat" checked={"online-chat" === transcriptionAccuracy} />
-                                <a className="grow">AI：ChatGPT</a>
-                            </label>
-                        </li>
-                        {(!speakerLanguage?.startsWith("en-us") && !speakerLanguage?.startsWith("small-en-us")) && (
-                            <li key="online-transcript-to-en">
+                        </>}
+                        {settingKeyAmivoice && (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) && <>
+                            <li key="transcription-accuracy_online-amivoice">
                                 <label className="label inline-flex active:!bg-inherit">
-                                    <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-transcript-to-en" checked={"online-transcript-to-en" === transcriptionAccuracy} />
-                                    <a className="grow">翻訳（英）：WhisperAPI</a>
+                                    <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-amivoice" checked={"online-amivoice" === transcriptionAccuracy} />
+                                    <a className="grow">AmiVoice</a>
                                 </label>
                             </li>
-                        )}</>}
-                    {settingKeyAmivoice && (speakerLanguage?.startsWith("ja") || speakerLanguage?.startsWith("small-ja")) && <>
-                        <li key="transcription-accuracy_online-amivoice">
-                            <label className="label inline-flex active:!bg-inherit">
-                                <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-amivoice" checked={"online-amivoice" === transcriptionAccuracy} />
-                                <a className="grow">文字起こし：AmiVoiceAPI</a>
-                            </label>
-                        </li></>}
+                        </>}
+                        {settingKeyOpenai && <>
+                            {(!speakerLanguage?.startsWith("en-us") && !speakerLanguage?.startsWith("small-en-us")) && (<>
+                                <p className="text-sm ml-2 my-2 flex items-center">
+                                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                        <path d="M1 8.849c0 1 .738 1.851 1.734 1.947L3 10.82v2.429a.75.75 0 0 0 1.28.53l1.82-1.82A3.484 3.484 0 0 1 5.5 10V9A3.5 3.5 0 0 1 9 5.5h4V4.151c0-1-.739-1.851-1.734-1.947a44.539 44.539 0 0 0-8.532 0C1.738 2.3 1 3.151 1 4.151V8.85Z" />
+                                        <path d="M7 9a2 2 0 0 1 2-2h4a2 2 0 0 1 2 2v1a2 2 0 0 1-2 2h-.25v1.25a.75.75 0 0 1-1.28.53L9.69 12H9a2 2 0 0 1-2-2V9Z" />
+                                    </svg>
+                                    翻訳（18言語⇒英語）
+                                </p>
+                                <li key="online-transcript-to-en">
+                                    <label className="label inline-flex active:!bg-inherit">
+                                        <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-transcript-to-en" checked={"online-transcript-to-en" === transcriptionAccuracy} />
+                                        <a className="grow">Whisper</a>
+                                    </label>
+                                </li>
+                            </>)}
+                            <p className="text-sm ml-2 my-2 flex items-center">
+                                <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" fill="currentColor" className="size-4 mr-1">
+                                    <path fillRule="evenodd" d="M15 8A7 7 0 1 1 1 8a7 7 0 0 1 14 0Zm-5-2a2 2 0 1 1-4 0 2 2 0 0 1 4 0ZM8 9c-1.825 0-3.422.977-4.295 2.437A5.49 5.49 0 0 0 8 13.5a5.49 5.49 0 0 0 4.294-2.063A4.997 4.997 0 0 0 8 9Z" clipRule="evenodd" />
+                                </svg>
+                                アシスタント
+                            </p>
+                            <li key="transcription-accuracy_online-chat">
+                                <label className="label inline-flex active:!bg-inherit">
+                                    <input type="radio" name="trace-option" className="radio radio-accent" onChange={change} value="online-chat" checked={"online-chat" === transcriptionAccuracy} />
+                                    <a className="grow">ChatGPT</a>
+                                </label>
+                            </li>
+                        </>}
+                    </>}
                 </ul>
             </ul>
         </div>
diff --git a/src/components/organisms/NoteFooter.tsx b/src/components/organisms/NoteFooter.tsx
index b5fc622..b341315 100644
--- a/src/components/organisms/NoteFooter.tsx
+++ b/src/components/organisms/NoteFooter.tsx
@@ -5,6 +5,7 @@ import { speechHistoryState } from '../../store/atoms/speechHistoryState'
 import { AppWindow } from '../molecules/AppWindow'
 import { ActionSet } from '../molecules/ActionSet'
 import { settingKeyState } from '../../store/atoms/settingKeyState'
+import { actionState } from '../../store/atoms/actionState'
 
 type NoteFooterProps = {
     titleRef: React.RefObject<HTMLInputElement>
@@ -20,7 +21,8 @@ const NoteFooter = (props: NoteFooterProps): JSX.Element => {
     const settingKeyOpenai = useRecoilValue(settingKeyState("settingKeyOpenai"))
     const selectedNote = useRecoilValue(selectedNoteState)
     const setHistories = useSetRecoilState(speechHistoryState(selectedNote!.note_id))
-    const update = (type: "memo" | "action") => {
+    const targetAction = useRecoilValue(actionState)
+    const update = (type: "memo" | "action", action_type?: "chat" | "suggest") => {
         if (type === "memo") {
             if (inputValue === "") {
                 return
@@ -39,22 +41,38 @@ const NoteFooter = (props: NoteFooterProps): JSX.Element => {
             inputEl.current?.focus();
             setInputValue("")
         } else if (type === "action") {
-            if (inputActionValue === "") {
-                return
+            if (action_type === "chat") {
+                if (inputActionValue === "") {
+                    return
+                }
+                setHistories(prev =>
+                    [...prev, {
+                        speech_type: "action",
+                        action_type: "chat",
+                        created_at_unixtime: Math.floor(new Date().getTime() / 1000),
+                        content: inputActionValue,
+                        wav: "",
+                        model: "manual",
+                        model_description: "manual",
+                        note_id: selectedNote!.note_id
+                    }]
+                )
+                inputActionEl.current?.focus();
+                setInputActionValue("")
+            } else if (action_type === "suggest") {
+                setHistories(prev =>
+                    [...prev, {
+                        speech_type: "action",
+                        action_type: "suggest",
+                        created_at_unixtime: Math.floor(new Date().getTime() / 1000),
+                        content: "",
+                        wav: "",
+                        model: "manual",
+                        model_description: "manual",
+                        note_id: selectedNote!.note_id
+                    }]
+                )
             }
-            setHistories(prev =>
-                [...prev, {
-                    speech_type: "action",
-                    created_at_unixtime: Math.floor(new Date().getTime() / 1000),
-                    content: inputActionValue,
-                    wav: "",
-                    model: "manual",
-                    model_description: "manual",
-                    note_id: selectedNote!.note_id
-                }]
-            )
-            inputActionEl.current?.focus();
-            setInputActionValue("")
         }
     };
     const clear = (type: "memo" | "action", e: KeyboardEvent<HTMLTextAreaElement>) => {
@@ -70,7 +88,7 @@ const NoteFooter = (props: NoteFooterProps): JSX.Element => {
         if (!(e.shiftKey && e.key === 'Enter')) {
             return
         }
-        update(type);
+        update(type, type === "action" ? "chat" : undefined);
     }
 
     useEffect(() => {
@@ -92,28 +110,67 @@ const NoteFooter = (props: NoteFooterProps): JSX.Element => {
                     onClick={() => { setIsMemo(false); }}
                 >各種アクション</a>
             </div>
-            <div className={"flex-1 flex flex-col mr-2 relative" + (isMemo ? "" : " hidden")}>
-                <textarea value={inputValue} rows={3} ref={inputEl} placeholder="書き留めたいこと…" className="scrollbar-transparent pr-16 resize-none leading-6 rounded-2xl flex-1 w-full textarea textarea-bordered bg-white focus:outline-none" onKeyDown={e => enter("memo", e)} onKeyUp={e => clear("memo", e)} onChange={(e) => setInputValue(e.target.value)} />
-                <button disabled={inputValue === ""} className="w-12 h-12 absolute bottom-0 right-0 mb-5 mr-2 btn glass border border-solid border-neutral-300 text-primary" onClick={() => update("memo")}>
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
-                        <path fillRule="evenodd" d="M7.793 2.232a.75.75 0 0 1-.025 1.06L3.622 7.25h10.003a5.375 5.375 0 0 1 0 10.75H10.75a.75.75 0 0 1 0-1.5h2.875a3.875 3.875 0 0 0 0-7.75H3.622l4.146 3.957a.75.75 0 0 1-1.036 1.085l-5.5-5.25a.75.75 0 0 1 0-1.085l5.5-5.25a.75.75 0 0 1 1.06.025Z" clipRule="evenodd" />
-                    </svg>
-                </button>
-            </div>
-            <div className={"flex flex-col items-center" + (isMemo ? "" : " hidden")}>
-                <AppWindow />
-            </div>
-            <div className={"flex-1 flex flex-col mr-2 relative" + (isMemo ? " hidden" : "")}>
-                <textarea value={inputActionValue} rows={3} ref={inputActionEl} placeholder="今回の記録を活用し、アシスタントにやってもらいたいこと…" className="scrollbar-transparent pr-16 resize-none leading-6 rounded-2xl flex-1 w-full textarea textarea-bordered bg-white focus:outline-none" onKeyDown={e => enter("action", e)} onKeyUp={e => clear("action", e)} onChange={(e) => setInputActionValue(e.target.value)} />
-                <button disabled={inputActionValue === ""} className="w-12 h-12 absolute bottom-0 right-0 mb-5 mr-2 btn glass border border-solid border-neutral-300 text-primary" onClick={() => update("action")}>
-                    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
-                        <path fillRule="evenodd" d="M7.793 2.232a.75.75 0 0 1-.025 1.06L3.622 7.25h10.003a5.375 5.375 0 0 1 0 10.75H10.75a.75.75 0 0 1 0-1.5h2.875a3.875 3.875 0 0 0 0-7.75H3.622l4.146 3.957a.75.75 0 0 1-1.036 1.085l-5.5-5.25a.75.75 0 0 1 0-1.085l5.5-5.25a.75.75 0 0 1 1.06.025Z" clipRule="evenodd" />
-                    </svg>
-                </button>
-            </div>
-            <div className={"flex flex-col items-center w-52" + (isMemo ? " hidden" : "")}>
-                <ActionSet />
-            </div>
+            {isMemo && <>
+                <div className={"flex-1 flex flex-col mr-2 relative"}>
+                    <textarea value={inputValue} rows={3} ref={inputEl} placeholder="書き留めたいこと…" className="scrollbar-transparent pr-16 resize-none leading-6 rounded-2xl flex-1 w-full textarea textarea-bordered bg-white focus:outline-none" onKeyDown={e => enter("memo", e)} onKeyUp={e => clear("memo", e)} onChange={(e) => setInputValue(e.target.value)} />
+                    <button disabled={inputValue === ""} className="w-12 h-12 absolute bottom-0 right-0 mb-5 mr-2 btn glass border border-solid border-neutral-300 text-primary" onClick={() => update("memo")}>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                            <path fillRule="evenodd" d="M7.793 2.232a.75.75 0 0 1-.025 1.06L3.622 7.25h10.003a5.375 5.375 0 0 1 0 10.75H10.75a.75.75 0 0 1 0-1.5h2.875a3.875 3.875 0 0 0 0-7.75H3.622l4.146 3.957a.75.75 0 0 1-1.036 1.085l-5.5-5.25a.75.75 0 0 1 0-1.085l5.5-5.25a.75.75 0 0 1 1.06.025Z" clipRule="evenodd" />
+                        </svg>
+                    </button>
+                </div>
+                <div className={"flex flex-col items-center"}>
+                    <AppWindow />
+                </div>
+            </>}
+            {!isMemo && targetAction === "チャット" &&
+                <div className={"flex-1 flex flex-col mr-2 relative"}>
+                    <textarea value={inputActionValue} rows={3} ref={inputActionEl} placeholder="今回の記録を活用し、アシスタントにやってもらいたいこと…" className="scrollbar-transparent pr-16 resize-none leading-6 rounded-2xl flex-1 w-full textarea textarea-bordered bg-white focus:outline-none" onKeyDown={e => enter("action", e)} onKeyUp={e => clear("action", e)} onChange={(e) => setInputActionValue(e.target.value)} />
+                    <button disabled={inputActionValue === ""} className="w-12 h-12 absolute bottom-0 right-0 mb-5 mr-2 btn glass border border-solid border-neutral-300 text-primary" onClick={() => update("action", "chat")}>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="w-5 h-5">
+                            <path fillRule="evenodd" d="M7.793 2.232a.75.75 0 0 1-.025 1.06L3.622 7.25h10.003a5.375 5.375 0 0 1 0 10.75H10.75a.75.75 0 0 1 0-1.5h2.875a3.875 3.875 0 0 0 0-7.75H3.622l4.146 3.957a.75.75 0 0 1-1.036 1.085l-5.5-5.25a.75.75 0 0 1 0-1.085l5.5-5.25a.75.75 0 0 1 1.06.025Z" clipRule="evenodd" />
+                        </svg>
+                    </button>
+                </div>
+            }
+            {!isMemo && targetAction === "発話サジェスト" &&
+                <div className={"flex-1 flex flex-col mr-2 relative h-[5.5rem]"}>
+                    <div className="rounded-2xl flex-1 w-full bg-base-200 pt-2 pl-3 cursor-default">
+                        <p className='font-medium text-sm'>アシスタントが最適な発話をサジェスト</p>
+                        <p className='text-xs'>ボタン1つで状況に応じた3つの発話を提案</p>
+                        <div className='flex mt-2 text-sm'>
+                            <div className='flex items-center bg-gray-100 rounded-lg py-1 px-2 mr-2'>
+                                <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                    <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16ZM7 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S5.448 7 6 7s1 .672 1 1.5Zm5 0c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S10.448 7 11 7s1 .672 1 1.5Zm-6.5 5.5a.75.75 0 0 1 .75-.75h7.5a.75.75 0 0 1 0 1.5h-7.5a.75.75 0 0 1-.75-.75Z" clipRule="evenodd" />
+                                </svg>
+                                <p className='pl-1'>ニュートラル</p>
+                            </div>
+                            <div className='flex items-center bg-gray-100 rounded-lg py-1 px-2 mr-2 text-primary'>
+                                <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                    <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16Zm3.536-4.464a.75.75 0 1 0-1.061-1.061 3.5 3.5 0 0 1-4.95 0 .75.75 0 0 0-1.06 1.06 5 5 0 0 0 7.07 0ZM9 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S7.448 7 8 7s1 .672 1 1.5Zm3 1.5c.552 0 1-.672 1-1.5S12.552 7 12 7s-1 .672-1 1.5.448 1.5 1 1.5Z" clipRule="evenodd" />
+                                </svg>
+                                <p className='pl-1'>ポジティブ</p>
+                            </div>
+                            <div className='flex items-center bg-gray-100 rounded-lg py-1 px-2 text-error'>
+                                <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 20 20" fill="currentColor" className="size-5">
+                                    <path fillRule="evenodd" d="M10 18a8 8 0 1 0 0-16 8 8 0 0 0 0 16Zm-3.536-3.475a.75.75 0 0 0 1.061 0 3.5 3.5 0 0 1 4.95 0 .75.75 0 1 0 1.06-1.06 5 5 0 0 0-7.07 0 .75.75 0 0 0 0 1.06ZM9 8.5c0 .828-.448 1.5-1 1.5s-1-.672-1-1.5S7.448 7 8 7s1 .672 1 1.5Zm3 1.5c.552 0 1-.672 1-1.5S12.552 7 12 7s-1 .672-1 1.5.448 1.5 1 1.5Z" clipRule="evenodd" />
+                                </svg>
+                                <p className='pl-1'>ネガティブ</p>
+                            </div>
+                        </div>
+                    </div>
+                    <button className="w-12 h-12 absolute bottom-0 right-0 mb-5 mr-2 btn bg-white border border-solid border-neutral-300 text-primary" onClick={() => update("action", "suggest")}>
+                        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="currentColor" className="size-6">
+                            <path fillRule="evenodd" d="M4.848 2.771A49.144 49.144 0 0 1 12 2.25c2.43 0 4.817.178 7.152.52 1.978.292 3.348 2.024 3.348 3.97v6.02c0 1.946-1.37 3.678-3.348 3.97a48.901 48.901 0 0 1-3.476.383.39.39 0 0 0-.297.17l-2.755 4.133a.75.75 0 0 1-1.248 0l-2.755-4.133a.39.39 0 0 0-.297-.17 48.9 48.9 0 0 1-3.476-.384c-1.978-.29-3.348-2.024-3.348-3.97V6.741c0-1.946 1.37-3.68 3.348-3.97ZM6.75 8.25a.75.75 0 0 1 .75-.75h9a.75.75 0 0 1 0 1.5h-9a.75.75 0 0 1-.75-.75Zm.75 2.25a.75.75 0 0 0 0 1.5H12a.75.75 0 0 0 0-1.5H7.5Z" clipRule="evenodd" />
+                        </svg>
+                    </button>
+                </div>
+            }
+            {!isMemo && // rendered only when isMemo is false, so no "hidden" class toggle is needed
+                <div className={"flex flex-col items-center w-52"}>
+                    <ActionSet />
+                </div>
+            }
         </div>
     )
 }
diff --git a/src/components/organisms/NoteMain.tsx b/src/components/organisms/NoteMain.tsx
index b242462..bd14233 100644
--- a/src/components/organisms/NoteMain.tsx
+++ b/src/components/organisms/NoteMain.tsx
@@ -73,7 +73,7 @@ const NoteMain = (): JSX.Element => {
             const rect = bottomRef.current?.getBoundingClientRect();
             if (rect) {
                 const isInViewport = rect.top >= 0 && rect.bottom <= (window.innerHeight || document.documentElement.clientHeight);
-                if (isInViewport) {
+                if (isInViewport || histories.at(-1)?.speech_type === "screenshot") {
                     bottomRef.current?.scrollIntoView({ behavior: 'smooth' });
                 }
             }
@@ -186,123 +186,125 @@ const NoteMain = (): JSX.Element => {
     }, [isRecording])
 
     return (<>
-        <div className="max-w-7xl mx-auto py-2 px-4 sm:px-6 lg:px-8 bg-white flex items-center group relative overflow-x-hidden" style={{ height: "64px" }} >
-            <h1 className="overflow-hidden select-none text-ellipsis whitespace-nowrap text-2xl tracking-tight font-bold text-gray-600 flex-1 cursor-pointer mr-2 hover:border-base-300 border-2 border-transparent rounded-lg"
-                onDoubleClick={(e) => { e.preventDefault(); setEditTitle(true); }}>
-                {editTitle ?
-                    <input className='w-full bg-base-200 focus:outline-none pl-1 tracking-normal' autoFocus value={selectedNote!.note_title} ref={inputEl}
-                        onKeyDown={e => {
-                            if (e.key === "Enter" && e.keyCode === 13) {
-                                setEditTitle(false)
-                            }
-                        }}
-                        onBlur={() => { setEditTitle(false) }}
-                        onChange={(e) => {
-                            const target = e.target.value
-                            setSelectedNote(prev => { return { ...prev!, note_title: target } });
-                            setNotes(prev => prev.map(note => {
-                                if (note.id === selectedNote!.note_id) {
-                                    return { ...note, note_title: target }
-                                } else {
-                                    return note;
+        <div className='bg-white'>
+            <div className="max-w-7xl mx-auto py-2 px-4 sm:px-6 lg:px-8 bg-white flex items-center group relative overflow-x-hidden" style={{ height: "64px" }} >
+                <h1 className="overflow-hidden select-none text-ellipsis whitespace-nowrap text-2xl tracking-tight font-bold text-gray-600 flex-1 cursor-pointer mr-2 hover:border-base-300 border-2 border-transparent rounded-lg"
+                    onDoubleClick={(e) => { e.preventDefault(); setEditTitle(true); }}>
+                    {editTitle ?
+                        <input className='w-full bg-base-200 focus:outline-none pl-1 tracking-normal' autoFocus value={selectedNote!.note_title} ref={inputEl}
+                            onKeyDown={e => {
+                                if (e.key === "Enter" && e.keyCode === 13) {
+                                    setEditTitle(false)
                                 }
-                            }))
-                        }} />
-                    : <p className='pl-1 tracking-normal'>{selectedNote!.note_title}</p>}
-            </h1>
-            <div className="flex-none mr-2">
-                {isTracing && tracingNote === selectedNote?.note_id ?
-                    <TraceStopButton /> :
-                    <TraceStartButton />}
-            </div>
-            <div className="flex-none">
-                {(isRecording && recordingNote === selectedNote?.note_id) ? isReadyToRecognize ? <RecordStopButton /> : <RecordPreparingButton /> : <RecordStartButton />}
+                            }}
+                            onBlur={() => { setEditTitle(false) }}
+                            onChange={(e) => {
+                                const target = e.target.value
+                                setSelectedNote(prev => { return { ...prev!, note_title: target } });
+                                setNotes(prev => prev.map(note => {
+                                    if (note.id === selectedNote!.note_id) {
+                                        return { ...note, note_title: target }
+                                    } else {
+                                        return note;
+                                    }
+                                }))
+                            }} />
+                        : <p className='pl-1 tracking-normal'>{selectedNote!.note_title}</p>}
+                </h1>
+                <div className="flex-none mr-2">
+                    {isTracing && tracingNote === selectedNote?.note_id ?
+                        <TraceStopButton /> :
+                        <TraceStartButton />}
+                </div>
+                <div className="flex-none">
+                    {(isRecording && recordingNote === selectedNote?.note_id) ? isReadyToRecognize ? <RecordStopButton /> : <RecordPreparingButton /> : <RecordStartButton />}
+                </div>
+                <div className={`absolute top-0 -inset-full h-full w-1/2 z-5 block transform -skew-x-12 bg-gradient-to-r from-transparent to-red-100 opacity-40 ${(isRecording && recordingNote === selectedNote?.note_id) && "animate-shine"}`} />
+                <div className={`absolute top-0 -inset-full h-full w-1/2 z-5 block transform -skew-x-12 bg-gradient-to-r from-transparent to-yellow-100 opacity-40 ${(isTracing && tracingNote === selectedNote?.note_id) && "animate-shine"}`} />
             </div>
-            <div className={`absolute top-0 -inset-full h-full w-1/2 z-5 block transform -skew-x-12 bg-gradient-to-r from-transparent to-red-100 opacity-40 ${(isRecording && recordingNote === selectedNote?.note_id) && "animate-shine"}`} />
-            <div className={`absolute top-0 -inset-full h-full w-1/2 z-5 block transform -skew-x-12 bg-gradient-to-r from-transparent to-yellow-100 opacity-40 ${(isTracing && tracingNote === selectedNote?.note_id) && "animate-shine"}`} />
-        </div>
-        <div className="bg-white max-w-7xl mx-auto pl-2 py-2 flex items-center justify-between" style={{ height: "32px" }}>
-            <FilterTabs />
-            <div className="group mr-4">
-                <button className="text-slate-500 hover:text-slate-800" onClick={async () => {
-                    const typeMapper = (speech_type: string) => {
-                        switch (speech_type) {
-                            case "speech":
-                                return "発言";
-                            case "memo":
-                                return "メモ";
-                            case "screenshot":
-                                return "スクリーンショット";
-                            case "action":
-                                return "アクション";
-                            default:
-                                return "不明";
-                        }
-                    }
-                    const filterHistory = (speech_type: string) => {
-                        if (filterTarget === "speech") {
-                            if (speech_type === "speech") {
-                                return true;
+            <div className="bg-white max-w-7xl mx-auto pl-2 py-2 flex items-center justify-between" style={{ height: "32px" }}>
+                <FilterTabs />
+                <div className="group mr-4">
+                    <button className="text-slate-500 hover:text-slate-800" onClick={async () => {
+                        const typeMapper = (speech_type: string) => {
+                            switch (speech_type) {
+                                case "speech":
+                                    return "発言";
+                                case "memo":
+                                    return "メモ";
+                                case "screenshot":
+                                    return "スクリーンショット";
+                                case "action":
+                                    return "アクション";
+                                default:
+                                    return "不明";
                             }
-                            return false;
-                        } else if (filterTarget === "memo") {
-                            if (speech_type === "memo") {
-                                return true;
+                        }
+                        const filterHistory = (speech_type: string) => {
+                            if (filterTarget === "speech") {
+                                if (speech_type === "speech") {
+                                    return true;
+                                }
+                                return false;
+                            } else if (filterTarget === "memo") {
+                                if (speech_type === "memo") {
+                                    return true;
+                                }
+                                return false;
+                            } else if (filterTarget === "screenshot") {
+                                if (speech_type === "screenshot") {
+                                    return true;
+                                }
+                                return false;
+                            } else if (filterTarget === "action") {
+                                if (speech_type === "action") {
+                                    return true;
+                                }
+                                return false;
                             }
-                            return false;
-                        } else if (filterTarget === "screenshot") {
-                            if (speech_type === "screenshot") {
-                                return true;
+                            return true;
+                        }
+                        const csvSuffix = (() => {
+                            switch (filterTarget) {
+                                case null:
+                                    return "all";
+                                case "speech":
+                                    return "speech";
+                                case "memo":
+                                    return "memo";
+                                case "screenshot":
+                                    return "screenshot";
+                                case "action":
+                                    return "action";
+                                default:
+                                    return "unknown";
                             }
-                            return false;
-                        } else if (filterTarget === "action") {
-                            if (speech_type === "action") {
-                                return true;
+                        })();
+                        const csvData = (() => {
+                            if (settingKeyOpenai !== "") {
+                                return "日付,種別,内容1,内容2\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${String(h.content).replace(/"/g, '""')}","${String(h.content_2 || "").replace(/"/g, '""')}"`).join("\n"); // RFC 4180: embedded double quotes are escaped by doubling them
+                            } else if (histories.some(h => h.speech_type === "action")) {
+                                return "日付,種別,内容1,内容2\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${String(h.content).replace(/"/g, '""')}","${String(h.content_2 || "").replace(/"/g, '""')}"`).join("\n"); // same quote escaping as above
+                            } else {
+                                return "日付,種別,内容\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${String(h.content).replace(/"/g, '""')}"`).join("\n"); // same quote escaping as above
                             }
-                            return false;
+                        })()
+                        const path = await save({ defaultPath: `${selectedNote?.note_title.trim()}_${csvSuffix}.csv` });
+                        if (path) {
+                            await writeTextFile(path, csvData);
                         }
-                        return true;
-                    }
-                    const csvSuffix = (() => {
-                        switch (filterTarget) {
-                            case null:
-                                return "all";
-                            case "speech":
-                                return "speech";
-                            case "memo":
-                                return "memo";
-                            case "screenshot":
-                                return "screenshot";
-                            case "action":
-                                return "action";
-                            default:
-                                return "unknown";
-                        }
-                    })();
-                    const csvData = (() => {
-                        if (settingKeyOpenai !== "") {
-                            return "日付,種別,内容1,内容2\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${h.content}","${h.content_2 || ""}"`).join("\n");
-                        } else if (histories.some(h=>h.speech_type === "action")) {
-                            return "日付,種別,内容1,内容2\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${h.content}","${h.content_2 || ""}"`).join("\n");
-                        } else {
-                            return "日付,種別,内容\n" + histories.filter(h => filterHistory(h.speech_type)).map(h => `${dayjs.unix(h.created_at_unixtime).format('YYYY-M-D H:mm')},${typeMapper(h.speech_type)},"${h.content}"`).join("\n");
-                        }
-                    })()
-                    const path = await save({ defaultPath: `${selectedNote?.note_title.trim()}_${csvSuffix}.csv` });
-                    if (path) {
-                        await writeTextFile(path, csvData);
-                    }
-                }}>
-                    <Download />
-                </button>
-                <div className="opacity-0 w-20 invisible rounded text-[12px] 
+                    }}>
+                        <Download />
+                    </button>
+                    <div className="opacity-0 w-20 invisible rounded text-[12px] 
                         font-bold text-white py-1 bg-slate-600 top-[154px] right-4
                         group-hover:visible opacity-100 absolute text-center">ダウンロード
+                    </div>
                 </div>
             </div>
         </div>
         <div className="p-5 overflow-auto z-0" style={{ height: `calc(100vh - 160px)` }} ref={scrollContainerRef}>
-            <SpeechHistory histories={histories} />
+            <SpeechHistory histories={histories} setHistories={setHistories} />
             <div className="ml-[3.75rem] mb-[243px] text-gray-400" ref={bottomRef} >
                 {partialTextDesktop !== null && partialText !== null && <div className='flex flex-col'>
                     <div className="flex items-start"><span className="loading loading-ring loading-xs mr-[5px] mt-1 flex-none"></span><p>デスクトップ音声：{partialTextDesktop}</p></div>
diff --git a/src/components/organisms/SettingsMain.tsx b/src/components/organisms/SettingsMain.tsx
index 9891ba3..496ce6e 100644
--- a/src/components/organisms/SettingsMain.tsx
+++ b/src/components/organisms/SettingsMain.tsx
@@ -16,18 +16,28 @@ import { SettingResource } from "../molecules/SettingResource"
 import { SettingModel } from "../molecules/SettingModel"
 import { SettingAILanguage } from "../molecules/SettingAILanguage"
 import { SettingAmiVoiceModel } from "../molecules/SettingAmiVoiceModel"
-import { ModelDownloadFugumtButton } from "../molecules/ModelDownloadFugumtButton"
-import { ModelDownloadFugumtProgress } from "../molecules/ModelDownloadFugumtProgress"
+import { ModelDownloadFugumtEnJaButton } from "../molecules/ModelDownloadFugumtEnJaButton"
+import { ModelDownloadFugumtEnJaProgress } from "../molecules/ModelDownloadFugumtEnJaProgress"
 import { ModelDownloadHonyaku13BButton } from "../molecules/ModelDownloadHonyaku13BButton"
 import { ModelDownloadHonyaku13BProgress } from "../molecules/ModelDownloadHonyaku13BProgress"
 import { SettingProcesses } from "../molecules/SettingProcesses"
 import { SettingOnlines } from "../molecules/SettingOnlines"
 import { SettingAmiVoiceLogging } from "../molecules/SettingAmiVoiceLogging"
+import { ModelDownloadStyleBertVits2Button } from "../molecules/ModelDownloadStyleBertVits2Button"
+import { ModelDownloadStyleBertVits2Progress } from "../molecules/ModelDownloadStyleBertVits2Progress"
+import { SettingVoices } from "../molecules/SettingVoices"
+import { ModelDownloadStyleBertVits2VoiceButton } from "../molecules/ModelDownloadStyleBertVits2VoiceButton"
+import { ModelDownloadStyleBertVits2VoiceProgress } from "../molecules/ModelDownloadStyleBertVits2VoiceProgress"
+import { settingVoiceState } from "../../store/atoms/settingVoiceState"
+import { ModelDownloadFugumtJaEnButton } from "../molecules/ModelDownloadFugumtJaEnButton"
+import { ModelDownloadFugumtJaEnProgress } from "../molecules/ModelDownloadFugumtJaEnProgress"
 
 const SettingsMain = (): JSX.Element => {
     const settingLanguage = useRecoilValue(settingLanguageState);
     const settingProcess = useRecoilValue(settingProcessState);
     const settingOnline = useRecoilValue(settingOnlineState);
+    const settingVoice = useRecoilValue(settingVoiceState);
+
     return (
         <div className="p-5 overflow-auto" style={{ height: `calc(100vh - 64px)` }}>
             <h1 className="text-3xl flex items-center select-none cursor-default">
@@ -44,10 +54,10 @@ const SettingsMain = (): JSX.Element => {
                     </svg>
                     話し手の言語
                 </h2>
-                <div className="px-5">
+                <div className="px-5 mt-2">
                     <div className="mb-8">
                         <p>音声認識を行う対象の、言語パックをダウンロードしてください。</p>
-                        <p>言語によっては、利用メモリが少ないライト版のみ存在します。</p>
+                        <p>言語によっては、メモリ使用量が少ないライト版のみ存在します。</p>
                     </div>
                     <div className="mb-4 border-b">
                         <SettingLanguages />
@@ -452,43 +462,43 @@ const SettingsMain = (): JSX.Element => {
                     </>}
                 </div>
             </div>
-            <div className="px-5 select-none cursor-default">
+            <div className="px-5 select-none cursor-default mt-10">
                 <h2 className="text-xl mt-5 mb-4 flex items-center">
                     <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth={1.5} stroke="currentColor" className="w-6 h-6 mr-2">
                         <path strokeLinecap="round" strokeLinejoin="round" d="M9.813 15.904L9 18.75l-.813-2.846a4.5 4.5 0 00-3.09-3.09L2.25 12l2.846-.813a4.5 4.5 0 003.09-3.09L9 5.25l.813 2.846a4.5 4.5 0 003.09 3.09L15.75 12l-2.846.813a4.5 4.5 0 00-3.09 3.09zM18.259 8.715L18 9.75l-.259-1.035a3.375 3.375 0 00-2.455-2.456L14.25 6l1.036-.259a3.375 3.375 0 002.455-2.456L18 2.25l.259 1.035a3.375 3.375 0 002.456 2.456L21.75 6l-1.035.259a3.375 3.375 0 00-2.456 2.456zM16.894 20.567L16.5 21.75l-.394-1.183a2.25 2.25 0 00-1.423-1.423L13.5 18.75l1.183-.394a2.25 2.25 0 001.423-1.423l.394-1.183.394 1.183a2.25 2.25 0 001.423 1.423l1.183.394-1.183.394a2.25 2.25 0 00-1.423 1.423z" />
                     </svg>
                     追っかけ文字起こし・翻訳
                 </h2>
-                <div className="px-5">
+                <div className="px-5 mt-2">
                     <div className="mb-8">
-                        <p>通常の文字起こしを追いかける形で、高精度の文字起こしや翻訳を行います。</p>
+                        <p>通常の文字起こしを追いかける形式で、高精度の文字起こしや翻訳を行います。</p>
                         <p>各パックをダウンロードするか、オンライン設定を行ってください。</p>
                     </div>
                     <div className="mb-4 border-b">
                         <SettingProcesses />
                     </div>
-                    {settingProcess === "文字起こし" && <>
-                        <p className="text-sm mt-4 mb-4">汎用パック（高精度）を推奨します。速度に問題がある場合のみ、他を検討してください。</p>
-                        <div style={{ height: "86px" }}>
+                    {settingProcess === "文字起こし（汎用）" && <>
+                        <p className="text-sm mt-4 mb-4">汎用パック（高精度）を推奨します。<br />速度・メモリ使用量に問題がある場合は、汎用パック（速度優先）を利用ください。</p>
+                        {/* <div style={{ height: "86px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
                                     <p>汎用パック（低精度）</p>
                                     <div className="flex my-1">
                                         <div className="badge bg-slate-400 text-white">whisper-small</div>
-                                        <div className="badge bg-slate-400 text-white ml-1">610 MB</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">447 MB</div>
                                     </div>
                                 </div>
                                 <ModelDownloadWhisperButton modelType="small" />
                             </div>
                             <ModelDownloadWhisperProgress modelType="small" />
-                        </div>
+                        </div> */}
                         <div style={{ height: "86px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
                                     <p>汎用パック（中精度）</p>
                                     <div className="flex my-1">
                                         <div className="badge bg-slate-400 text-white">whisper-medium</div>
-                                        <div className="badge bg-slate-400 text-white ml-1">2.0 GB</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">1.4 GB</div>
                                     </div>
                                 </div>
                                 <ModelDownloadWhisperButton modelType="medium" />
@@ -501,7 +511,7 @@ const SettingsMain = (): JSX.Element => {
                                     <p>汎用パック（高精度）</p>
                                     <div className="flex my-1">
                                         <div className="badge bg-slate-400 text-white">whisper-large-v3</div>
-                                        <div className="badge bg-slate-400 text-white ml-1">4.0 GB</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">2.9 GB</div>
                                     </div>
                                 </div>
                                 <ModelDownloadWhisperButton modelType="large" />
@@ -511,10 +521,26 @@ const SettingsMain = (): JSX.Element => {
                         <div style={{ height: "86px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
-                                    <p>英語パック（速度優先）</p>
+                                    <p>汎用パック（速度優先）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white">whisper-large-v3-turbo</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">1.5 GB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadWhisperButton modelType="large-turbo" />
+                            </div>
+                            <ModelDownloadWhisperProgress modelType="large-turbo" />
+                        </div>
+                    </>}
+                    {settingProcess === "文字起こし（言語特化）" && <>
+                        <p className="text-sm mt-4 mb-4">汎用パック（高精度）を推奨します。</p>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>英語パック</p>
                                     <div className="flex my-1">
                                         <div className="badge bg-slate-400 text-white">distil-whisper/distil-large-v3</div>
-                                        <div className="badge bg-slate-400 text-white ml-1">2.6 GB</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">1.4 GB</div>
                                     </div>
                                 </div>
                                 <ModelDownloadWhisperButton modelType="large-distil.en" />
@@ -524,10 +550,10 @@ const SettingsMain = (): JSX.Element => {
                         <div style={{ height: "86px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
-                                    <p>日本語パック（速度優先）</p>
+                                    <p>日本語パック</p>
                                     <div className="flex my-1">
-                                        <div className="badge bg-slate-400 text-white">Kotoba-Whisper-v1.1</div>
-                                        <div className="badge bg-slate-400 text-white ml-1">2.6 GB</div>
+                                        <div className="badge bg-slate-400 text-white">Kotoba-Whisper-v2.0</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">1.2 GB</div>
                                     </div>
                                 </div>
                                 <ModelDownloadWhisperButton modelType="large-distil.ja" />
@@ -535,22 +561,22 @@ const SettingsMain = (): JSX.Element => {
                             <ModelDownloadWhisperProgress modelType="large-distil.ja" />
                         </div>
                     </>}
-                    {settingProcess === "翻訳" && <>
-                        <p className="text-sm mt-4 mb-4">有効にするには、文字起こしの汎用パック（高精度）が必要です。<br/>英語への翻訳も、文字起こしの汎用パックが担います。</p>
+                    {settingProcess === "翻訳（18言語⇒日本語）" && <>
+                        <p className="text-sm mt-4 mb-4">有効化するには、文字起こし（汎用）の汎用パック（高精度）が必要です。</p>
                         <div style={{ height: "86px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
-                                    <p>日本語パック（速度優先）</p>
+                                    <p>日本語パック（標準）</p>
                                     <div className="flex my-1">
                                         <div className="badge bg-slate-400 text-white">staka/fugumt-en-ja</div>
                                         <div className="badge bg-slate-400 text-white ml-1">114 MB</div>
                                     </div>
                                 </div>
-                                <ModelDownloadFugumtButton />
+                                <ModelDownloadFugumtEnJaButton />
                             </div>
-                            <ModelDownloadFugumtProgress />
+                            <ModelDownloadFugumtEnJaProgress />
                         </div>
-                        <div style={{ height: "86px" }}>
+                        <div style={{ height: "106px" }}>
                             <div className="flex items-center justify-between mb-2">
                                 <div>
                                     <p>日本語パック（精度優先）</p>
@@ -559,7 +585,7 @@ const SettingsMain = (): JSX.Element => {
                                         <div className="badge bg-slate-400 text-white ml-1">7.1 GB</div>
                                     </div>
                                     <p className="text-sm">
-                                        ※ 処理が重いため、リアルタイムでの利用は推奨しません。
+                                        ※ メモリ解放されないバグのため、利用後にアプリ再起動が必要。
                                     </p>
                                 </div>
                                 <ModelDownloadHonyaku13BButton />
@@ -567,18 +593,201 @@ const SettingsMain = (): JSX.Element => {
                             <ModelDownloadHonyaku13BProgress />
                         </div>
                     </>}
+                    {settingProcess === "翻訳（日本語⇒英語）" && <>
+                        <p className="text-sm mt-4 mb-4">有効化するには、文字起こし（汎用）の汎用パック（高精度）が必要です。</p>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>英語パック（標準）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white">staka/fugumt-ja-en</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">114 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadFugumtJaEnButton />
+                            </div>
+                            <ModelDownloadFugumtJaEnProgress />
+                        </div>
+                    </>}
+                    {settingProcess === "翻訳（日本語⇔英語）" && <>
+                        <p className="text-sm mt-4 mb-4">翻訳（18言語⇒日本語）及び翻訳（日本語⇒英語）にて、<br/>速度に問題がある場合は、バイリンガルパックを利用ください。</p>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>バイリンガルパック</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white">kotoba-whisper-bilingual-v1.0</div>
+                                        <div className="badge bg-slate-400 text-white ml-1">1.2 GB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadWhisperButton modelType="large-distil.bilingual" />
+                            </div>
+                            <ModelDownloadWhisperProgress modelType="large-distil.bilingual" />
+                        </div>
+                    </>}
+                </div>
+            </div>
+            <div className="px-5 select-none cursor-default mt-10">
+                <h2 className="text-xl mt-5 mb-4 flex items-center">
+                    <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth="1.5" stroke="currentColor" className="w-6 h-6 mr-2">
+                        <path strokeLinecap="round" strokeLinejoin="round" d="M10.34 15.84c-.688-.06-1.386-.09-2.09-.09H7.5a4.5 4.5 0 1 1 0-9h.75c.704 0 1.402-.03 2.09-.09m0 9.18c.253.962.584 1.892.985 2.783.247.55.06 1.21-.463 1.511l-.657.38c-.551.318-1.26.117-1.527-.461a20.845 20.845 0 0 1-1.44-4.282m3.102.069a18.03 18.03 0 0 1-.59-4.59c0-1.586.205-3.124.59-4.59m0 9.18a23.848 23.848 0 0 1 8.835 2.535M10.34 6.66a23.847 23.847 0 0 0 8.835-2.535m0 0A23.74 23.74 0 0 0 18.795 3m.38 1.125a23.91 23.91 0 0 1 1.014 5.395m-1.014 8.855c-.118.38-.245.754-.38 1.125m.38-1.125a23.91 23.91 0 0 0 1.014-5.395m0-3.46c.495.413.811 1.035.811 1.73 0 .695-.316 1.317-.811 1.73m0-3.46a24.347 24.347 0 0 1 0 3.46" />
+                    </svg>
+                    スマート読み上げ
+                </h2>
+                <div className="px-5 mt-2">
+                    <div className="mb-8">
+                        <p>テキストを感情豊かな音声で読み上げます。現在は発話サジェストで有効です。</p>
+                        <p>基本エンジンをダウンロードの上、各ボイスパックをダウンロードしてください。</p>
+                    </div>
+                    <div style={{ height: "86px" }}>
+                        <div className="flex items-center justify-between mb-2">
+                            <div>
+                                <p>基本エンジン</p>
+                                <div className="flex my-1">
+                                    <div className="badge bg-slate-400 text-white">Style-Bert-VITS2 JP-Extra</div>
+                                    <div className="badge bg-slate-400 text-white ml-1">1.2 GB</div>
+                                </div>
+                            </div>
+                            <ModelDownloadStyleBertVits2Button />
+                        </div>
+                        <ModelDownloadStyleBertVits2Progress />
+                    </div>
+                    <div className="mb-4 border-b">
+                        <SettingVoices />
+                    </div>
+                    {settingVoice === "JVNV" && <>
+                        <div className="text-sm mt-4 mb-4">
+                            <p>
+                                <a className="text-[#0f83fd]" href="https://sites.google.com/site/shinnosuketakamichi/research-topics/jvnv_corpus" target="_blank">JVNVコーパス</a>の音声で学習されました。
+                            </p>
+                            <p>このコーパスのライセンスは、<a className="text-[#0f83fd]" href="https://creativecommons.org/licenses/by-sa/4.0/deed.ja" target="_blank">CC BY-SA 4.0</a>のため、利用規約はこれを継承します。</p>
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（女性1：jvnv-F1-jp）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="jvnv-F1-jp" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="jvnv-F1-jp" />
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（女性2：jvnv-F2-jp）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="jvnv-F2-jp" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="jvnv-F2-jp" />
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（男性1：jvnv-M1-jp）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="jvnv-M1-jp" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="jvnv-M1-jp" />
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（男性2：jvnv-M2-jp）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="jvnv-M2-jp" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="jvnv-M2-jp" />
+                        </div>
+                    </>}
+                    {settingVoice === "つくよみちゃん" && <>
+                        <div className="text-sm mt-4 mb-4">
+                            <p className="mb-4">
+                                本ソフトウェアの音声合成には、<br />フリー素材キャラクター「つくよみちゃん」が無料公開している音声データを使用しています。
+                            </p>
+                            <p>■つくよみちゃんコーパス（CV.夢前黎）</p>
+                            <a className="text-[#0f83fd]" href="https://tyc.rei-yumesaki.net/material/corpus/" target="_blank">https://tyc.rei-yumesaki.net/material/corpus/</a>
+                            <p className="mt-2">© Rei Yumesaki</p>
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（つくよみちゃん）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="tsukuyomi-chan" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="tsukuyomi-chan" />
+                        </div>
+                    </>}
+                    {settingVoice === "小春音アミ・あみたろ" && <>
+                        <div className="text-sm mt-4 mb-4">
+                            <p>
+                                <a className="text-[#0f83fd]" href="https://amitaro.net/" target="_blank">あみたろの声素材工房</a>のコーパス音声・ライブ配信音声から許可を得て学習されたモデルを使用しています。
+                            </p>
+                            <p>
+                                利用の際には、<a className="text-[#0f83fd]" href="https://amitaro.net/voice/voice_rule/" target="_blank">あみたろの声素材工房の規約</a>と<a className="text-[#0f83fd]" href="https://amitaro.net/voice/livevoice/#index_id6" target="_blank">あみたろのライブ配信音声・利用規約</a>を遵守してください。
+                            </p>
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（小春音アミ）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="koharune-ami" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="koharune-ami" />
+                        </div>
+                        <div style={{ height: "86px" }}>
+                            <div className="flex items-center justify-between mb-2">
+                                <div>
+                                    <p>ボイスパック（あみたろ）</p>
+                                    <div className="flex my-1">
+                                        <div className="badge bg-slate-400 text-white ml-1">231 MB</div>
+                                    </div>
+                                </div>
+                                <ModelDownloadStyleBertVits2VoiceButton modelType="amitaro" />
+                            </div>
+                            <ModelDownloadStyleBertVits2VoiceProgress modelType="amitaro" />
+                        </div>
+                    </>}
+                    {settingVoice === "カスタマイズ" &&
+                        <div className="text-sm mt-4 pb-[26px]">
+                            <p className="mb-4">
+                                sbv2ファイルを用意することで、<br />自身のStyle-Bert-VITS2 JP-Extraモデルを利用することができます。
+                            </p>
+                            <p>下記ディレクトリに、用意したsbv2ファイルを格納してください。</p>
+                            <div className="text-white bg-gray-600 select-auto max-w-fit mt-1 px-2 py-1 rounded-sm">/Applications/Lycoris.app/Contents/Resources/resources/style-bert-vits/models</div>
+                        </div>
+                    }
                 </div>
             </div>
-            <div className="px-5 select-none cursor-default">
+            <div className="px-5 select-none cursor-default mt-10">
                 <h2 className="text-xl mt-5 mb-4 flex items-center">
                     <svg xmlns="http://www.w3.org/2000/svg" fill="none" viewBox="0 0 24 24" strokeWidth={1.5} stroke="currentColor" className="w-6 h-6 mr-2">
                         <path strokeLinecap="round" strokeLinejoin="round" d="M8.288 15.038a5.25 5.25 0 017.424 0M5.106 11.856c3.807-3.808 9.98-3.808 13.788 0M1.924 8.674c5.565-5.565 14.587-5.565 20.152 0M12.53 18.22l-.53.53-.53-.53a.75.75 0 011.06 0z" />
                     </svg>
                     オンライン設定
                 </h2>
-                <div className="px-5">
+                <div className="px-5 mt-2">
                     <div className="mb-8">
-                        <p>各利用したいAPIとの疎通設定を行ってください。</p>
+                        <p>利用したい各APIとの疎通設定を行ってください。</p>
                     </div>
                     <div className="mb-4 border-b">
                         <SettingOnlines />
@@ -587,7 +796,7 @@ const SettingsMain = (): JSX.Element => {
                 <div className="pl-5">
                     {settingOnline === "OpenAI" && <>
                         <div className="mb-6 text-sm">
-                            <p>OpenAI社のAPIを利用することで、高速な追っかけ文字起こし・翻訳やAIが選択可能となります。</p>
+                            <p>高速な追っかけ文字起こし・翻訳やアシスタントが選択可能となります。</p>
                             <p className="pb-2">あなたのアカウントのTierに応じて、利用可能なモデルが異なります。</p>
                             <a className="text-[#0f83fd]" href="https://platform.openai.com/settings/organization/limits" target="_blank">https://platform.openai.com/settings/organization/limits</a>
                         </div>
@@ -596,7 +805,7 @@ const SettingsMain = (): JSX.Element => {
                         </div>
                         <SettingModel />
                         <div className="mt-8 mb-4">
-                            <p className="mb-2">AIオプション</p>
+                            <p className="mb-2">アシスタント設定</p>
                             <hr />
                         </div>
                         <div className="mb-8">
@@ -618,7 +827,6 @@ const SettingsMain = (): JSX.Element => {
                     </>}
                     {settingOnline === "AmiVoice" && <>
                         <div className="mb-4 text-sm">
-                            <p>AmiVoice社のAPIを利用することで、</p>
                             <p>特定の業界に特化した文字起こしが選択可能となります。</p>
                         </div>
                         <div className="mb-8">
@@ -632,7 +840,7 @@ const SettingsMain = (): JSX.Element => {
                 </div>
             </div>
             <div className="h-48"></div>
-        </div>
+        </div >
     )
 }
 
diff --git a/src/hooks/useHasPermissionScreenCapture.tsx b/src/hooks/useHasPermissionScreenCapture.tsx
index 8051e54..9c16de8 100644
--- a/src/hooks/useHasPermissionScreenCapture.tsx
+++ b/src/hooks/useHasPermissionScreenCapture.tsx
@@ -1,8 +1,10 @@
-import { useState, useEffect } from 'react';
+import { useEffect } from 'react';
 import { invoke } from '@tauri-apps/api/tauri'
+import { useRecoilState } from 'recoil';
+import { hasPermissionState } from '../store/atoms/hasPermissionState';
 
 const useHasPermissionScreenCapture = (forceReload: boolean | null = null) => {
-  const [hasPermission, setPermission] = useState(false);
+  const [hasPermission, setPermission] = useRecoilState(hasPermissionState);
   useEffect(() => {
     if (forceReload !== null && !hasPermission) {
       invoke('has_screen_capture_permission_command').then(trusted => setPermission(trusted as boolean))
diff --git a/src/index.css b/src/index.css
index 7851cdf..66ff121 100644
--- a/src/index.css
+++ b/src/index.css
@@ -87,3 +87,22 @@ body {
 .tabs-boxed .tab-active:not(.tab-disabled):not([disabled]) {
     background-color: hsl(var(--b3) / var(--tw-bg-opacity));
 }
+
+.radio.checked {
+    --tw-bg-opacity: 1;
+    background-color: hsl(var(--bc) / var(--tw-bg-opacity));
+    animation: radiomark var(--animation-input, 0.2s) ease-out;
+    box-shadow: 0 0 0 4px hsl(var(--b1)) inset, 0 0 0 4px hsl(var(--b1)) inset;
+}
+.radio-accent.checked {
+    --tw-border-opacity: 1;
+    border-color: hsl(var(--a) / var(--tw-border-opacity));
+    --tw-bg-opacity: 1;
+    background-color: hsl(var(--a) / var(--tw-bg-opacity));
+    --tw-text-opacity: 1;
+    color: hsl(var(--ac) / var(--tw-text-opacity));
+}
+
+.chat-bubble:has(.suggest-card) {
+    width: fit-content;
+}
\ No newline at end of file
diff --git a/src/lib/sqlite.ts b/src/lib/sqlite.ts
index 6a32e8d..f9ff637 100644
--- a/src/lib/sqlite.ts
+++ b/src/lib/sqlite.ts
@@ -26,8 +26,15 @@ export default class DB {
 
   public async updateSpeech(speech: SpeechHistoryType) {
     await this.db.execute(
-      'UPDATE speeches SET speech_type = $1, created_at_unixtime = $2, content = $3, wav = $4, model = $5, model_description = $6, note_id = $7 WHERE id = $8',
-      [speech.speech_type, speech.created_at_unixtime, speech.content, speech.wav, speech.model, speech.model_description, speech.note_id, speech.id]
+      'UPDATE speeches SET speech_type = $1, action_type = $2, created_at_unixtime = $3, content = $4, wav = $5, model = $6, model_description = $7, note_id = $8 WHERE id = $9',
+      [speech.speech_type, speech.action_type, speech.created_at_unixtime, speech.content, speech.wav, speech.model, speech.model_description, speech.note_id, speech.id]
+    )
+  }
+
+  public async updateSuggest(id: number, active: string) {
+    await this.db.execute(
+      'UPDATE speeches SET content = $1 WHERE id = $2',
+      [active, id]
     )
   }
 
@@ -53,8 +60,8 @@ export default class DB {
 
   public async saveSpeech(speech: SpeechHistoryType): Promise<SpeechHistoryType> {
     const { lastInsertId } = await this.db.execute(
-      'INSERT INTO speeches(speech_type, created_at_unixtime, content, wav, model, model_description, note_id) VALUES($1, $2, $3, $4, $5, $6, $7)',
-      [speech.speech_type, speech.created_at_unixtime, speech.content, speech.wav, speech.model, speech.model_description, speech.note_id]
+      'INSERT INTO speeches(speech_type, action_type, created_at_unixtime, content, wav, model, model_description, note_id) VALUES($1, $2, $3, $4, $5, $6, $7, $8)',
+      [speech.speech_type, speech.action_type, speech.created_at_unixtime, speech.content, speech.wav, speech.model, speech.model_description, speech.note_id]
     )
 
     return {
diff --git a/src/store/atoms/actionState.ts b/src/store/atoms/actionState.ts
new file mode 100644
index 0000000..a1cfa3d
--- /dev/null
+++ b/src/store/atoms/actionState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const actionState = atom<string|null>({
+  key: 'actionState',
+  default: "チャット"
+})
\ No newline at end of file
diff --git a/src/store/atoms/appSelectedState.ts b/src/store/atoms/appSelectedState.ts
new file mode 100644
index 0000000..8f95ab0
--- /dev/null
+++ b/src/store/atoms/appSelectedState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const appSelectedState = atom<string|null>({
+  key: 'appSelectedState',
+  default: null
+})
\ No newline at end of file
diff --git a/src/store/atoms/appWindowsState.ts b/src/store/atoms/appWindowsState.ts
new file mode 100644
index 0000000..360c454
--- /dev/null
+++ b/src/store/atoms/appWindowsState.ts
@@ -0,0 +1,7 @@
+import { atom } from 'recoil'
+import { AppWindowType } from '../../type/AppWindow.type'
+
+export const appWindowsState = atom<AppWindowType[]>({
+  key: 'appWindowsState',
+  default: []
+})
diff --git a/src/store/atoms/hasPermissionState.ts b/src/store/atoms/hasPermissionState.ts
new file mode 100644
index 0000000..af3c8b6
--- /dev/null
+++ b/src/store/atoms/hasPermissionState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const hasPermissionState = atom({
+  key: 'hasPermissionState',
+  default: false
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelFugumtDownloadingState.ts b/src/store/atoms/modelFugumtDownloadingState.ts
deleted file mode 100644
index 8373f55..0000000
--- a/src/store/atoms/modelFugumtDownloadingState.ts
+++ /dev/null
@@ -1,6 +0,0 @@
-import { atom } from 'recoil'
-
-export const modelFugumtDownloadingState = atom<string[]>({
-  key: 'modelFugumtDownloadingState',
-  default: []
-})
\ No newline at end of file
diff --git a/src/store/atoms/modelFugumtDownloadedState.ts b/src/store/atoms/modelFugumtEnJaDownloadedState.ts
similarity index 68%
rename from src/store/atoms/modelFugumtDownloadedState.ts
rename to src/store/atoms/modelFugumtEnJaDownloadedState.ts
index cf1d699..c3487ef 100644
--- a/src/store/atoms/modelFugumtDownloadedState.ts
+++ b/src/store/atoms/modelFugumtEnJaDownloadedState.ts
@@ -4,7 +4,7 @@ import DB from '../../lib/sqlite';
 const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
   const loadPersisted = async () => {
     const db = (await DB.getInstance())
-    const savedValue =  await db.loadDownloadedModels("fugumt");
+    const savedValue =  await db.loadDownloadedModels("fugumt-en-ja");
     setSelf(savedValue.map(obj=>obj.model_name));
   };
 
@@ -13,8 +13,8 @@ const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
   }
 };
 
-export const modelFugumtDownloadedState = atom<string[]>({
-  key: 'modelFugumtDownloadedState',
+export const modelFugumtEnJaDownloadedState = atom<string[]>({
+  key: 'modelFugumtEnJaDownloadedState',
   default: [],
   effects: [
     sqliteEffect,
diff --git a/src/store/atoms/modelFugumtEnJaDownloadingState.ts b/src/store/atoms/modelFugumtEnJaDownloadingState.ts
new file mode 100644
index 0000000..1a2a850
--- /dev/null
+++ b/src/store/atoms/modelFugumtEnJaDownloadingState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const modelFugumtEnJaDownloadingState = atom<string[]>({
+  key: 'modelFugumtEnJaDownloadingState',
+  default: []
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelFugumtJaEnDownloadedState.ts b/src/store/atoms/modelFugumtJaEnDownloadedState.ts
new file mode 100644
index 0000000..48477b9
--- /dev/null
+++ b/src/store/atoms/modelFugumtJaEnDownloadedState.ts
@@ -0,0 +1,22 @@
+import { atom, AtomEffect } from 'recoil'
+import DB from '../../lib/sqlite';
+
+const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
+  const loadPersisted = async () => {
+    const db = (await DB.getInstance())
+    const savedValue =  await db.loadDownloadedModels("fugumt-ja-en");
+    setSelf(savedValue.map(obj=>obj.model_name));
+  };
+
+  if (trigger === 'get') {
+    loadPersisted();
+  }
+};
+
+export const modelFugumtJaEnDownloadedState = atom<string[]>({
+  key: 'modelFugumtJaEnDownloadedState',
+  default: [],
+  effects: [
+    sqliteEffect,
+  ]
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelFugumtJaEnDownloadingState.ts b/src/store/atoms/modelFugumtJaEnDownloadingState.ts
new file mode 100644
index 0000000..955402f
--- /dev/null
+++ b/src/store/atoms/modelFugumtJaEnDownloadingState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const modelFugumtJaEnDownloadingState = atom<string[]>({
+  key: 'modelFugumtJaEnDownloadingState',
+  default: []
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelHonyaku13BDownloadedState.ts b/src/store/atoms/modelHonyaku13BDownloadedState.ts
index 96bad98..b92eae9 100644
--- a/src/store/atoms/modelHonyaku13BDownloadedState.ts
+++ b/src/store/atoms/modelHonyaku13BDownloadedState.ts
@@ -4,7 +4,7 @@ import DB from '../../lib/sqlite';
 const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
   const loadPersisted = async () => {
     const db = (await DB.getInstance())
-    const savedValue =  await db.loadDownloadedModels("honyaku13b");
+    const savedValue =  await db.loadDownloadedModels("honyaku-13b");
     setSelf(savedValue.map(obj=>obj.model_name));
   };
 
diff --git a/src/store/atoms/modelStyleBertVits2DownloadedState.ts b/src/store/atoms/modelStyleBertVits2DownloadedState.ts
new file mode 100644
index 0000000..fdc68a7
--- /dev/null
+++ b/src/store/atoms/modelStyleBertVits2DownloadedState.ts
@@ -0,0 +1,22 @@
+import { atom, AtomEffect } from 'recoil'
+import DB from '../../lib/sqlite';
+
+const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
+  const loadPersisted = async () => {
+    const db = (await DB.getInstance())
+    const savedValue =  await db.loadDownloadedModels("style-bert-vits2");
+    setSelf(savedValue.map(obj=>obj.model_name));
+  };
+
+  if (trigger === 'get') {
+    loadPersisted();
+  }
+};
+
+export const modelStyleBertVits2DownloadedState = atom<string[]>({
+  key: 'modelStyleBertVits2DownloadedState',
+  default: [],
+  effects: [
+    sqliteEffect,
+  ]
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelStyleBertVits2DownloadingState.ts b/src/store/atoms/modelStyleBertVits2DownloadingState.ts
new file mode 100644
index 0000000..89e4176
--- /dev/null
+++ b/src/store/atoms/modelStyleBertVits2DownloadingState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const modelStyleBertVits2DownloadingState = atom<string[]>({
+  key: 'modelStyleBertVits2DownloadingState',
+  default: []
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelStyleBertVits2VoiceDownloadedState.ts b/src/store/atoms/modelStyleBertVits2VoiceDownloadedState.ts
new file mode 100644
index 0000000..e759ee6
--- /dev/null
+++ b/src/store/atoms/modelStyleBertVits2VoiceDownloadedState.ts
@@ -0,0 +1,22 @@
+import { atom, AtomEffect } from 'recoil'
+import DB from '../../lib/sqlite';
+
+const sqliteEffect: AtomEffect<string[]> = ({setSelf, trigger}) => {
+  const loadPersisted = async () => {
+    const db = (await DB.getInstance())
+    const savedValue =  await db.loadDownloadedModels("style-bert-vits2-voice");
+    setSelf(savedValue.map(obj=>obj.model_name));
+  };
+
+  if (trigger === 'get') {
+    loadPersisted();
+  }
+};
+
+export const modelStyleBertVits2VoiceDownloadedState = atom<string[]>({
+  key: 'modelStyleBertVits2VoiceDownloadedState',
+  default: [],
+  effects: [
+    sqliteEffect,
+  ]
+})
\ No newline at end of file
diff --git a/src/store/atoms/modelStyleBertVits2VoiceDownloadingState.ts b/src/store/atoms/modelStyleBertVits2VoiceDownloadingState.ts
new file mode 100644
index 0000000..e0977be
--- /dev/null
+++ b/src/store/atoms/modelStyleBertVits2VoiceDownloadingState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const modelStyleBertVits2VoiceDownloadingState = atom<string[]>({
+  key: 'modelStyleBertVits2VoiceDownloadingState',
+  default: []
+})
\ No newline at end of file
diff --git a/src/store/atoms/settingProcessState.ts b/src/store/atoms/settingProcessState.ts
index b098c34..ebd2823 100644
--- a/src/store/atoms/settingProcessState.ts
+++ b/src/store/atoms/settingProcessState.ts
@@ -6,7 +6,7 @@ const sqliteEffect: AtomEffect<string> = ({setSelf, onSet, trigger}) => {
     const db = (await DB.getInstance())
     const savedValue =  await db.loadSetting("settingProcess");
     if (savedValue === null) {
-      setSelf("文字起こし");
+      setSelf("文字起こし（汎用）");
     } else {
       setSelf(savedValue!.setting_status);
     }
@@ -19,7 +19,7 @@ const sqliteEffect: AtomEffect<string> = ({setSelf, onSet, trigger}) => {
   onSet(async(newValue, _, isReset:any) => {
     const db = await DB.getInstance()
     if (isReset) {
-      await db.updateSetting("settingProcess", "文字起こし")
+      await db.updateSetting("settingProcess", "文字起こし（汎用）")
     } else {
       await db.updateSetting("settingProcess", newValue)
     }
@@ -28,7 +28,7 @@ const sqliteEffect: AtomEffect<string> = ({setSelf, onSet, trigger}) => {
 
 export const settingProcessState = atom<string>({
   key: 'settingProcessState',
-  default: "文字起こし",
+  default: "文字起こし（汎用）",
   effects: [
     sqliteEffect,
   ]
diff --git a/src/store/atoms/settingVoiceState.ts b/src/store/atoms/settingVoiceState.ts
new file mode 100644
index 0000000..95d3d8b
--- /dev/null
+++ b/src/store/atoms/settingVoiceState.ts
@@ -0,0 +1,35 @@
+import { atom, AtomEffect } from 'recoil'
+import DB from '../../lib/sqlite';
+
+const sqliteEffect: AtomEffect<string> = ({setSelf, onSet, trigger}) => {
+  const loadPersisted = async () => {
+    const db = (await DB.getInstance())
+    const savedValue =  await db.loadSetting("settingVoice");
+    if (savedValue === null) {
+      setSelf("JVNV");
+    } else {
+      setSelf(savedValue!.setting_status);
+    }
+  };
+
+  if (trigger === 'get') {
+    loadPersisted();
+  }
+
+  onSet(async(newValue, _, isReset:any) => {
+    const db = await DB.getInstance()
+    if (isReset) {
+      await db.updateSetting("settingVoice", "JVNV")
+    } else {
+      await db.updateSetting("settingVoice", newValue)
+    }
+  });
+};
+
+export const settingVoiceState = atom<string>({
+  key: 'settingVoiceState',
+  default: "JVNV",
+  effects: [
+    sqliteEffect,
+  ]
+})
\ No newline at end of file
diff --git a/src/store/atoms/smartVoices/lengthScaleState.ts b/src/store/atoms/smartVoices/lengthScaleState.ts
new file mode 100644
index 0000000..19ce56d
--- /dev/null
+++ b/src/store/atoms/smartVoices/lengthScaleState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const lengthScaleState = atom({
+  key: 'lengthScaleState',
+  default: 1.0
+})
\ No newline at end of file
diff --git a/src/store/atoms/smartVoices/sdpRatioState.ts b/src/store/atoms/smartVoices/sdpRatioState.ts
new file mode 100644
index 0000000..af02d78
--- /dev/null
+++ b/src/store/atoms/smartVoices/sdpRatioState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const sdpRatioState = atom({
+  key: 'sdpRatioState',
+  default: 0.2
+})
\ No newline at end of file
diff --git a/src/store/atoms/smartVoices/smartVoiceState.ts b/src/store/atoms/smartVoices/smartVoiceState.ts
new file mode 100644
index 0000000..9448163
--- /dev/null
+++ b/src/store/atoms/smartVoices/smartVoiceState.ts
@@ -0,0 +1,6 @@
+import { atom } from 'recoil'
+
+export const smartVoiceState = atom({
+  key: 'smartVoiceState',
+  default: "off"
+})
\ No newline at end of file
diff --git a/src/type/SpeechHistory.type.ts b/src/type/SpeechHistory.type.ts
index d7496ca..39aab82 100644
--- a/src/type/SpeechHistory.type.ts
+++ b/src/type/SpeechHistory.type.ts
@@ -1,6 +1,7 @@
 export type SpeechHistoryType = {
     id? : number;
     speech_type: "speech" | "memo" | "screenshot" | "action";
+    action_type?: "chat" | "suggest";
     created_at_unixtime: number;
     content: string;
     content_2?: string;
diff --git a/yarn.lock b/yarn.lock
index 206677d..9f468bd 100644
--- a/yarn.lock
+++ b/yarn.lock
@@ -548,85 +548,85 @@
   resolved "https://registry.yarnpkg.com/@pkgjs/parseargs/-/parseargs-0.11.0.tgz#a77ea742fab25775145434eb1d2328cf5013ac33"
   integrity sha512-+1VkjdD0QBLPodGrJUeqarH8VAIvQODIbwh9XpP5Syisf7YoQgsJKPNFoqqLQlu+VQ/tVSshMR6loPMn8U+dPg==
 
-"@rollup/rollup-android-arm-eabi@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-android-arm-eabi/-/rollup-android-arm-eabi-4.21.0.tgz#d941173f82f9b041c61b0dc1a2a91dcd06e4b31e"
-  integrity sha512-WTWD8PfoSAJ+qL87lE7votj3syLavxunWhzCnx3XFxFiI/BA/r3X7MUM8dVrH8rb2r4AiO8jJsr3ZjdaftmnfA==
-
-"@rollup/rollup-android-arm64@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-android-arm64/-/rollup-android-arm64-4.21.0.tgz#7e7157c8543215245ceffc445134d9e843ba51c0"
-  integrity sha512-a1sR2zSK1B4eYkiZu17ZUZhmUQcKjk2/j9Me2IDjk1GHW7LB5Z35LEzj9iJch6gtUfsnvZs1ZNyDW2oZSThrkA==
-
-"@rollup/rollup-darwin-arm64@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-darwin-arm64/-/rollup-darwin-arm64-4.21.0.tgz#f0a18a4fc8dc6eb1e94a51fa2adb22876f477947"
-  integrity sha512-zOnKWLgDld/svhKO5PD9ozmL6roy5OQ5T4ThvdYZLpiOhEGY+dp2NwUmxK0Ld91LrbjrvtNAE0ERBwjqhZTRAA==
-
-"@rollup/rollup-darwin-x64@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-darwin-x64/-/rollup-darwin-x64-4.21.0.tgz#34b7867613e5cc42d2b85ddc0424228cc33b43f0"
-  integrity sha512-7doS8br0xAkg48SKE2QNtMSFPFUlRdw9+votl27MvT46vo44ATBmdZdGysOevNELmZlfd+NEa0UYOA8f01WSrg==
-
-"@rollup/rollup-linux-arm-gnueabihf@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm-gnueabihf/-/rollup-linux-arm-gnueabihf-4.21.0.tgz#422b19ff9ae02b05d3395183d1d43b38c7c8be0b"
-  integrity sha512-pWJsfQjNWNGsoCq53KjMtwdJDmh/6NubwQcz52aEwLEuvx08bzcy6tOUuawAOncPnxz/3siRtd8hiQ32G1y8VA==
-
-"@rollup/rollup-linux-arm-musleabihf@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm-musleabihf/-/rollup-linux-arm-musleabihf-4.21.0.tgz#568aa29195ef6fc57ec6ed3f518923764406a8ee"
-  integrity sha512-efRIANsz3UHZrnZXuEvxS9LoCOWMGD1rweciD6uJQIx2myN3a8Im1FafZBzh7zk1RJ6oKcR16dU3UPldaKd83w==
-
-"@rollup/rollup-linux-arm64-gnu@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm64-gnu/-/rollup-linux-arm64-gnu-4.21.0.tgz#22309c8bcba9a73114f69165c72bc94b2fbec085"
-  integrity sha512-ZrPhydkTVhyeGTW94WJ8pnl1uroqVHM3j3hjdquwAcWnmivjAwOYjTEAuEDeJvGX7xv3Z9GAvrBkEzCgHq9U1w==
-
-"@rollup/rollup-linux-arm64-musl@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm64-musl/-/rollup-linux-arm64-musl-4.21.0.tgz#c93c388af6d33f082894b8a60839d7265b2b9bc5"
-  integrity sha512-cfaupqd+UEFeURmqNP2eEvXqgbSox/LHOyN9/d2pSdV8xTrjdg3NgOFJCtc1vQ/jEke1qD0IejbBfxleBPHnPw==
-
-"@rollup/rollup-linux-powerpc64le-gnu@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-powerpc64le-gnu/-/rollup-linux-powerpc64le-gnu-4.21.0.tgz#493c5e19e395cf3c6bd860c7139c8a903dea72b4"
-  integrity sha512-ZKPan1/RvAhrUylwBXC9t7B2hXdpb/ufeu22pG2psV7RN8roOfGurEghw1ySmX/CmDDHNTDDjY3lo9hRlgtaHg==
-
-"@rollup/rollup-linux-riscv64-gnu@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-riscv64-gnu/-/rollup-linux-riscv64-gnu-4.21.0.tgz#a2eab4346fbe5909165ce99adb935ba30c9fb444"
-  integrity sha512-H1eRaCwd5E8eS8leiS+o/NqMdljkcb1d6r2h4fKSsCXQilLKArq6WS7XBLDu80Yz+nMqHVFDquwcVrQmGr28rg==
-
-"@rollup/rollup-linux-s390x-gnu@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-s390x-gnu/-/rollup-linux-s390x-gnu-4.21.0.tgz#0bc49a79db4345d78d757bb1b05e73a1b42fa5c3"
-  integrity sha512-zJ4hA+3b5tu8u7L58CCSI0A9N1vkfwPhWd/puGXwtZlsB5bTkwDNW/+JCU84+3QYmKpLi+XvHdmrlwUwDA6kqw==
-
-"@rollup/rollup-linux-x64-gnu@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-x64-gnu/-/rollup-linux-x64-gnu-4.21.0.tgz#4fd36a6a41f3406d8693321b13d4f9b7658dd4b9"
-  integrity sha512-e2hrvElFIh6kW/UNBQK/kzqMNY5mO+67YtEh9OA65RM5IJXYTWiXjX6fjIiPaqOkBthYF1EqgiZ6OXKcQsM0hg==
-
-"@rollup/rollup-linux-x64-musl@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-x64-musl/-/rollup-linux-x64-musl-4.21.0.tgz#10ebb13bd4469cbad1a5d9b073bd27ec8a886200"
-  integrity sha512-1vvmgDdUSebVGXWX2lIcgRebqfQSff0hMEkLJyakQ9JQUbLDkEaMsPTLOmyccyC6IJ/l3FZuJbmrBw/u0A0uCQ==
-
-"@rollup/rollup-win32-arm64-msvc@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-arm64-msvc/-/rollup-win32-arm64-msvc-4.21.0.tgz#2fef1a90f1402258ef915ae5a94cc91a5a1d5bfc"
-  integrity sha512-s5oFkZ/hFcrlAyBTONFY1TWndfyre1wOMwU+6KCpm/iatybvrRgmZVM+vCFwxmC5ZhdlgfE0N4XorsDpi7/4XQ==
-
-"@rollup/rollup-win32-ia32-msvc@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-ia32-msvc/-/rollup-win32-ia32-msvc-4.21.0.tgz#a18ad47a95c5f264defb60acdd8c27569f816fc1"
-  integrity sha512-G9+TEqRnAA6nbpqyUqgTiopmnfgnMkR3kMukFBDsiyy23LZvUCpiUwjTRx6ezYCjJODXrh52rBR9oXvm+Fp5wg==
-
-"@rollup/rollup-win32-x64-msvc@4.21.0":
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-x64-msvc/-/rollup-win32-x64-msvc-4.21.0.tgz#20c09cf44dcb082140cc7f439dd679fe4bba3375"
-  integrity sha512-2jsCDZwtQvRhejHLfZ1JY6w6kEuEtfF9nzYsZxzSlNVKDX+DpsDJ+Rbjkm74nvg2rdx0gwBS+IMdvwJuq3S9pQ==
+"@rollup/rollup-android-arm-eabi@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-android-arm-eabi/-/rollup-android-arm-eabi-4.22.4.tgz#8b613b9725e8f9479d142970b106b6ae878610d5"
+  integrity sha512-Fxamp4aEZnfPOcGA8KSNEohV8hX7zVHOemC8jVBoBUHu5zpJK/Eu3uJwt6BMgy9fkvzxDaurgj96F/NiLukF2w==
+
+"@rollup/rollup-android-arm64@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-android-arm64/-/rollup-android-arm64-4.22.4.tgz#654ca1049189132ff602bfcf8df14c18da1f15fb"
+  integrity sha512-VXoK5UMrgECLYaMuGuVTOx5kcuap1Jm8g/M83RnCHBKOqvPPmROFJGQaZhGccnsFtfXQ3XYa4/jMCJvZnbJBdA==
+
+"@rollup/rollup-darwin-arm64@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-darwin-arm64/-/rollup-darwin-arm64-4.22.4.tgz#6d241d099d1518ef0c2205d96b3fa52e0fe1954b"
+  integrity sha512-xMM9ORBqu81jyMKCDP+SZDhnX2QEVQzTcC6G18KlTQEzWK8r/oNZtKuZaCcHhnsa6fEeOBionoyl5JsAbE/36Q==
+
+"@rollup/rollup-darwin-x64@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-darwin-x64/-/rollup-darwin-x64-4.22.4.tgz#42bd19d292a57ee11734c980c4650de26b457791"
+  integrity sha512-aJJyYKQwbHuhTUrjWjxEvGnNNBCnmpHDvrb8JFDbeSH3m2XdHcxDd3jthAzvmoI8w/kSjd2y0udT+4okADsZIw==
+
+"@rollup/rollup-linux-arm-gnueabihf@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm-gnueabihf/-/rollup-linux-arm-gnueabihf-4.22.4.tgz#f23555ee3d8fe941c5c5fd458cd22b65eb1c2232"
+  integrity sha512-j63YtCIRAzbO+gC2L9dWXRh5BFetsv0j0va0Wi9epXDgU/XUi5dJKo4USTttVyK7fGw2nPWK0PbAvyliz50SCQ==
+
+"@rollup/rollup-linux-arm-musleabihf@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm-musleabihf/-/rollup-linux-arm-musleabihf-4.22.4.tgz#f3bbd1ae2420f5539d40ac1fde2b38da67779baa"
+  integrity sha512-dJnWUgwWBX1YBRsuKKMOlXCzh2Wu1mlHzv20TpqEsfdZLb3WoJW2kIEsGwLkroYf24IrPAvOT/ZQ2OYMV6vlrg==
+
+"@rollup/rollup-linux-arm64-gnu@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm64-gnu/-/rollup-linux-arm64-gnu-4.22.4.tgz#7abe900120113e08a1f90afb84c7c28774054d15"
+  integrity sha512-AdPRoNi3NKVLolCN/Sp4F4N1d98c4SBnHMKoLuiG6RXgoZ4sllseuGioszumnPGmPM2O7qaAX/IJdeDU8f26Aw==
+
+"@rollup/rollup-linux-arm64-musl@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-arm64-musl/-/rollup-linux-arm64-musl-4.22.4.tgz#9e655285c8175cd44f57d6a1e8e5dedfbba1d820"
+  integrity sha512-Gl0AxBtDg8uoAn5CCqQDMqAx22Wx22pjDOjBdmG0VIWX3qUBHzYmOKh8KXHL4UpogfJ14G4wk16EQogF+v8hmA==
+
+"@rollup/rollup-linux-powerpc64le-gnu@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-powerpc64le-gnu/-/rollup-linux-powerpc64le-gnu-4.22.4.tgz#9a79ae6c9e9d8fe83d49e2712ecf4302db5bef5e"
+  integrity sha512-3aVCK9xfWW1oGQpTsYJJPF6bfpWfhbRnhdlyhak2ZiyFLDaayz0EP5j9V1RVLAAxlmWKTDfS9wyRyY3hvhPoOg==
+
+"@rollup/rollup-linux-riscv64-gnu@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-riscv64-gnu/-/rollup-linux-riscv64-gnu-4.22.4.tgz#67ac70eca4ace8e2942fabca95164e8874ab8128"
+  integrity sha512-ePYIir6VYnhgv2C5Xe9u+ico4t8sZWXschR6fMgoPUK31yQu7hTEJb7bCqivHECwIClJfKgE7zYsh1qTP3WHUA==
+
+"@rollup/rollup-linux-s390x-gnu@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-s390x-gnu/-/rollup-linux-s390x-gnu-4.22.4.tgz#9f883a7440f51a22ed7f99e1d070bd84ea5005fc"
+  integrity sha512-GqFJ9wLlbB9daxhVlrTe61vJtEY99/xB3C8e4ULVsVfflcpmR6c8UZXjtkMA6FhNONhj2eA5Tk9uAVw5orEs4Q==
+
+"@rollup/rollup-linux-x64-gnu@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-x64-gnu/-/rollup-linux-x64-gnu-4.22.4.tgz#70116ae6c577fe367f58559e2cffb5641a1dd9d0"
+  integrity sha512-87v0ol2sH9GE3cLQLNEy0K/R0pz1nvg76o8M5nhMR0+Q+BBGLnb35P0fVz4CQxHYXaAOhE8HhlkaZfsdUOlHwg==
+
+"@rollup/rollup-linux-x64-musl@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-linux-x64-musl/-/rollup-linux-x64-musl-4.22.4.tgz#f473f88219feb07b0b98b53a7923be716d1d182f"
+  integrity sha512-UV6FZMUgePDZrFjrNGIWzDo/vABebuXBhJEqrHxrGiU6HikPy0Z3LfdtciIttEUQfuDdCn8fqh7wiFJjCNwO+g==
+
+"@rollup/rollup-win32-arm64-msvc@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-arm64-msvc/-/rollup-win32-arm64-msvc-4.22.4.tgz#4349482d17f5d1c58604d1c8900540d676f420e0"
+  integrity sha512-BjI+NVVEGAXjGWYHz/vv0pBqfGoUH0IGZ0cICTn7kB9PyjrATSkX+8WkguNjWoj2qSr1im/+tTGRaY+4/PdcQw==
+
+"@rollup/rollup-win32-ia32-msvc@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-ia32-msvc/-/rollup-win32-ia32-msvc-4.22.4.tgz#a6fc39a15db618040ec3c2a24c1e26cb5f4d7422"
+  integrity sha512-SiWG/1TuUdPvYmzmYnmd3IEifzR61Tragkbx9D3+R8mzQqDBz8v+BvZNDlkiTtI9T15KYZhP0ehn3Dld4n9J5g==
+
+"@rollup/rollup-win32-x64-msvc@4.22.4":
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/@rollup/rollup-win32-x64-msvc/-/rollup-win32-x64-msvc-4.22.4.tgz#3dd5d53e900df2a40841882c02e56f866c04d202"
+  integrity sha512-j8pPKp53/lq9lMXN57S8cFz0MynJk8OWNuUnXct/9KCpKU7DgU3bYMJhwWmcqC0UU29p8Lr0/7KEVcaM6bf47Q==
 
 "@szhsin/react-menu@^4.2.2":
   version "4.2.2"
@@ -1966,6 +1966,11 @@ picocolors@^1.0.1:
   resolved "https://registry.yarnpkg.com/picocolors/-/picocolors-1.0.1.tgz#a8ad579b571952f0e5d25892de5445bcfe25aaa1"
   integrity sha512-anP1Z8qwhkbmu7MFP5iTt+wQKXgwzf7zTyGlcdzabySa9vd0Xt392U0rVmz9poOaBj0uHJKyyo9/upk0HrEQew==
 
+picocolors@^1.1.0:
+  version "1.1.0"
+  resolved "https://registry.yarnpkg.com/picocolors/-/picocolors-1.1.0.tgz#5358b76a78cde483ba5cef6a9dc9671440b27d59"
+  integrity sha512-TQ92mBOW0l3LeMeyLV6mzy/kWr8lkd/hp3mTg7wYK7zJhuBStmGMBG0BdeDZS/dZx1IukaX6Bk11zcln25o1Aw==
+
 picomatch@^2.0.4, picomatch@^2.2.1, picomatch@^2.3.1:
   version "2.3.1"
   resolved "https://registry.yarnpkg.com/picomatch/-/picomatch-2.3.1.tgz#3ba3833733646d9d3e4995946c1365a67fb07a42"
@@ -2047,32 +2052,14 @@ postcss-value-parser@^4.0.0, postcss-value-parser@^4.2.0:
   resolved "https://registry.yarnpkg.com/postcss-value-parser/-/postcss-value-parser-4.2.0.tgz#723c09920836ba6d3e5af019f92bc0971c02e514"
   integrity sha512-1NNCs6uurfkVbeXG4S8JFT9t19m45ICnif8zWLd5oPSZ50QnwMfK+H3jv408d4jw/7Bttv5axS5IiHoLaVNHeQ==
 
-postcss@^8:
-  version "8.4.38"
-  resolved "https://registry.yarnpkg.com/postcss/-/postcss-8.4.38.tgz#b387d533baf2054288e337066d81c6bee9db9e0e"
-  integrity sha512-Wglpdk03BSfXkHoQa3b/oulrotAkwrlLDRSOb9D0bN86FdRyE9lppSp33aHNPgBa0JKCoB+drFLZkQoRRYae5A==
-  dependencies:
-    nanoid "^3.3.7"
-    picocolors "^1.0.0"
-    source-map-js "^1.2.0"
-
-postcss@^8.4.23:
-  version "8.4.35"
-  resolved "https://registry.yarnpkg.com/postcss/-/postcss-8.4.35.tgz#60997775689ce09011edf083a549cea44aabe2f7"
-  integrity sha512-u5U8qYpBCpN13BsiEB0CbR1Hhh4Gc0zLFuedrHJKMctHCHAGrMdG0PRM/KErzAL3CU6/eckEtmHNB3x6e3c0vA==
+postcss@^8, postcss@^8.4.23, postcss@^8.4.41, postcss@^8.4.43:
+  version "8.4.47"
+  resolved "https://registry.yarnpkg.com/postcss/-/postcss-8.4.47.tgz#5bf6c9a010f3e724c503bf03ef7947dcb0fea365"
+  integrity sha512-56rxCq7G/XfB4EkXq9Egn5GCqugWvDFjafDOThIdMBsI15iqPqR5r15TfSr1YPYeEI19YeaXMCbY6u88Y76GLQ==
   dependencies:
     nanoid "^3.3.7"
-    picocolors "^1.0.0"
-    source-map-js "^1.0.2"
-
-postcss@^8.4.41:
-  version "8.4.41"
-  resolved "https://registry.yarnpkg.com/postcss/-/postcss-8.4.41.tgz#d6104d3ba272d882fe18fc07d15dc2da62fa2681"
-  integrity sha512-TesUflQ0WKZqAvg52PWL6kHgLKP6xB6heTOdoYM0Wt2UHyxNa4K25EZZMgKns3BH1RLVbZCREPpLY0rhnNoHVQ==
-  dependencies:
-    nanoid "^3.3.7"
-    picocolors "^1.0.1"
-    source-map-js "^1.2.0"
+    picocolors "^1.1.0"
+    source-map-js "^1.2.1"
 
 prop-types@^15.7.2:
   version "15.8.1"
@@ -2193,28 +2180,28 @@ robust-predicates@^3.0.2:
   integrity sha512-IXgzBWvWQwE6PrDI05OvmXUIruQTcoMDzRsOd5CDvHCVLcLHMTSYvOK5Cm46kWqlV3yAbuSpBZdJ5oP5OUoStg==
 
 rollup@^4.20.0:
-  version "4.21.0"
-  resolved "https://registry.yarnpkg.com/rollup/-/rollup-4.21.0.tgz#28db5f5c556a5180361d35009979ccc749560b9d"
-  integrity sha512-vo+S/lfA2lMS7rZ2Qoubi6I5hwZwzXeUIctILZLbHI+laNtvhhOIon2S1JksA5UEDQ7l3vberd0fxK44lTYjbQ==
+  version "4.22.4"
+  resolved "https://registry.yarnpkg.com/rollup/-/rollup-4.22.4.tgz#4135a6446671cd2a2453e1ad42a45d5973ec3a0f"
+  integrity sha512-vD8HJ5raRcWOyymsR6Z3o6+RzfEPCnVLMFJ6vRslO1jt4LO6dUo5Qnpg7y4RkZFM2DMe3WUirkI5c16onjrc6A==
   dependencies:
     "@types/estree" "1.0.5"
   optionalDependencies:
-    "@rollup/rollup-android-arm-eabi" "4.21.0"
-    "@rollup/rollup-android-arm64" "4.21.0"
-    "@rollup/rollup-darwin-arm64" "4.21.0"
-    "@rollup/rollup-darwin-x64" "4.21.0"
-    "@rollup/rollup-linux-arm-gnueabihf" "4.21.0"
-    "@rollup/rollup-linux-arm-musleabihf" "4.21.0"
-    "@rollup/rollup-linux-arm64-gnu" "4.21.0"
-    "@rollup/rollup-linux-arm64-musl" "4.21.0"
-    "@rollup/rollup-linux-powerpc64le-gnu" "4.21.0"
-    "@rollup/rollup-linux-riscv64-gnu" "4.21.0"
-    "@rollup/rollup-linux-s390x-gnu" "4.21.0"
-    "@rollup/rollup-linux-x64-gnu" "4.21.0"
-    "@rollup/rollup-linux-x64-musl" "4.21.0"
-    "@rollup/rollup-win32-arm64-msvc" "4.21.0"
-    "@rollup/rollup-win32-ia32-msvc" "4.21.0"
-    "@rollup/rollup-win32-x64-msvc" "4.21.0"
+    "@rollup/rollup-android-arm-eabi" "4.22.4"
+    "@rollup/rollup-android-arm64" "4.22.4"
+    "@rollup/rollup-darwin-arm64" "4.22.4"
+    "@rollup/rollup-darwin-x64" "4.22.4"
+    "@rollup/rollup-linux-arm-gnueabihf" "4.22.4"
+    "@rollup/rollup-linux-arm-musleabihf" "4.22.4"
+    "@rollup/rollup-linux-arm64-gnu" "4.22.4"
+    "@rollup/rollup-linux-arm64-musl" "4.22.4"
+    "@rollup/rollup-linux-powerpc64le-gnu" "4.22.4"
+    "@rollup/rollup-linux-riscv64-gnu" "4.22.4"
+    "@rollup/rollup-linux-s390x-gnu" "4.22.4"
+    "@rollup/rollup-linux-x64-gnu" "4.22.4"
+    "@rollup/rollup-linux-x64-musl" "4.22.4"
+    "@rollup/rollup-win32-arm64-msvc" "4.22.4"
+    "@rollup/rollup-win32-ia32-msvc" "4.22.4"
+    "@rollup/rollup-win32-x64-msvc" "4.22.4"
     fsevents "~2.3.2"
 
 roughjs@^4.6.6:
@@ -2273,15 +2260,10 @@ signal-exit@^4.0.1:
   resolved "https://registry.yarnpkg.com/signal-exit/-/signal-exit-4.1.0.tgz#952188c1cbd546070e2dd20d0f41c0ae0530cb04"
   integrity sha512-bzyZ1e88w9O1iNJbKnOlvYTrWPDl46O1bG0D3XInv+9tkPrxrN8jUUTiFlDkkmKWgn1M6CfIA13SuGqOa9Korw==
 
-source-map-js@^1.0.2:
-  version "1.0.2"
-  resolved "https://registry.yarnpkg.com/source-map-js/-/source-map-js-1.0.2.tgz#adbc361d9c62df380125e7f161f71c826f1e490c"
-  integrity sha512-R0XvVJ9WusLiqTCEiGCmICCMplcCkIwwR11mOSD9CR5u+IXYdiseeEuXCVAjS54zqwkLcPNnmU4OeJ6tUrWhDw==
-
-source-map-js@^1.2.0:
-  version "1.2.0"
-  resolved "https://registry.yarnpkg.com/source-map-js/-/source-map-js-1.2.0.tgz#16b809c162517b5b8c3e7dcd315a2a5c2612b2af"
-  integrity sha512-itJW8lvSA0TXEphiRoawsCksnlf8SyvmFzIhltqAHluXd88pkCd+cXJVHTDwdCr0IzwptSm035IHQktUu1QUMg==
+source-map-js@^1.2.1:
+  version "1.2.1"
+  resolved "https://registry.yarnpkg.com/source-map-js/-/source-map-js-1.2.1.tgz#1ce5650fddd87abc099eda37dcff024c2667ae46"
+  integrity sha512-UXWMKhLOwVKb728IUtQPXxfYU+usdybtUrK/8uGE8CQMvrhOpwvzDBwj0QhSL7MQc7vIsISBG8VQ8+IDQxpfQA==
 
 "string-width-cjs@npm:string-width@^4.2.0":
   version "4.2.3"
@@ -2526,13 +2508,13 @@ uuid@^9.0.1:
   resolved "https://registry.yarnpkg.com/uuid/-/uuid-9.0.1.tgz#e188d4c8853cc722220392c424cd637f32293f30"
   integrity sha512-b+1eJOlsR9K8HJpow9Ok3fiWOWSIcIzXodvv0rQjVoOVNpWMpxf1wZNpt4y9h10odCNrqnYp1OBzRktckBe3sA==
 
-vite@^5.4.2:
-  version "5.4.2"
-  resolved "https://registry.yarnpkg.com/vite/-/vite-5.4.2.tgz#8acb6ec4bfab823cdfc1cb2d6c53ed311bc4e47e"
-  integrity sha512-dDrQTRHp5C1fTFzcSaMxjk6vdpKvT+2/mIdE07Gw2ykehT49O0z/VHS3zZ8iV/Gh8BJJKHWOe5RjaNrW5xf/GA==
+vite@^5.4.6:
+  version "5.4.6"
+  resolved "https://registry.yarnpkg.com/vite/-/vite-5.4.6.tgz#85a93a1228a7fb5a723ca1743e337a2588ed008f"
+  integrity sha512-IeL5f8OO5nylsgzd9tq4qD2QqI0k2CQLGrWD0rCN0EQJZpBK5vJAx0I+GDkMOXxQX/OfFHMuLIx6ddAxGX/k+Q==
   dependencies:
     esbuild "^0.21.3"
-    postcss "^8.4.41"
+    postcss "^8.4.43"
     rollup "^4.20.0"
   optionalDependencies:
     fsevents "~2.3.3"