From ee1b5fa3ce12db34b0096137277af314743d8eee Mon Sep 17 00:00:00 2001 From: James Date: Mon, 2 Dec 2024 15:13:34 +0700 Subject: [PATCH] feat: update engine interface --- docs/docs/engines/engine-extension.mdx | 96 +++- engine/cli/commands/server_start_cmd.cc | 22 +- engine/controllers/engines.cc | 5 +- engine/cortex-common/EngineI.h | 30 ++ engine/services/engine_service.cc | 595 +++++++++++------------- engine/services/engine_service.h | 10 +- engine/services/hardware_service.cc | 2 +- engine/utils/config_yaml_utils.cc | 1 + engine/utils/config_yaml_utils.h | 6 +- engine/utils/file_manager_utils.cc | 1 + 10 files changed, 425 insertions(+), 343 deletions(-) diff --git a/docs/docs/engines/engine-extension.mdx b/docs/docs/engines/engine-extension.mdx index 84000767b..6bb966f60 100644 --- a/docs/docs/engines/engine-extension.mdx +++ b/docs/docs/engines/engine-extension.mdx @@ -22,12 +22,32 @@ First, create an engine that implements the `EngineI.h` interface. Here's the in ```cpp class EngineI { public: - struct EngineLoadOption{}; - struct EngineUnloadOption{}; + struct RegisterLibraryOption { + std::vector paths; + }; + + struct EngineLoadOption { + // engine + std::filesystem::path engine_path; + std::filesystem::path cuda_path; + bool custom_engine_path; + + // logging + std::filesystem::path log_path; + int max_log_lines; + trantor::Logger::LogLevel log_level; + }; + + struct EngineUnloadOption { + bool unload_dll; + }; virtual ~EngineI() {} + virtual void RegisterLibraryPath(RegisterLibraryOption opts) = 0; + virtual void Load(EngineLoadOption opts) = 0; + virtual void Unload(EngineUnloadOption opts) = 0; // Cortex.llamacpp interface methods @@ -65,7 +85,71 @@ class EngineI { }; ``` -Note that Cortex will call `Load` before loading any models and `Unload` when stopping the engine. +#### Lifecycle Management + +##### RegisterLibraryPath + +```cpp +virtual void RegisterLibraryPath(RegisterLibraryOption opts) = 0; +``` + +This method is called during engine initialization to set up dynamic library search paths. For example, in Linux, we still have to use `LD_LIBRARY_PATH` to add CUDA dependencies to the search path. + +**Parameters:** + +- `opts.paths`: Vector of filesystem paths that the engine should register + +**Implementation Requirements:** + +- Register provided paths for dynamic library loading +- Handle invalid paths gracefully +- Thread-safe implementation +- No exceptions should escape the method + +##### Load + +```cpp +virtual void Load(EngineLoadOption opts) = 0; +``` + +Initializes the engine with the provided configuration options. + +**Parameters:** + +- `engine_path`: Base path for engine files +- `cuda_path`: Path to CUDA installation +- `custom_engine_path`: Flag for using custom engine location +- `log_path`: Location for log files +- `max_log_lines`: Maximum number of lines per log file +- `log_level`: Logging verbosity level + +**Implementation Requirements:** + +- Validate all paths before use +- Initialize engine components +- Set up logging configuration +- Handle missing dependencies gracefully +- Clean initialization state in case of failures + +##### Unload + +```cpp +virtual void Unload(EngineUnloadOption opts) = 0; +``` + +Performs cleanup and shutdown of the engine. + +**Parameters:** + +- `unload_dll`: Boolean flag indicating whether to unload dynamic libraries + +**Implementation Requirements:** + +- Clean up all allocated resources +- Close file handles and connections +- Release memory +- Ensure proper shutdown of running models +- Handle cleanup in a thread-safe manner ### 2. Create a Dynamic Library @@ -98,7 +182,7 @@ To test your engine locally: 1. Create a directory structure following this hierarchy: -``` +```bash engines/ └── cortex.llamacpp/ └── mac-arm64/ @@ -107,12 +191,12 @@ engines/ └── version.txt ``` -2. Configure your engine: +1. Configure your engine: - Edit the `~/.cortexrc` file to register your engine name - Add your model with the appropriate engine field in `model.yaml` -3. Testing: +2. Testing: - Start the engine - Load your model - Verify functionality diff --git a/engine/cli/commands/server_start_cmd.cc b/engine/cli/commands/server_start_cmd.cc index ba4f7bd82..3d52f3d25 100644 --- a/engine/cli/commands/server_start_cmd.cc +++ b/engine/cli/commands/server_start_cmd.cc @@ -1,9 +1,12 @@ #include "server_start_cmd.h" #include "commands/cortex_upd_cmd.h" +#include "services/engine_service.h" #include "utils/cortex_utils.h" -#include "utils/engine_constants.h" #include "utils/file_manager_utils.h" + +#if defined(_WIN32) || defined(_WIN64) #include "utils/widechar_conv.h" +#endif namespace commands { @@ -108,22 +111,9 @@ bool ServerStartCmd::Exec(const std::string& host, int port, std::cerr << "Could not start server: " << std::endl; return false; } else if (pid == 0) { - // No need to configure LD_LIBRARY_PATH for macOS -#if !defined(__APPLE__) || !defined(__MACH__) - const char* name = "LD_LIBRARY_PATH"; - auto data = getenv(name); - std::string v; - if (auto g = getenv(name); g) { - v += g; - } - CTL_INF("LD_LIBRARY_PATH: " << v); - auto llamacpp_path = file_manager_utils::GetCudaToolkitPath(kLlamaRepo); - auto trt_path = file_manager_utils::GetCudaToolkitPath(kTrtLlmRepo); + // Some engines requires to add lib search path before process being created + EngineService().RegisterEngineLibPath(); - auto new_v = trt_path.string() + ":" + llamacpp_path.string() + ":" + v; - setenv(name, new_v.c_str(), true); - CTL_INF("LD_LIBRARY_PATH: " << getenv(name)); -#endif std::string p = cortex_utils::GetCurrentPath() + "/" + exe; execl(p.c_str(), exe.c_str(), "--start-server", "--config_file_path", get_config_file_path().c_str(), "--data_folder_path", diff --git a/engine/controllers/engines.cc b/engine/controllers/engines.cc index 3d3c0c037..1d0223d9a 100644 --- a/engine/controllers/engines.cc +++ b/engine/controllers/engines.cc @@ -23,10 +23,9 @@ std::string NormalizeEngine(const std::string& engine) { void Engines::ListEngine( const HttpRequestPtr& req, std::function&& callback) const { - std::vector supported_engines{kLlamaEngine, kOnnxEngine, - kTrtLlmEngine}; Json::Value ret; - for (const auto& engine : supported_engines) { + auto engine_names = engine_service_->GetSupportedEngineNames().value(); + for (const auto& engine : engine_names) { auto installed_engines = engine_service_->GetInstalledEngineVariants(engine); if (installed_engines.has_error()) { diff --git a/engine/cortex-common/EngineI.h b/engine/cortex-common/EngineI.h index 51e19c124..11866a708 100644 --- a/engine/cortex-common/EngineI.h +++ b/engine/cortex-common/EngineI.h @@ -1,5 +1,6 @@ #pragma once +#include #include #include @@ -7,8 +8,37 @@ #include "trantor/utils/Logger.h" class EngineI { public: + struct RegisterLibraryOption { + std::vector paths; + }; + + struct EngineLoadOption { + // engine + std::filesystem::path engine_path; + std::filesystem::path cuda_path; + bool custom_engine_path; + + // logging + std::filesystem::path log_path; + int max_log_lines; + trantor::Logger::LogLevel log_level; + }; + + struct EngineUnloadOption { + bool unload_dll; + }; + virtual ~EngineI() {} + /** + * Being called before starting process to register dependencies search paths. + */ + virtual void RegisterLibraryPath(RegisterLibraryOption opts) = 0; + + virtual void Load(EngineLoadOption opts) = 0; + + virtual void Unload(EngineUnloadOption opts) = 0; + // cortex.llamacpp interface virtual void HandleChatCompletion( std::shared_ptr json_body, diff --git a/engine/services/engine_service.cc b/engine/services/engine_service.cc index fe5317c7d..2f0acdc8f 100644 --- a/engine/services/engine_service.cc +++ b/engine/services/engine_service.cc @@ -2,6 +2,7 @@ #include #include #include +#include #include #include "algorithm" #include "database/engines.h" @@ -194,6 +195,7 @@ cpp::result EngineService::UninstallEngineVariant( return cpp::result(true); } + std::lock_guard lock(engines_mutex_); if (IsEngineLoaded(ne)) { CTL_INF("Engine " << ne << " is already loaded, unloading it"); auto unload_res = UnloadEngine(ne); @@ -286,6 +288,7 @@ cpp::result EngineService::DownloadEngine( return cpp::fail("Failed to find a suitable variant for " + engine); } + std::lock_guard lock(engines_mutex_); if (IsEngineLoaded(engine)) { CTL_INF("Engine " << engine << " is already loaded, unloading it"); auto unload_res = UnloadEngine(engine); @@ -528,6 +531,7 @@ EngineService::SetDefaultEngineVariant(const std::string& engine, " is not installed yet!"); } + std::lock_guard lock(engines_mutex_); if (IsEngineLoaded(ne)) { CTL_INF("Engine " << ne << " is already loaded, unloading it"); auto unload_res = UnloadEngine(ne); @@ -671,35 +675,43 @@ cpp::result EngineService::GetLoadedEngine( return engines_[ne].engine; } -cpp::result EngineService::LoadEngine( - const std::string& engine_name) { - auto ne = NormalizeEngine(engine_name); - std::lock_guard lock(engines_mutex_); - if (IsEngineLoaded(ne)) { - CTL_INF("Engine " << ne << " is already loaded"); - return {}; - } - - // Check for remote engine - if (remote_engine::IsRemoteEngine(engine_name)) { - auto exist_engine = GetEngineByNameAndVariant(engine_name); - if (exist_engine.has_error()) { - return cpp::fail("Remote engine '" + engine_name + "' is not installed"); - } - - if (engine_name == kOpenAiEngine) { - engines_[engine_name].engine = new remote_engine::OpenAiEngine(); - } else { - engines_[engine_name].engine = new remote_engine::AnthropicEngine(); +void EngineService::RegisterEngineLibPath() { + auto engine_names = GetSupportedEngineNames().value(); + for (const auto& engine : engine_names) { + auto ne = NormalizeEngine(engine); + try { + auto engine_dir_path_res = GetEngineDirPath(engine); + if (engine_dir_path_res.has_error()) { + CTL_ERR( + "Could not get engine dir path: " << engine_dir_path_res.error()); + continue; + } + auto engine_dir_path = engine_dir_path_res.value().first; + auto custom_engine_path = engine_dir_path_res.value().second; + + auto dylib = std::make_unique(engine_dir_path.string(), + "engine"); + + auto cuda_path = file_manager_utils::GetCudaToolkitPath(ne); + // init + auto func = dylib->get_function("get_engine"); + auto engine = func(); + std::vector paths{}; + auto register_opts = EngineI::RegisterLibraryOption{ + .paths = paths, + }; + engine->RegisterLibraryPath(register_opts); + delete engine; + CTL_DBG("Register lib path for: " << engine); + } catch (const std::exception& e) { + CTL_WRN("Failed to registering engine lib path: " << e.what()); } - - CTL_INF("Loaded engine: " << engine_name); - return {}; } +} - // End hard code - - CTL_INF("Loading engine: " << ne); +cpp::result, std::string> +EngineService::GetEngineDirPath(const std::string& engine_name) { + auto ne = NormalizeEngine(engine_name); auto selected_engine_variant = GetDefaultEngineVariant(ne); @@ -715,6 +727,7 @@ cpp::result EngineService::LoadEngine( auto user_defined_engine_path = getenv("ENGINE_PATH"); #endif + auto custom_engine_path = user_defined_engine_path != nullptr; CTL_DBG("user defined engine path: " << user_defined_engine_path); const std::filesystem::path engine_dir_path = [&] { if (user_defined_engine_path != nullptr) { @@ -728,126 +741,70 @@ cpp::result EngineService::LoadEngine( } }(); - CTL_DBG("Engine path: " << engine_dir_path.string()); - if (!std::filesystem::exists(engine_dir_path)) { CTL_ERR("Directory " + engine_dir_path.string() + " is not exist!"); return cpp::fail("Directory " + engine_dir_path.string() + " is not exist!"); } - CTL_INF("Engine path: " << engine_dir_path.string()); + CTL_INF("Engine path: " << engine_dir_path.string() + << ", custom_engine_path: " << custom_engine_path); + return std::make_pair(engine_dir_path, custom_engine_path); +} - try { -#if defined(_WIN32) - // TODO(?) If we only allow to load an engine at a time, the logic is simpler. - // We would like to support running multiple engines at the same time. Therefore, - // the adding/removing dll directory logic is quite complicated: - // 1. If llamacpp is loaded and new requested engine is tensorrt-llm: - // Unload the llamacpp dll directory then load the tensorrt-llm - // 2. If tensorrt-llm is loaded and new requested engine is llamacpp: - // Do nothing, llamacpp can re-use tensorrt-llm dependencies (need to be tested careful) - // 3. Add dll directory if met other conditions - - auto add_dll = [this](const std::string& e_type, - const std::filesystem::path& p) { - if (auto cookie = AddDllDirectory(p.c_str()); cookie != 0) { - CTL_DBG("Added dll directory: " << p.string()); - engines_[e_type].cookie = cookie; - } else { - CTL_WRN("Could not add dll directory: " << p.string()); - } +cpp::result EngineService::LoadEngine( + const std::string& engine_name) { + auto ne = NormalizeEngine(engine_name); - auto cuda_path = file_manager_utils::GetCudaToolkitPath(e_type); - if (auto cuda_cookie = AddDllDirectory(cuda_path.c_str()); - cuda_cookie != 0) { - CTL_DBG("Added cuda dll directory: " << p.string()); - engines_[e_type].cuda_cookie = cuda_cookie; - } else { - CTL_WRN("Could not add cuda dll directory: " << p.string()); - } - }; + std::lock_guard lock(engines_mutex_); + if (IsEngineLoaded(ne)) { + CTL_INF("Engine " << ne << " is already loaded"); + return {}; + } -#if defined(_WIN32) - if (bool should_use_dll_search_path = !(_wgetenv(L"ENGINE_PATH")); -#else - if (bool should_use_dll_search_path = !(getenv("ENGINE_PATH")); -#endif - should_use_dll_search_path) { - if (IsEngineLoaded(kLlamaRepo) && ne == kTrtLlmRepo && - should_use_dll_search_path) { - - { - - // Remove llamacpp dll directory - if (!RemoveDllDirectory(engines_[kLlamaRepo].cookie)) { - CTL_WRN("Could not remove dll directory: " << kLlamaRepo); - } else { - CTL_DBG("Removed dll directory: " << kLlamaRepo); - } - if (!RemoveDllDirectory(engines_[kLlamaRepo].cuda_cookie)) { - CTL_WRN("Could not remove cuda dll directory: " << kLlamaRepo); - } else { - CTL_DBG("Removed cuda dll directory: " << kLlamaRepo); - } - } + CTL_INF("Loading engine: " << ne); - add_dll(ne, engine_dir_path); - } else if (IsEngineLoaded(kTrtLlmRepo) && ne == kLlamaRepo) { - // Do nothing - } else { - add_dll(ne, engine_dir_path); - } - } -#endif - engines_[ne].dl = + auto engine_dir_path_res = GetEngineDirPath(ne); + if (engine_dir_path_res.has_error()) { + return cpp::fail(engine_dir_path_res.error()); + } + auto engine_dir_path = engine_dir_path_res.value().first; + auto custom_engine_path = engine_dir_path_res.value().second; + + try { + auto dylib = std::make_unique(engine_dir_path.string(), "engine"); -#if defined(__linux__) - const char* name = "LD_LIBRARY_PATH"; - auto data = getenv(name); - std::string v; - if (auto g = getenv(name); g) { - v += g; - } - CTL_INF("LD_LIBRARY_PATH: " << v); - auto llamacpp_path = file_manager_utils::GetCudaToolkitPath(kLlamaRepo); - CTL_INF("llamacpp_path: " << llamacpp_path); - // tensorrt is not supported for now - // auto trt_path = file_manager_utils::GetCudaToolkitPath(kTrtLlmRepo); - - auto new_v = llamacpp_path.string() + ":" + v; - setenv(name, new_v.c_str(), true); - CTL_INF("LD_LIBRARY_PATH: " << getenv(name)); -#endif + auto config = file_manager_utils::GetCortexConfig(); + + auto log_path = + std::filesystem::path(config.logFolderPath) / + std::filesystem::path( + config.logLlamaCppPath); // for now seems like we use same log path + + // init + auto func = dylib->get_function("get_engine"); + auto engine_obj = func(); + auto load_opts = EngineI::EngineLoadOption{ + .engine_path = engine_dir_path, + .cuda_path = file_manager_utils::GetCudaToolkitPath(ne), + .custom_engine_path = custom_engine_path, + .log_path = log_path, + .max_log_lines = config.maxLogLines, + .log_level = logging_utils_helper::global_log_level, + }; + engine_obj->Load(load_opts); + + engines_[ne].engine = engine_obj; + engines_[ne].dl = std::move(dylib); + + CTL_DBG("Engine loaded: " << ne); + return {}; } catch (const cortex_cpp::dylib::load_error& e) { CTL_ERR("Could not load engine: " << e.what()); engines_.erase(ne); return cpp::fail("Could not load engine " + ne + ": " + e.what()); } - - auto func = engines_[ne].dl->get_function("get_engine"); - engines_[ne].engine = func(); - - auto& en = std::get(engines_[ne].engine); - if (ne == kLlamaRepo) { //fix for llamacpp engine first - auto config = file_manager_utils::GetCortexConfig(); - if (en->IsSupported("SetFileLogger")) { - en->SetFileLogger(config.maxLogLines, - (std::filesystem::path(config.logFolderPath) / - std::filesystem::path(config.logLlamaCppPath)) - .string()); - } else { - CTL_WRN("Method SetFileLogger is not supported yet"); - } - if (en->IsSupported("SetLogLevel")) { - en->SetLogLevel(logging_utils_helper::global_log_level); - } else { - CTL_WRN("Method SetLogLevel is not supported yet"); - } - } - CTL_DBG("loaded engine: " << ne); - return {}; } cpp::result EngineService::UnloadEngine( @@ -863,238 +820,246 @@ cpp::result EngineService::UnloadEngine( } else { delete std::get(engines_[ne].engine); } + LOG_INFO << "Unloading engine " << ne; -#if defined(_WIN32) - if (!RemoveDllDirectory(engines_[ne].cookie)) { - CTL_WRN("Could not remove dll directory: " << ne); - } else { - CTL_DBG("Removed dll directory: " << ne); - } - if (!RemoveDllDirectory(engines_[ne].cuda_cookie)) { - CTL_WRN("Could not remove cuda dll directory: " << ne); - } else { - CTL_DBG("Removed cuda dll directory: " << ne); + std::lock_guard lock(engines_mutex_); + if (!IsEngineLoaded(ne)) { + return cpp::fail("Engine " + ne + " is not loaded yet!"); } -#endif + auto* e = std::get(engines_[ne].engine); + auto unload_opts = EngineI::EngineUnloadOption{ + .unload_dll = true, + }; + e->Unload(unload_opts); + delete e; engines_.erase(ne); + CTL_DBG("Engine unloaded: " + ne); + return {}; } - CTL_DBG("Unloaded engine " + ne); - return {}; -} -std::vector EngineService::GetLoadedEngines() { - std::lock_guard lock(engines_mutex_); - std::vector loaded_engines; - for (const auto& [key, value] : engines_) { - loaded_engines.push_back(value.engine); + std::vector EngineService::GetLoadedEngines() { + std::lock_guard lock(engines_mutex_); + std::vector loaded_engines; + for (const auto& [key, value] : engines_) { + loaded_engines.push_back(value.engine); + } + return loaded_engines; } - return loaded_engines; -} -cpp::result -EngineService::GetLatestEngineVersion(const std::string& engine) const { - auto ne = NormalizeEngine(engine); - auto res = github_release_utils::GetReleaseByVersion("janhq", ne, "latest"); - if (res.has_error()) { - return cpp::fail("Failed to fetch engine " + engine + " latest version!"); + cpp::result + EngineService::GetLatestEngineVersion(const std::string& engine) const { + auto ne = NormalizeEngine(engine); + auto res = github_release_utils::GetReleaseByVersion("janhq", ne, "latest"); + if (res.has_error()) { + return cpp::fail("Failed to fetch engine " + engine + " latest version!"); + } + return res.value(); } - return res.value(); -} -cpp::result EngineService::IsEngineReady( - const std::string& engine) { - auto ne = NormalizeEngine(engine); + cpp::result EngineService::IsEngineReady( + const std::string& engine) { + auto ne = NormalizeEngine(engine); - // Check for remote engine - if (remote_engine::IsRemoteEngine(engine)) { - auto exist_engine = GetEngineByNameAndVariant(engine); - if (exist_engine.has_error()) { - return cpp::fail("Remote engine '" + engine + "' is not installed"); + // Check for remote engine + if (remote_engine::IsRemoteEngine(engine)) { + auto exist_engine = GetEngineByNameAndVariant(engine); + if (exist_engine.has_error()) { + return cpp::fail("Remote engine '" + engine + "' is not installed"); + } + return true; } - return true; - } - // End hard code + // End hard code - auto os = hw_inf_.sys_inf->os; - if (os == kMacOs && (ne == kOnnxRepo || ne == kTrtLlmRepo)) { - return cpp::fail("Engine " + engine + " is not supported on macOS"); - } + auto os = hw_inf_.sys_inf->os; + if (os == kMacOs && (ne == kOnnxRepo || ne == kTrtLlmRepo)) { + return cpp::fail("Engine " + engine + " is not supported on macOS"); + } - if (os == kLinuxOs && ne == kOnnxRepo) { - return cpp::fail("Engine " + engine + " is not supported on Linux"); - } - auto installed_variants = GetInstalledEngineVariants(engine); - if (installed_variants.has_error()) { - return cpp::fail(installed_variants.error()); - } + if (os == kLinuxOs && ne == kOnnxRepo) { + return cpp::fail("Engine " + engine + " is not supported on Linux"); + } + auto installed_variants = GetInstalledEngineVariants(engine); + if (installed_variants.has_error()) { + return cpp::fail(installed_variants.error()); + } - return installed_variants->size() > 0; -} + return installed_variants->size() > 0; + } -cpp::result EngineService::UpdateEngine( - const std::string& engine) { - auto ne = NormalizeEngine(engine); - auto default_variant = GetDefaultEngineVariant(ne); + cpp::result EngineService::UpdateEngine( + const std::string& engine) { + auto ne = NormalizeEngine(engine); + auto default_variant = GetDefaultEngineVariant(ne); - if (default_variant.has_error()) { - // if we don't have a default variant, just stop - CTL_INF("No default variant found for " << ne << ". Exit update engine"); - return cpp::fail(default_variant.error()); - } - CTL_INF("Default variant: " << default_variant->variant - << ", version: " + default_variant->version); + if (default_variant.has_error()) { + // if we don't have a default variant, just stop + CTL_INF("No default variant found for " << ne << ". Exit update engine"); + return cpp::fail(default_variant.error()); + } + CTL_INF("Default variant: " << default_variant->variant + << ", version: " + default_variant->version); + + std::lock_guard lock(engines_mutex_); + if (IsEngineLoaded(ne)) { + CTL_INF("Engine " << ne << " is already loaded, unloading it"); + auto unload_res = UnloadEngine(ne); + if (unload_res.has_error()) { + CTL_INF("Failed to unload engine: " << unload_res.error()); + return cpp::fail(unload_res.error()); + } else { + CTL_INF("Engine " << ne << " unloaded successfully"); + } + } - if (IsEngineLoaded(ne)) { - CTL_INF("Engine " << ne << " is already loaded, unloading it"); - auto unload_res = UnloadEngine(ne); - if (unload_res.has_error()) { - CTL_INF("Failed to unload engine: " << unload_res.error()); - return cpp::fail(unload_res.error()); - } else { - CTL_INF("Engine " << ne << " unloaded successfully"); + auto latest_version = GetLatestEngineVersion(ne); + if (latest_version.has_error()) { + // if can't get latest version, stop + CTL_INF("Can't get latest version for " + << ne << " error: " << latest_version.error()); + return cpp::fail("Failed to get latest version: " + + latest_version.error()); + } + CTL_INF("Latest version: " + latest_version.value().name); + + // check if local engines variants if latest version already exist + auto installed_variants = GetInstalledEngineVariants(ne); + + bool latest_version_installed = false; + for (const auto& v : installed_variants.value()) { + CTL_INF("Installed version: " + v.version); + CTL_INF(json_helper::DumpJsonString(v.ToJson())); + if (default_variant->variant == v.name && + string_utils::RemoveSubstring(v.version, "v") == + latest_version.value().name) { + latest_version_installed = true; + break; + } } - } - auto latest_version = GetLatestEngineVersion(ne); - if (latest_version.has_error()) { - // if can't get latest version, stop - CTL_INF("Can't get latest version for " - << ne << " error: " << latest_version.error()); - return cpp::fail("Failed to get latest version: " + latest_version.error()); - } - CTL_INF("Latest version: " + latest_version.value().name); - - // check if local engines variants if latest version already exist - auto installed_variants = GetInstalledEngineVariants(ne); - - bool latest_version_installed = false; - for (const auto& v : installed_variants.value()) { - CTL_INF("Installed version: " + v.version); - CTL_INF(json_helper::DumpJsonString(v.ToJson())); - if (default_variant->variant == v.name && - string_utils::RemoveSubstring(v.version, "v") == - latest_version.value().name) { - latest_version_installed = true; - break; + if (latest_version_installed) { + CTL_INF("Engine " + ne + ", " + default_variant->variant + + " is already up-to-date! Version " + + latest_version.value().tag_name); + return cpp::fail("Engine " + ne + ", " + default_variant->variant + + " is already up-to-date! Version " + + latest_version.value().tag_name); } - } - if (latest_version_installed) { - CTL_INF("Engine " + ne + ", " + default_variant->variant + - " is already up-to-date! Version " + - latest_version.value().tag_name); - return cpp::fail("Engine " + ne + ", " + default_variant->variant + - " is already up-to-date! Version " + - latest_version.value().tag_name); - } + CTL_INF("Engine variant " + << default_variant->variant + << " is not up-to-date! Current: " << default_variant->version + << ", latest: " << latest_version->name); - CTL_INF("Engine variant " - << default_variant->variant << " is not up-to-date! Current: " - << default_variant->version << ", latest: " << latest_version->name); + auto res = InstallEngineAsync(engine, latest_version->tag_name, + default_variant->variant); - auto res = InstallEngineAsync(engine, latest_version->tag_name, - default_variant->variant); + return EngineUpdateResult{.engine = engine, + .variant = default_variant->variant, + .from = default_variant->version, + .to = latest_version->tag_name}; + } - return EngineUpdateResult{.engine = engine, - .variant = default_variant->variant, - .from = default_variant->version, - .to = latest_version->tag_name}; -} + cpp::result, std::string> + EngineService::GetEngines() { + cortex::db::Engines engines; + auto get_res = engines.GetEngines(); -cpp::result, std::string> -EngineService::GetEngines() { - cortex::db::Engines engines; - auto get_res = engines.GetEngines(); + if (!get_res.has_value()) { + return cpp::fail("Failed to get engine entries"); + } - if (!get_res.has_value()) { - return cpp::fail("Failed to get engine entries"); + return get_res.value(); } - return get_res.value(); -} + cpp::result + EngineService::GetEngineById(int id) { + cortex::db::Engines engines; + auto get_res = engines.GetEngineById(id); -cpp::result EngineService::GetEngineById( - int id) { - cortex::db::Engines engines; - auto get_res = engines.GetEngineById(id); + if (!get_res.has_value()) { + return cpp::fail("Engine with ID " + std::to_string(id) + " not found"); + } - if (!get_res.has_value()) { - return cpp::fail("Engine with ID " + std::to_string(id) + " not found"); + return get_res.value(); } - return get_res.value(); -} + cpp::result + EngineService::GetEngineByNameAndVariant( + const std::string& engine_name, + const std::optional variant) { + + cortex::db::Engines engines; + auto get_res = engines.GetEngineByNameAndVariant(engine_name, variant); -cpp::result -EngineService::GetEngineByNameAndVariant( - const std::string& engine_name, const std::optional variant) { + if (!get_res.has_value()) { + if (variant.has_value()) { + return cpp::fail("Variant " + variant.value() + + " not found for engine " + engine_name); + } else { + return cpp::fail("Engine " + engine_name + " not found"); + } + } - cortex::db::Engines engines; - auto get_res = engines.GetEngineByNameAndVariant(engine_name, variant); + return get_res.value(); + } - if (!get_res.has_value()) { - if (variant.has_value()) { - return cpp::fail("Variant " + variant.value() + " not found for engine " + - engine_name); + cpp::result EngineService::UpsertEngine( + const std::string& engine_name, const std::string& type, + const std::string& api_key, const std::string& url, + const std::string& version, const std::string& variant, + const std::string& status, const std::string& metadata) { + cortex::db::Engines engines; + auto upsert_res = engines.UpsertEngine(engine_name, type, api_key, url, + version, variant, status, metadata); + if (upsert_res.has_value()) { + return upsert_res.value(); } else { - return cpp::fail("Engine " + engine_name + " not found"); + return cpp::fail("Failed to upsert engine entry"); } } - return get_res.value(); -} - -cpp::result EngineService::UpsertEngine( - const std::string& engine_name, const std::string& type, - const std::string& api_key, const std::string& url, - const std::string& version, const std::string& variant, - const std::string& status, const std::string& metadata) { - cortex::db::Engines engines; - auto upsert_res = engines.UpsertEngine(engine_name, type, api_key, url, - version, variant, status, metadata); - if (upsert_res.has_value()) { - return upsert_res.value(); - } else { - return cpp::fail("Failed to upsert engine entry"); + std::string EngineService::DeleteEngine(int id) { + cortex::db::Engines engines; + auto delete_res = engines.DeleteEngineById(id); + if (delete_res.has_value()) { + return delete_res.value(); + } else { + return ""; + } } -} -std::string EngineService::DeleteEngine(int id) { - cortex::db::Engines engines; - auto delete_res = engines.DeleteEngineById(id); - if (delete_res.has_value()) { - return delete_res.value(); - } else { - return ""; - } -} + cpp::result EngineService::GetRemoteModels( + const std::string& engine_name) { + std::lock_guard lock(engines_mutex_); + if (auto r = IsEngineReady(engine_name); r.has_error()) { + return cpp::fail(r.error()); + } -cpp::result EngineService::GetRemoteModels( - const std::string& engine_name) { - std::lock_guard lock(engines_mutex_); - if (auto r = IsEngineReady(engine_name); r.has_error()) { - return cpp::fail(r.error()); - } + if (!IsEngineLoaded(engine_name)) { + auto exist_engine = GetEngineByNameAndVariant(engine_name); + if (exist_engine.has_error()) { + return cpp::fail("Remote engine '" + engine_name + + "' is not installed"); + } + if (engine_name == kOpenAiEngine) { + engines_[engine_name].engine = new remote_engine::OpenAiEngine(); + } else { + engines_[engine_name].engine = new remote_engine::AnthropicEngine(); + } - if (!IsEngineLoaded(engine_name)) { - auto exist_engine = GetEngineByNameAndVariant(engine_name); - if (exist_engine.has_error()) { - return cpp::fail("Remote engine '" + engine_name + "' is not installed"); + CTL_INF("Loaded engine: " << engine_name); } - if (engine_name == kOpenAiEngine) { - engines_[engine_name].engine = new remote_engine::OpenAiEngine(); + auto& e = std::get(engines_[engine_name].engine); + auto res = e->GetRemoteModels(); + if (!res["error"].isNull()) { + return cpp::fail(res["error"].asString()); } else { - engines_[engine_name].engine = new remote_engine::AnthropicEngine(); + return res; } - - CTL_INF("Loaded engine: " << engine_name); } - auto& e = std::get(engines_[engine_name].engine); - auto res = e->GetRemoteModels(); - if (!res["error"].isNull()) { - return cpp::fail(res["error"].asString()); - } else { - return res; + + cpp::result, std::string> + EngineService::GetSupportedEngineNames() { + return file_manager_utils::GetCortexConfig().supportedEngines; } -} \ No newline at end of file diff --git a/engine/services/engine_service.h b/engine/services/engine_service.h index ab274825d..2aa305bbc 100644 --- a/engine/services/engine_service.h +++ b/engine/services/engine_service.h @@ -75,6 +75,9 @@ class EngineService : public EngineServiceI { .cuda_driver_version = system_info_utils::GetDriverAndCudaVersion().second} {} + // just for initialize supported engines + EngineService() {}; + std::vector GetEngineInfoList() const; /** @@ -148,6 +151,9 @@ class EngineService : public EngineServiceI { cpp::result GetRemoteModels( const std::string& engine_name); + cpp::result, std::string> GetSupportedEngineNames(); + + void RegisterEngineLibPath(); private: bool IsEngineLoaded(const std::string& engine); @@ -162,7 +168,9 @@ class EngineService : public EngineServiceI { std::string GetMatchedVariant(const std::string& engine, const std::vector& variants); + cpp::result, std::string> + GetEngineDirPath(const std::string& engine_name); + cpp::result IsEngineVariantReady( const std::string& engine, const std::string& version, const std::string& variant); -}; \ No newline at end of file diff --git a/engine/services/hardware_service.cc b/engine/services/hardware_service.cc index 681ca7578..a5890eab9 100644 --- a/engine/services/hardware_service.cc +++ b/engine/services/hardware_service.cc @@ -5,11 +5,11 @@ #if defined(_WIN32) || defined(_WIN64) #include #include +#include "utils/widechar_conv.h" #endif #include "cli/commands/cortex_upd_cmd.h" #include "database/hardware.h" #include "utils/cortex_utils.h" -#include "utils/widechar_conv.h" namespace services { diff --git a/engine/utils/config_yaml_utils.cc b/engine/utils/config_yaml_utils.cc index ed6437256..c7a696df4 100644 --- a/engine/utils/config_yaml_utils.cc +++ b/engine/utils/config_yaml_utils.cc @@ -49,6 +49,7 @@ cpp::result CortexConfigMgr::DumpYamlConfig( node["verifyHostSsl"] = config.verifyHostSsl; node["sslCertPath"] = config.sslCertPath; node["sslKeyPath"] = config.sslKeyPath; + node["supportedEngines"] = config.supportedEngines; out_file << node; out_file.close(); diff --git a/engine/utils/config_yaml_utils.h b/engine/utils/config_yaml_utils.h index d36cc48e0..07f415894 100644 --- a/engine/utils/config_yaml_utils.h +++ b/engine/utils/config_yaml_utils.h @@ -3,6 +3,8 @@ #include #include #include +#include "utils/engine_constants.h" +#include "utils/logging_utils.h" #include "utils/result.hpp" namespace config_yaml_utils { @@ -18,6 +20,8 @@ constexpr const auto kDefaultCorsEnabled = true; const std::vector kDefaultEnabledOrigins{ "http://localhost:39281", "http://127.0.0.1:39281", "http://0.0.0.0:39281"}; constexpr const auto kDefaultNoProxy = "example.com,::1,localhost,127.0.0.1"; +const std::vector kDefaultSupportedEngines{ + kLlamaEngine, kOnnxEngine, kTrtLlmEngine}; struct CortexConfig { std::string logFolderPath; @@ -57,6 +61,7 @@ struct CortexConfig { bool verifyHostSsl; std::string sslCertPath; std::string sslKeyPath; + std::vector supportedEngines; }; class CortexConfigMgr { @@ -80,5 +85,4 @@ class CortexConfigMgr { CortexConfig FromYaml(const std::string& path, const CortexConfig& default_cfg); }; - } // namespace config_yaml_utils diff --git a/engine/utils/file_manager_utils.cc b/engine/utils/file_manager_utils.cc index ca3d0c07b..338abadac 100644 --- a/engine/utils/file_manager_utils.cc +++ b/engine/utils/file_manager_utils.cc @@ -187,6 +187,7 @@ config_yaml_utils::CortexConfig GetDefaultConfig() { .verifyHostSsl = true, .sslCertPath = "", .sslKeyPath = "", + .supportedEngines = config_yaml_utils::kDefaultSupportedEngines, }; }