# Patch summary (free-form preamble; patch tools skip text before the first "diff --git" header).
#
# Purpose: refuse to initialise a local embedding model when the model file, scaled by 1.15,
# is larger than the memory currently reported as free.
#
# include/system_metrics.h
#   - Adds static uint64_t get_memory_free_bytes(), which returns
#     get_memory_total_bytes() - get_memory_used_bytes().
#   - The file has no trailing newline (see the "\ No newline at end of file" marker).
#
# src/text_embedder_manager.cpp
#   - Adds #include "system_metrics.h".
#   - In TextEmbedderManager::validate_and_init_local_model, before the embedder is constructed:
#       * hoists get_model_name_without_namespace(model_name) into a local,
#       * reads SystemMetrics::get_memory_free_bytes() and std::filesystem::file_size(abs_path),
#       * if model_file_size * 1.15 > free_memory, logs at ERROR level and returns an Option
#         built from code 400 and the same message text,
#       * otherwise constructs the embedder from the hoisted name and continues to validate().
#   - 1.15 is a double literal, so the comparison is evaluated in floating point.
#
# NOTE(review): the subtraction in get_memory_free_bytes() is unsigned; if used ever exceeded
#   total the result would wrap to a huge value and the guard would never fire. Confirm the two
#   helpers guarantee used <= total.
# NOTE(review): file_size(abs_path) is called without a std::error_code argument; that overload
#   throws std::filesystem::filesystem_error on failure. abs_path is defined outside this hunk,
#   so confirm it is known to exist before this point.
# NOTE(review): 400 is returned for a condition that depends on host memory rather than on the
#   request; confirm this status code is intended.
# NOTE(review): this copy of the patch looks lossy. Line breaks and indentation are collapsed, and
#   template arguments appear to be missing ("Option(...)", "std::shared_ptr&",
#   "std::make_shared("). Verify against the original commit before applying.
diff --git a/include/system_metrics.h b/include/system_metrics.h index 678ae4f9..94363afa 100644 --- a/include/system_metrics.h +++ b/include/system_metrics.h @@ -173,4 +173,8 @@ public: // compute return compute_cpu_stats(cpu_data_prev, cpu_data_now); } + + static uint64_t get_memory_free_bytes() { + return get_memory_total_bytes() - get_memory_used_bytes(); + } }; \ No newline at end of file diff --git a/src/text_embedder_manager.cpp b/src/text_embedder_manager.cpp index 89400a79..baa99ebf 100644 --- a/src/text_embedder_manager.cpp +++ b/src/text_embedder_manager.cpp @@ -1,4 +1,5 @@ #include "text_embedder_manager.h" +#include "system_metrics.h" TextEmbedderManager& TextEmbedderManager::get_instance() { @@ -107,8 +108,17 @@ Option TextEmbedderManager::validate_and_init_local_model(const nlohmann:: return Option(true); } - const std::shared_ptr& embedder = std::make_shared( - get_model_name_without_namespace(model_name)); + const auto& model_name_without_namespace = get_model_name_without_namespace(model_name); + const auto& free_memory = SystemMetrics::get_memory_free_bytes(); + const auto& model_file_size = std::filesystem::file_size(abs_path); + + // return error if (model file size * 1.15) is greater than free memory + if(model_file_size * 1.15 > free_memory) { + LOG(ERROR) << "Memory required to load the model exceeds free memory available."; + return Option(400, "Memory required to load the model exceeds free memory available."); + } + + const std::shared_ptr& embedder = std::make_shared(model_name_without_namespace); auto validate_op = embedder->validate(); if(!validate_op.ok()) {