refactor: lora loading (add .gguf lookup, direct-path loading, and adapter apply/clear API)

thxCode · thxCode · commit 4e753946fe8a · 2024-11-15T17:07:46.000+08:00
Signed-off-by: thxCode <thxcode0824@gmail.com>
diff --git a/stable-diffusion.cpp b/stable-diffusion.cpp
@@ -642,18 +642,27 @@ class StableDiffusionGGML {
     }
 
     void apply_lora(const std::string& lora_name, float multiplier) {
-        int64_t t0                 = ggml_time_ms();
-        std::string st_file_path   = path_join(lora_model_dir, lora_name + ".safetensors");
-        std::string ckpt_file_path = path_join(lora_model_dir, lora_name + ".ckpt");
+        int64_t t0 = ggml_time_ms();
+
         std::string file_path;
-        if (file_exists(st_file_path)) {
-            file_path = st_file_path;
-        } else if (file_exists(ckpt_file_path)) {
-            file_path = ckpt_file_path;
+        if (!lora_model_dir.empty()) {
+            std::string st_file_path   = path_join(lora_model_dir, lora_name + ".safetensors");
+            std::string ckpt_file_path = path_join(lora_model_dir, lora_name + ".ckpt");
+            std::string gguf_file_path = path_join(lora_model_dir, lora_name + ".gguf");
+            if (file_exists(st_file_path)) {
+                file_path = st_file_path;
+            } else if (file_exists(ckpt_file_path)) {
+                file_path = ckpt_file_path;
+            } else if (file_exists(gguf_file_path)) {
+                file_path = gguf_file_path;
+            } else {
+                LOG_WARN("can not find %s, %s, %s for lora %s", st_file_path.c_str(), ckpt_file_path.c_str(), gguf_file_path.c_str(), lora_name.c_str());
+                return;
+            }
         } else {
-            LOG_WARN("can not find %s or %s for lora %s", st_file_path.c_str(), ckpt_file_path.c_str(), lora_name.c_str());
-            return;
+            file_path = lora_name;
         }
+
         LoraModel lora(backend, model_wtype, file_path);
         if (!lora.load_from_file()) {
             LOG_WARN("load lora tensors from %s failed", file_path.c_str());
@@ -673,6 +682,7 @@ class StableDiffusionGGML {
         if (!lora_state.empty() && model_wtype != GGML_TYPE_F16 && model_wtype != GGML_TYPE_F32) {
             LOG_WARN("In quantized models when applying LoRA, the images have poor quality.");
         }
+
         std::unordered_map<std::string, float> lora_state_diff;
         for (auto& kv : lora_state) {
             const std::string& lora_name = kv.first;
@@ -690,11 +700,9 @@ class StableDiffusionGGML {
         }
 
         LOG_INFO("Attempting to apply %lu LoRAs", lora_state.size());
-
         for (auto& kv : lora_state_diff) {
             apply_lora(kv.first, kv.second);
         }
-
         curr_lora_state = lora_state;
     }
 
@@ -980,8 +988,6 @@ class StableDiffusionGGML {
                 case VERSION_SD3_MEDIUM:
                 case VERSION_SD3_5_MEDIUM:
                 case VERSION_SD3_5_LARGE:
-                    C = 32;
-                    break;
                 case VERSION_FLUX_DEV:
                 case VERSION_FLUX_SCHNELL:
                     C = 32;
@@ -1163,20 +1169,23 @@ sd_image_t* generate_image(sd_ctx_t* sd_ctx,
     int sample_steps = sigmas.size() - 1;
 
     // Apply lora
-    auto result_pair                                = extract_and_remove_lora(prompt);
-    std::unordered_map<std::string, float> lora_f2m = result_pair.first;  // lora_name -> multiplier
+    int64_t t0, t1;
+    if (!sd_ctx->sd->lora_model_dir.empty()) {
+        auto result_pair                                = extract_and_remove_lora(prompt);
+        std::unordered_map<std::string, float> lora_f2m = result_pair.first;  // lora_name -> multiplier
 
-    for (auto& kv : lora_f2m) {
-        LOG_DEBUG("lora %s:%.2f", kv.first.c_str(), kv.second);
-    }
+        for (auto& kv : lora_f2m) {
+            LOG_DEBUG("lora %s:%.2f", kv.first.c_str(), kv.second);
+        }
 
-    prompt = result_pair.second;
-    LOG_DEBUG("prompt after extract and remove lora: \"%s\"", prompt.c_str());
+        prompt = result_pair.second;
+        LOG_DEBUG("prompt after extract and remove lora: \"%s\"", prompt.c_str());
 
-    int64_t t0 = ggml_time_ms();
-    sd_ctx->sd->apply_loras(lora_f2m);
-    int64_t t1 = ggml_time_ms();
-    LOG_INFO("apply_loras completed, taking %.2fs", (t1 - t0) * 1.0f / 1000);
+        t0 = ggml_time_ms();
+        sd_ctx->sd->apply_loras(lora_f2m);
+        t1 = ggml_time_ms();
+        LOG_INFO("apply_loras completed, taking %.2fs", (t1 - t0) * 1.0f / 1000);
+    }
 
     // Photo Maker
     std::string prompt_text_only;
@@ -1630,6 +1639,41 @@ sd_image_t* img2img(sd_ctx_t* sd_ctx,
     return result_images;
 }
 
+// Forgets which LoRA adapters (and multipliers) are recorded as applied.
+// Does nothing when sd_ctx is NULL.
+// NOTE(review): only the bookkeeping map is cleared here; nothing in this
+// function touches model weights — confirm callers do not expect a revert.
+void sd_lora_adapters_clear(sd_ctx_t* sd_ctx) {
+    if (sd_ctx == NULL) {
+        return;
+    }
+    sd_ctx->sd->curr_lora_state.clear();
+}
+
+// Resets the recorded LoRA state, then applies every entry of lora_adapters.
+// Each adapter's path becomes the LoRA name handed to apply_loras and its
+// multiplier is passed through as the mapped value. Does nothing when sd_ctx
+// is NULL. If the same path appears more than once, the last multiplier wins.
+void sd_lora_adapters_apply(sd_ctx_t* sd_ctx, std::vector<sd_lora_adapter_container_t>& lora_adapters) {
+    if (sd_ctx == NULL) {
+        return;
+    }
+
+    sd_lora_adapters_clear(sd_ctx);
+
+    std::unordered_map<std::string, float> lora_state;
+    for (const sd_lora_adapter_container_t& lora_adapter : lora_adapters) {
+        // Building a std::string from a null pointer is undefined behavior,
+        // so entries without a path are skipped instead of being used as keys.
+        if (lora_adapter.path == NULL) {
+            LOG_WARN("skip lora adapter without path");
+            continue;
+        }
+        lora_state[lora_adapter.path] = lora_adapter.multiplier;
+    }
+    sd_ctx->sd->apply_loras(lora_state);
+}
+
 int sd_get_version(sd_ctx_t* sd_ctx) {
     if (sd_ctx == NULL) {
         return VERSION_COUNT;
diff --git a/stable-diffusion.h b/stable-diffusion.h
@@ -183,6 +183,13 @@ SD_API sd_image_t* img2img(sd_ctx_t* sd_ctx,
                            bool normalize_input,
                            const char* input_id_images_path);
 
+typedef struct sd_lora_adapter_container_t {  // one LoRA adapter entry consumed by sd_lora_adapters_apply
+    const char* path;  // LoRA name: looked up under lora_model_dir when that is set, otherwise used as the file path itself; must not be NULL
+    float multiplier;  // value stored for this adapter in the LoRA state map handed to apply_loras
+} sd_lora_adapter_container_t;
+
+SD_API void sd_lora_adapters_clear(sd_ctx_t* sd_ctx);  // clears the recorded LoRA state; no-op when sd_ctx is NULL
+SD_API void sd_lora_adapters_apply(sd_ctx_t* sd_ctx, std::vector<sd_lora_adapter_container_t>& lora_adapters);  // NOTE(review): std::vector makes this declaration C++-only — confirm this header is never included from C
 SD_API int sd_get_version(sd_ctx_t* sd_ctx);
 SD_API sample_method_t sd_get_default_sample_method(sd_ctx_t* sd_ctx);
 SD_API int sd_get_default_sample_steps(sd_ctx_t* sd_ctx);