thxCode
diff --git a/conditioner.hpp b/conditioner.hpp
Lines changed: 3 additions & 3 deletions
diff --git a/examples/convert/main.cpp b/examples/convert/main.cpp
Lines changed: 72 additions & 22 deletions
diff --git a/lora.hpp b/lora.hpp
Lines changed: 1 addition & 1 deletion
@@ -60,10 +60,10 @@ struct FrozenCLIPEmbedderWithCustomWords : public Conditioner {
     FrozenCLIPEmbedderWithCustomWords(ggml_backend_t backend,
                                       ggml_type wtype,
                                       const std::string& embd_dir,
-                                      SDVersion version = VERSION_SD1,
+                                      SDVersion version                = VERSION_SD1,
                                       bool compvis_compatiblity_clip_l = false,
                                       bool compvis_compatiblity_clip_g = false,
-                                      int clip_skip     = -1)
+                                      int clip_skip                    = -1)
         : version(version),
           tokenizer(version == VERSION_SD2 ? 0 : 49407),
           embd_dir(embd_dir),
@@ -166,7 +166,7 @@ struct FrozenCLIPEmbedderWithCustomWords : public Conditioner {
         } else {
             hidden_size = text_model2->model.hidden_size;
         }
-        auto on_load = [&](const TensorStorage& tensor_storage, ggml_tensor** dst_tensor) {
+        auto on_load = [&](const TensorStorage& tensor_storage, const SDVersion ver, ggml_tensor** dst_tensor) {
             if (tensor_storage.ne[0] != hidden_size) {
                 LOG_DEBUG("embedding wrong hidden size, got %i, expected %i", tensor_storage.ne[0], hidden_size);
                 return false;
 
@@ -34,9 +34,11 @@ struct convert_params {
     std::string clip_g_model_file_path;
     std::string t5xxl_model_file_path;
     std::string output_file_path;
-    ggml_type vae_output_type  = GGML_TYPE_COUNT;
-    ggml_type clip_output_type = GGML_TYPE_COUNT;
-    ggml_type output_type      = GGML_TYPE_F16;
+    ggml_type vae_output_type    = GGML_TYPE_COUNT;
+    ggml_type clip_l_output_type = GGML_TYPE_COUNT;
+    ggml_type clip_g_output_type = GGML_TYPE_COUNT;
+    ggml_type t5xxl_output_type  = GGML_TYPE_COUNT;
+    ggml_type output_type        = GGML_TYPE_F16;
 };
 
 static void convert_params_print_usage(int, char** argv, const convert_params& params) {
@@ -51,7 +53,9 @@ static void convert_params_print_usage(int, char** argv, const convert_params& p
     printf("  --t5xxl-model                      path to t5xxl model file\n");
     printf("  --outfile                          path to write to\n");
     printf("  --vae-outtype                      output format of vae model, reuse --outtype if not specified\n");
-    printf("  --clip-outtype                     output format of clip_l/clip_g/t5xxl model, reuse --outtype if not specified\n");
+    printf("  --clip-l-outtype                   output format of clip_l model, reuse --outtype if not specified\n");
+    printf("  --clip-g-outtype                   output format of clip_g model, reuse --outtype if not specified\n");
+    printf("  --t5xxl-outtype                    output format of t5xxl model, reuse --outtype if not specified\n");
     printf("  --outtype                          output format, select from fp32;fp16;q8_0;q5_1;q5_0;q4_1;q4_0;q4_k;q3_k;q2_k\n");
 }
 
@@ -157,14 +161,38 @@ static bool convert_params_parse(int argc, char** argv, convert_params& params)
                 continue;
             }
 
-            if (!strcmp(flag, "--clip-outtype")) {
+            if (!strcmp(flag, "--clip-l-outtype")) {
                 if (i == argc) {
-                    missing("--clip-outtype");
+                    missing("--clip-l-outtype");
                 }
-                const char* outtype     = argv[i++];
-                params.clip_output_type = convert_str_to_ggml_type(outtype);
-                if (params.clip_output_type >= GGML_TYPE_COUNT) {
-                    invalid("--clip-outtype");
+                const char* outtype       = argv[i++];
+                params.clip_l_output_type = convert_str_to_ggml_type(outtype);
+                if (params.clip_l_output_type >= GGML_TYPE_COUNT) {
+                    invalid("--clip-l-outtype");
+                }
+                continue;
+            }
+
+            if (!strcmp(flag, "--clip-g-outtype")) {
+                if (i == argc) {
+                    missing("--clip-g-outtype");
+                }
+                const char* outtype       = argv[i++];
+                params.clip_g_output_type = convert_str_to_ggml_type(outtype);
+                if (params.clip_g_output_type >= GGML_TYPE_COUNT) {
+                    invalid("--clip-g-outtype");
+                }
+                continue;
+            }
+
+            if (!strcmp(flag, "--t5xxl-outtype")) {
+                if (i == argc) {
+                    missing("--t5xxl-outtype");
+                }
+                const char* outtype      = argv[i++];
+                params.t5xxl_output_type = convert_str_to_ggml_type(outtype);
+                if (params.t5xxl_output_type >= GGML_TYPE_COUNT) {
+                    invalid("--t5xxl-outtype");
                 }
                 continue;
             }
@@ -252,7 +280,7 @@ int convert_sd3(const convert_params& params, const SDVersion ver) {
     bool loaded = false;
 
     if (params.clip_l_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_output_type, "te.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_l_output_type, "te.");
     } else {
         loaded = loader.init_from_file(params.clip_l_model_file_path, "te.");
     }
@@ -262,7 +290,7 @@ int convert_sd3(const convert_params& params, const SDVersion ver) {
     }
 
     if (params.clip_g_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.clip_output_type, "te1.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.clip_g_output_type, "te1.");
     } else {
         loaded = loader.init_from_file(params.clip_g_model_file_path, "te1.");
     }
@@ -272,7 +300,7 @@ int convert_sd3(const convert_params& params, const SDVersion ver) {
     }
 
     if (params.t5xxl_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_3/model", params.clip_output_type, "te2.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_3/model", params.t5xxl_output_type, "te2.");
     } else {
         loaded = loader.init_from_file(params.t5xxl_model_file_path, "te2.");
     }
@@ -308,15 +336,20 @@ int convert_sd3(const convert_params& params, const SDVersion ver) {
         return 1;
     }
 
-    return !loader.save_to_gguf_file(params.output_file_path, params.output_type, params.vae_output_type, params.clip_output_type);
+    return !loader.save_to_gguf_file(params.output_file_path,
+                                     params.output_type,
+                                     params.vae_output_type,
+                                     params.clip_l_output_type,
+                                     params.clip_g_output_type,
+                                     params.t5xxl_output_type);
 }
 
 int convert_flux(const convert_params& params, const SDVersion ver) {
     ModelLoader loader;
     bool loaded = false;
 
     if (params.clip_l_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_output_type, "te.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_l_output_type, "te.");
     } else {
         loaded = loader.init_from_file(params.clip_l_model_file_path, "te.");
     }
@@ -326,7 +359,7 @@ int convert_flux(const convert_params& params, const SDVersion ver) {
     }
 
     if (params.t5xxl_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.clip_output_type, "te1.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.t5xxl_output_type, "te1.");
     } else {
         loaded = loader.init_from_file(params.t5xxl_model_file_path, "te1.");
     }
@@ -366,7 +399,12 @@ int convert_flux(const convert_params& params, const SDVersion ver) {
         return 1;
     }
 
-    return !loader.save_to_gguf_file(params.output_file_path, params.output_type, params.vae_output_type, params.clip_output_type);
+    return !loader.save_to_gguf_file(params.output_file_path,
+                                     params.output_type,
+                                     params.vae_output_type,
+                                     params.clip_l_output_type,
+                                     params.clip_g_output_type,
+                                     params.t5xxl_output_type);
 }
 
 int convert_sdxl(const convert_params& params, const SDVersion ver) {
@@ -375,7 +413,9 @@ int convert_sdxl(const convert_params& params, const SDVersion ver) {
 
     if (params.clip_l_model_file_path.empty()) {
         if (is_directory(path_join(params.model_path, "text_encoder"))) {
-            loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_output_type, "te.");
+            loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_l_output_type, "te.");
+        } else {
+            loaded = true;
         }
     } else {
         loaded = loader.init_from_file(params.clip_l_model_file_path, "te.");
@@ -386,7 +426,7 @@ int convert_sdxl(const convert_params& params, const SDVersion ver) {
     }
 
     if (params.clip_g_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.clip_output_type, "te1.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder_2/model", params.clip_g_output_type, "te1.");
     } else {
         loaded = loader.init_from_file(params.clip_g_model_file_path, "te1.");
     }
@@ -422,15 +462,20 @@ int convert_sdxl(const convert_params& params, const SDVersion ver) {
         return 1;
     }
 
-    return !loader.save_to_gguf_file(params.output_file_path, params.output_type, params.vae_output_type, params.clip_output_type);
+    return !loader.save_to_gguf_file(params.output_file_path,
+                                     params.output_type,
+                                     params.vae_output_type,
+                                     params.clip_l_output_type,
+                                     params.clip_g_output_type,
+                                     params.t5xxl_output_type);
 }
 
 int convert_sd(const convert_params& params, const SDVersion ver) {
     ModelLoader loader;
     bool loaded = false;
 
     if (params.clip_l_model_file_path.empty()) {
-        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_output_type, "te.");
+        loaded = loader.init_from_safetensors_file(params.model_path, "text_encoder/model", params.clip_l_output_type, "te.");
     } else {
         loaded = loader.init_from_file(params.clip_l_model_file_path, "te.");
     }
@@ -466,7 +511,12 @@ int convert_sd(const convert_params& params, const SDVersion ver) {
         return 1;
     }
 
-    return !loader.save_to_gguf_file(params.output_file_path, params.output_type, params.vae_output_type, params.clip_output_type);
+    return !loader.save_to_gguf_file(params.output_file_path,
+                                     params.output_type,
+                                     params.vae_output_type,
+                                     params.clip_l_output_type,
+                                     params.clip_g_output_type,
+                                     params.t5xxl_output_type);
 }
 
 int convert_file(const convert_params& params) {
 
@@ -38,7 +38,7 @@ struct LoraModel : public GGMLRunner {
         }
 
         bool dry_run          = true;
-        auto on_new_tensor_cb = [&](const TensorStorage& tensor_storage, ggml_tensor** dst_tensor) -> bool {
+        auto on_new_tensor_cb = [&](const TensorStorage& tensor_storage, const SDVersion ver, ggml_tensor** dst_tensor) -> bool {
             const std::string& name = tensor_storage.name;
 
             if (filter_tensor && !contains(name, "lora")) {
Original file line number	Diff line number	Diff line change
`@@ -38,7 +38,7 @@ struct LoraModel : public GGMLRunner {`
`38`	`38`	`}`
`39`	`39`
`40`	`40`	`bool dry_run = true;`
`41`		`- auto on_new_tensor_cb = [&](const TensorStorage& tensor_storage, ggml_tensor** dst_tensor) -> bool {`
	`41`	`+ auto on_new_tensor_cb = [&](const TensorStorage& tensor_storage, const SDVersion ver, ggml_tensor** dst_tensor) -> bool {`
`42`	`42`	`const std::string& name = tensor_storage.name;`
`43`	`43`
`44`	`44`	`if (filter_tensor && !contains(name, "lora")) {`