Handle ggml aborts

SkutteOleg · SkutteOleg · commit 70ad206cd2b5 · 2025-03-17T13:24:40.000+04:00
diff --git a/.gitignore b/.gitignore
@@ -10,4 +10,7 @@ test/
 *.gguf
 output*.png
 models*
-*.log
+*.log
+/cmake-build-debug
+/.idea
+/cmake-build-release
diff --git a/.gitmodules b/.gitmodules
@@ -1,3 +1,4 @@
 [submodule "ggml"]
     path = ggml
-	url = https://github.com/ggerganov/ggml.git
+        url = https://github.com/SkutteOleg/ggml.git
+        branch = dreamio
diff --git a/ggml b/ggml
@@ -1 +1 @@
-Subproject commit ff9052988b76e137bcf92bb335733933ca196ac0
+Subproject commit c3dec0049862a92d355f34bfbd0e67d35b16bc3c
diff --git a/stable-diffusion.cpp b/stable-diffusion.cpp
@@ -15,6 +15,7 @@
 #include "pmid.hpp"
 #include "tae.hpp"
 #include "vae.hpp"
+#include <setjmp.h>
 
 #define STB_IMAGE_IMPLEMENTATION
 #define STB_IMAGE_STATIC
@@ -1132,32 +1133,36 @@ SDError new_sd_ctx(sd_ctx_t** sd_ctx,
                    bool keep_control_net_cpu,
                    bool keep_vae_on_cpu,
                    bool diffusion_flash_attn) {
-    try {
-        *sd_ctx = (sd_ctx_t*)malloc(sizeof(sd_ctx_t));
-        if (*sd_ctx == NULL) {
-            return SD_ERROR_MEMORY_ALLOCATION;
-        }
-        std::string model_path(model_path_c_str);
-        std::string clip_l_path(clip_l_path_c_str);
-        std::string clip_g_path(clip_g_path_c_str);
-        std::string t5xxl_path(t5xxl_path_c_str);
-        std::string diffusion_model_path(diffusion_model_path_c_str);
-        std::string vae_path(vae_path_c_str);
-        std::string taesd_path(taesd_path_c_str);
-        std::string control_net_path(control_net_path_c_str);
-        std::string embd_path(embed_dir_c_str);
-        std::string id_embd_path(id_embed_dir_c_str);
-        std::string lora_model_dir(lora_model_dir_c_str);
-
-        (*sd_ctx)->sd = new StableDiffusionGGML(n_threads,
-                                                vae_decode_only,
-                                                free_params_immediately,
-                                                lora_model_dir,
-                                                rng_type);
-        if ((*sd_ctx)->sd == NULL) {
-            free(*sd_ctx);
-            return SD_ERROR_MEMORY_ALLOCATION;
-        }
+    ggml_error_jmp_set = 1;
+    if (setjmp(ggml_error_jmp_buf) == 0) {
+        try {
+            *sd_ctx = (sd_ctx_t*)malloc(sizeof(sd_ctx_t));
+            if (*sd_ctx == NULL) {
+                ggml_error_jmp_set = 0;
+                return SD_ERROR_MEMORY_ALLOCATION;
+            }
+            std::string model_path(model_path_c_str);
+            std::string clip_l_path(clip_l_path_c_str);
+            std::string clip_g_path(clip_g_path_c_str);
+            std::string t5xxl_path(t5xxl_path_c_str);
+            std::string diffusion_model_path(diffusion_model_path_c_str);
+            std::string vae_path(vae_path_c_str);
+            std::string taesd_path(taesd_path_c_str);
+            std::string control_net_path(control_net_path_c_str);
+            std::string embd_path(embed_dir_c_str);
+            std::string id_embd_path(id_embed_dir_c_str);
+            std::string lora_model_dir(lora_model_dir_c_str);
+
+            (*sd_ctx)->sd = new StableDiffusionGGML(n_threads,
+                                                    vae_decode_only,
+                                                    free_params_immediately,
+                                                    lora_model_dir,
+                                                    rng_type);
+            if ((*sd_ctx)->sd == NULL) {
+                free(*sd_ctx);
+                ggml_error_jmp_set = 0;
+                return SD_ERROR_MEMORY_ALLOCATION;
+            }
 
         if (!(*sd_ctx)->sd->load_from_file(model_path,
                                            clip_l_path,
@@ -1177,15 +1182,24 @@ SDError new_sd_ctx(sd_ctx_t** sd_ctx,
             diffusion_flash_attn)) {
         delete (*sd_ctx)->sd;
             free(*sd_ctx);
+            ggml_error_jmp_set = 0;
             return SD_ERROR_PROCESSING;
         }
 
-        return SD_SUCCESS;
-    } catch (const std::exception& e) {
-        LOG_ERROR("Exception in new_sd_ctx: %s", e.what());
-        return SD_ERROR_PROCESSING;
-    } catch (...) {
-        LOG_ERROR("Unknown exception in new_sd_ctx");
+            ggml_error_jmp_set = 0;
+            return SD_SUCCESS;
+        } catch (const std::exception& e) {
+            LOG_ERROR("Exception in new_sd_ctx: %s", e.what());
+            ggml_error_jmp_set = 0;
+            return SD_ERROR_PROCESSING;
+        } catch (...) {
+            LOG_ERROR("Unknown exception in new_sd_ctx");
+            ggml_error_jmp_set = 0;
+            return SD_ERROR_PROCESSING;
+        }
+    } else {
+        LOG_ERROR("GGML error in new_sd_ctx: %s", ggml_get_error_message());
+        ggml_error_jmp_set = 0;
         return SD_ERROR_PROCESSING;
     }
 }
@@ -1567,55 +1581,59 @@ SDError txt2img(sd_ctx_t* sd_ctx,
                 float skip_layer_end= 0.2) {
     std::vector<int> skip_layers_vec(skip_layers, skip_layers + skip_layers_count);
     struct ggml_context* work_ctx = NULL;
-    try {
-        LOG_DEBUG("txt2img %dx%d", width, height);
-        if (sd_ctx == NULL) {
-            return SD_ERROR_INVALID_CONTEXT;
-        }
-
-        struct ggml_init_params params;
-        params.mem_size = static_cast<size_t>(10 * 1024 * 1024);  // 10 MB
-        if (sd_version_is_sd3(sd_ctx->sd->version)) {
-            params.mem_size *= 3;
+    ggml_error_jmp_set = 1;
+    if (setjmp(ggml_error_jmp_buf) == 0) {
+        try {
+            LOG_DEBUG("txt2img %dx%d", width, height);
+            if (sd_ctx == NULL) {
+                ggml_error_jmp_set = 0;
+                return SD_ERROR_INVALID_CONTEXT;
+            }
+
+            struct ggml_init_params params;
+            params.mem_size = static_cast<size_t>(10 * 1024 * 1024);  // 10 MB
+            if (sd_version_is_sd3(sd_ctx->sd->version)) {
+                params.mem_size *= 3;
     }
     if (sd_version_is_flux(sd_ctx->sd->version)) {
         params.mem_size *= 4;
-        }
-        if (sd_ctx->sd->stacked_id) {
-            params.mem_size += static_cast<size_t>(10 * 1024 * 1024);  // 10 MB
-        }
-        params.mem_size += width * height * 3 * sizeof(float);
-        params.mem_size *= batch_count;
-        params.mem_buffer = NULL;
-        params.no_alloc   = false;
-        // LOG_DEBUG("mem_size %u ", params.mem_size);
+            }
+            if (sd_ctx->sd->stacked_id) {
+                params.mem_size += static_cast<size_t>(10 * 1024 * 1024);  // 10 MB
+            }
+            params.mem_size += width * height * 3 * sizeof(float);
+            params.mem_size *= batch_count;
+            params.mem_buffer = NULL;
+            params.no_alloc   = false;
+            // LOG_DEBUG("mem_size %u ", params.mem_size);
 
-        work_ctx = ggml_init(params);
-        if (!work_ctx) {
-            LOG_ERROR("ggml_init() failed");
-            return SD_ERROR_MEMORY_ALLOCATION;
-        }
+            work_ctx = ggml_init(params);
+            if (!work_ctx) {
+                LOG_ERROR("ggml_init() failed");
+                ggml_error_jmp_set = 0;
+                return SD_ERROR_MEMORY_ALLOCATION;
+            }
 
-        size_t t0 = ggml_time_ms();
+            size_t t0 = ggml_time_ms();
 
-        std::vector<float> sigmas = sd_ctx->sd->denoiser->get_sigmas(sample_steps);
+            std::vector<float> sigmas = sd_ctx->sd->denoiser->get_sigmas(sample_steps);
 
-        int C = 4;
-        if (sd_version_is_sd3(sd_ctx->sd->version)) {
+            int C = 4;
+            if (sd_version_is_sd3(sd_ctx->sd->version)) {
         C = 16;
     } else if (sd_version_is_flux(sd_ctx->sd->version)) {
-            C = 16;
-        }
-        int W                    = width / 8;
-        int H                    = height / 8;
-        ggml_tensor* init_latent = ggml_new_tensor_4d(work_ctx, GGML_TYPE_F32, W, H, C, 1);
-        if (sd_version_is_sd3(sd_ctx->sd->version)) {
-            ggml_set_f32(init_latent, 0.0609f);
+                C = 16;
+            }
+            int W                    = width / 8;
+            int H                    = height / 8;
+            ggml_tensor* init_latent = ggml_new_tensor_4d(work_ctx, GGML_TYPE_F32, W, H, C, 1);
+            if (sd_version_is_sd3(sd_ctx->sd->version)) {
+                ggml_set_f32(init_latent, 0.0609f);
     } else if (sd_version_is_flux(sd_ctx->sd->version)) {
         ggml_set_f32(init_latent, 0.1159f);
-        } else {
-            ggml_set_f32(init_latent, 0.f);
-        }
+            } else {
+                ggml_set_f32(init_latent, 0.f);
+            }
 
     if (sd_version_is_inpaint(sd_ctx->sd->version)) {
         LOG_WARN("This is an inpainting model, this should only be used in img2img mode with a mask");
@@ -1645,30 +1663,42 @@ SDError txt2img(sd_ctx_t* sd_ctx,
                                     skip_layer_start,
                                     skip_layer_end);
 
-        if (*result_images == NULL) {
-            ggml_free(work_ctx);
-            return SD_ERROR_PROCESSING;
-        }
+            if (*result_images == NULL) {
+                ggml_free(work_ctx);
+                ggml_error_jmp_set = 0;
+                return SD_ERROR_PROCESSING;
+            }
 
-        *result_count = batch_count;
+            *result_count = batch_count;
 
-        size_t t1 = ggml_time_ms();
+            size_t t1 = ggml_time_ms();
 
-        LOG_INFO("txt2img completed in %.2fs", (t1 - t0) * 1.0f / 1000);
+            LOG_INFO("txt2img completed in %.2fs", (t1 - t0) * 1.0f / 1000);
 
-        ggml_free(work_ctx);
-        return SD_SUCCESS;
-    } catch (const std::exception& e) {
-        LOG_ERROR("Exception in txt2img: %s", e.what());
-        if (work_ctx) {
             ggml_free(work_ctx);
+            ggml_error_jmp_set = 0;
+            return SD_SUCCESS;
+        } catch (const std::exception& e) {
+            LOG_ERROR("Exception in txt2img: %s", e.what());
+            if (work_ctx) {
+                ggml_free(work_ctx);
+            }
+            ggml_error_jmp_set = 0;
+            return SD_ERROR_PROCESSING;
+        } catch (...) {
+            LOG_ERROR("Unknown exception in txt2img");
+            if (work_ctx) {
+                ggml_free(work_ctx);
+            }
+            ggml_error_jmp_set = 0;
+            return SD_ERROR_PROCESSING;
         }
-        return SD_ERROR_PROCESSING;
-    } catch (...) {
-        LOG_ERROR("Unknown exception in txt2img");
+    } else {
+        LOG_ERROR("GGML error in txt2img: %s", ggml_get_error_message());
         if (work_ctx) {
             ggml_free(work_ctx);
         }
+        ggml_error_jmp_set = 0;
         return SD_ERROR_PROCESSING;
     }
 }