@@ -49,8 +49,7 @@ const char* sampling_methods_str[] = {
4949 " iPNDM_v" ,
5050 " LCM" ,
5151 " DDIM \" trailing\" " ,
52- " TCD"
53- };
52+ " TCD" };
5453
5554/* ================================================== Helper Functions ================================================*/
5655
@@ -683,7 +682,7 @@ class StableDiffusionGGML {
683682 float curr_multiplier = kv.second ;
684683 lora_state_diff[lora_name] -= curr_multiplier;
685684 }
686-
685+
687686 size_t rm = lora_state_diff.size () - lora_state.size ();
688687 if (rm != 0 ) {
689688 LOG_INFO (" Attempting to apply %lu LoRAs (removing %lu applied LoRAs)" , lora_state.size (), rm);
@@ -806,7 +805,6 @@ class StableDiffusionGGML {
806805 float skip_layer_start = 0.01 ,
807806 float skip_layer_end = 0.2 ,
808807 ggml_tensor* noise_mask = nullptr ) {
809-
810808 // TODO (Pix2Pix): separate image guidance params (right now it's reusing distilled guidance)
811809
812810 float img_cfg_scale = guidance;
@@ -834,7 +832,7 @@ class StableDiffusionGGML {
834832
835833 bool has_unconditioned = cfg_scale != 1.0 && uncond.c_crossattn != NULL ;
836834 bool has_img_guidance = version == VERSION_INSTRUCT_PIX2PIX && cfg_scale != img_cfg_scale;
837- has_unconditioned = has_unconditioned || has_img_guidance;
835+ has_unconditioned = has_unconditioned || has_img_guidance;
838836 bool has_skiplayer = slg_scale != 0.0 && skip_layers.size () > 0 ;
839837
840838 // denoise wrapper
@@ -988,7 +986,7 @@ class StableDiffusionGGML {
988986 int64_t i3 = i / out_cond->ne [0 ] * out_cond->ne [1 ] * out_cond->ne [2 ];
989987 float scale = min_cfg + (cfg_scale - min_cfg) * (i3 * 1 .0f / ne3);
990988 } else {
991- if (has_img_guidance){
989+ if (has_img_guidance) {
992990 latent_result = negative_data[i] + img_cfg_scale * (img_cond_data[i] - negative_data[i]) + cfg_scale * (positive_data[i] - img_cond_data[i]);
993991 } else {
994992 latent_result = negative_data[i] + cfg_scale * (positive_data[i] - negative_data[i]);
@@ -1553,7 +1551,7 @@ sd_image_t* generate_image(sd_ctx_t* sd_ctx,
15531551 result_images[i].width = width;
15541552 result_images[i].height = height;
15551553 result_images[i].channel = 3 ;
1556- result_images[i].data = sd_tensor_to_image (decoded_images[i]);
1554+ result_images[i].data = sd_tensor_to_image (decoded_images[i], sd_ctx-> sd -> version == VERSION_INSTRUCT_PIX2PIX );
15571555 }
15581556 ggml_free (work_ctx);
15591557
@@ -1737,7 +1735,7 @@ sd_image_t* img2img(sd_ctx_t* sd_ctx,
17371735
17381736 sd_mask_to_tensor (mask.data , mask_img);
17391737
1740- sd_image_to_tensor (init_image.data , init_img);
1738+ sd_image_to_tensor (init_image.data , init_img, true , sd_ctx-> sd -> version == VERSION_INSTRUCT_PIX2PIX );
17411739
17421740 ggml_tensor* masked_image;
17431741
0 commit comments