@@ -43,8 +43,8 @@ struct SDCtxParams {
4343 std::string clip_g_path;
4444 std::string clip_vision_path;
4545 std::string t5xxl_path;
46- std::string qwen2vl_path ;
47- std::string qwen2vl_vision_path ;
46+ std::string llm_path ;
47+ std::string llm_vision_path ;
4848 std::string diffusion_model_path;
4949 std::string high_noise_diffusion_model_path;
5050 std::string vae_path;
@@ -505,8 +505,8 @@ void parse_args(int argc, const char** argv, SDParams& params) {
505505 {" " , " --clip_g" , " path to the clip-g text encoder" , &params.ctxParams .clip_g_path },
506506 {" " , " --clip_vision" , " path to the clip-vision encoder" , &params.ctxParams .clip_vision_path },
507507 {" " , " --t5xxl" , " path to the t5xxl text encoder" , &params.ctxParams .t5xxl_path },
508- {" " , " --qwen2vl " , " path to the qwen2vl text encoder" , &params.ctxParams .qwen2vl_path },
509- {" " , " --qwen2vl_vision " , " path to the qwen2vl vit" , &params.ctxParams .qwen2vl_vision_path },
508+ {" " , " --llm " , " path to the llm text encoder" , &params.ctxParams .llm_path },
509+ {" " , " --llm_vision " , " path to the llm vit" , &params.ctxParams .llm_vision_path },
510510 {" " , " --diffusion-model" , " path to the standalone diffusion model" , &params.ctxParams .diffusion_model_path },
511511 {" " , " --high-noise-diffusion-model" , " path to the standalone high noise diffusion model" , &params.ctxParams .high_noise_diffusion_model_path },
512512 {" " , " --vae" , " path to standalone vae model" , &params.ctxParams .vae_path },
@@ -1494,11 +1494,11 @@ bool parseJsonPrompt(std::string json_str, SDParams* params) {
14941494 {" tae" , [&](const json& o) -> bool {
14951495 return parse_model_part (o, params->tae_files , params->tae_dir , params->ctxParams .taesd_path );
14961496 }},
1497- {" qwen2vl " , [&](const json& o) -> bool {
1498- return parse_model_part (o, params->clip_files , params->clip_dir , params->ctxParams .qwen2vl_path );
1497+ {" llm " , [&](const json& o) -> bool {
1498+ return parse_model_part (o, params->clip_files , params->clip_dir , params->ctxParams .llm_path );
14991499 }},
1500- {" qwen2vl_vision " , [&](const json& o) -> bool {
1501- return parse_model_part (o, params->clip_vision_files , params->clip_vision_dir , params->ctxParams .qwen2vl_vision_path );
1500+ {" llm_vision " , [&](const json& o) -> bool {
1501+ return parse_model_part (o, params->clip_vision_files , params->clip_vision_dir , params->ctxParams .llm_vision_path );
15021502 }},
15031503 {" control_net" , [&](const json& o) -> bool {
15041504 return parse_model_part (o, params->controlnet_files , params->controlnet_dir , params->ctxParams .control_net_path );
@@ -1963,8 +1963,8 @@ nlohmann::json serv_generate_image(sd_ctx_t*& sd_ctx, SDParams& params, int& n_p
19631963 params.ctxParams .clip_g_path .c_str (),
19641964 params.ctxParams .clip_vision_path .c_str (),
19651965 params.ctxParams .t5xxl_path .c_str (),
1966- params.ctxParams .qwen2vl_path .c_str (),
1967- params.ctxParams .qwen2vl_vision_path .c_str (),
1966+ params.ctxParams .llm_path .c_str (),
1967+ params.ctxParams .llm_vision_path .c_str (),
19681968 params.ctxParams .diffusion_model_path .c_str (),
19691969 params.ctxParams .high_noise_diffusion_model_path .c_str (),
19701970 params.ctxParams .vae_path .c_str (),
@@ -2469,15 +2469,15 @@ void start_server(SDParams params) {
24692469 if (!params.ctxParams .t5xxl_path .empty ()) {
24702470 response[" t5xxl" ] = sd_basename (params.ctxParams .t5xxl_path );
24712471 }
2472- if (!params.ctxParams .qwen2vl_path .empty ()) {
2473- response[" qwen2vl " ] = sd_basename (params.ctxParams .qwen2vl_path );
2472+ if (!params.ctxParams .llm_path .empty ()) {
2473+ response[" llm " ] = sd_basename (params.ctxParams .llm_path );
24742474 }
24752475
24762476 if (!params.ctxParams .clip_vision_path .empty ()) {
24772477 response[" clip_vision" ] = sd_basename (params.ctxParams .clip_vision_path );
24782478 }
2479- if (!params.ctxParams .qwen2vl_vision_path .empty ()) {
2480- response[" qwen2vl_vision " ] = sd_basename (params.ctxParams .qwen2vl_vision_path );
2479+ if (!params.ctxParams .llm_vision_path .empty ()) {
2480+ response[" llm_vision " ] = sd_basename (params.ctxParams .llm_vision_path );
24812481 }
24822482
24832483 if (!params.ctxParams .vae_path .empty ()) {
0 commit comments