@@ -1106,8 +1106,8 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa
11061106 params.fused_mmad = false ;
11071107 return true ;
11081108 }
1109- if (arg == " -rcache" || arg == " --rope-cache" ) {
1110- params.rope_cache = true ;
1109+ if (arg == " -no- rcache" || arg == " --no -rope-cache" ) {
1110+ params.rope_cache = false ;
11111111 return true ;
11121112 }
11131113 if (arg == " -ser" || arg == " --smart-expert-reduction" ) {
@@ -1918,7 +1918,7 @@ void gpt_params_print_usage(int /*argc*/, char ** argv, const gpt_params & param
19181918 options.push_back ({ " *" , " -ger, --grouped-expert-routing" , " enable grouped expert routing (default: %s)" , params.grouped_expert_routing ? " enabled" : " disabled" });
19191919 options.push_back ({ " *" , " -no-fug, --no-fused-up-gate" , " disaable fused up-gate (default: %s)" , params.fused_up_gate ? " enabled" : " disabled" });
19201920 options.push_back ({ " *" , " -no-mmad, --no-fused-mul-multiadd" , " disaable fused mul-multi_add (default: %s)" , params.fused_mmad ? " enabled" : " disabled" });
1921- options.push_back ({ " *" , " -rcache, --rope-cache" , " enable RoPE cache (default: %s)" , params.rope_cache ? " enabled" : " disabled" });
1921+ options.push_back ({ " *" , " -no- rcache, --no- rope-cache" , " disaable RoPE cache (default: %s)" , params.rope_cache ? " enabled" : " disabled" });
19221922 options.push_back ({ " *" , " -ser, --smart-expert-reduction," ," experts reduction (default: %d,%g)" , params.min_experts , params.thresh_experts });
19231923 options.push_back ({ " *" , " -mqkv, --merge-qkv," , " merge Q,K,V (default: %d)" , params.merge_qkv });
19241924 options.push_back ({ " *" , " -p, --prompt PROMPT" , " prompt to start generation with\n "
0 commit comments