@@ -71,6 +71,7 @@ struct whisper_params {
7171 bool log_score = false ;
7272 bool use_gpu = true ;
7373 bool flash_attn = false ;
74+ bool suppress_nst = false ;
7475
7576 std::string language = " en" ;
7677 std::string prompt;
@@ -170,6 +171,7 @@ static bool whisper_params_parse(int argc, char ** argv, whisper_params & params
170171 else if (arg == " -ls" || arg == " --log-score" ) { params.log_score = true ; }
171172 else if (arg == " -ng" || arg == " --no-gpu" ) { params.use_gpu = false ; }
172173 else if (arg == " -fa" || arg == " --flash-attn" ) { params.flash_attn = true ; }
174+ else if (arg == " -sns" || arg == " --suppress-nst" ) { params.suppress_nst = true ; }
173175 else if ( arg == " --suppress-regex" ) { params.suppress_regex = argv[++i]; }
174176 else if ( arg == " --grammar" ) { params.grammar = argv[++i]; }
175177 else if ( arg == " --grammar-rule" ) { params.grammar_rule = argv[++i]; }
@@ -237,6 +239,7 @@ static void whisper_print_usage(int /*argc*/, char ** argv, const whisper_params
237239 fprintf (stderr, " -ls, --log-score [%-7s] log best decoder scores of tokens\n " , params.log_score ?" true" :" false" );
238240 fprintf (stderr, " -ng, --no-gpu [%-7s] disable GPU\n " , params.use_gpu ? " false" : " true" );
239241 fprintf (stderr, " -fa, --flash-attn [%-7s] flash attention\n " , params.flash_attn ? " true" : " false" );
242+ fprintf (stderr, " -sns, --suppress-nst [%-7s] suppress non-speech tokens\n " , params.suppress_nst ? " true" : " false" );
240243 fprintf (stderr, " --suppress-regex REGEX [%-7s] regular expression matching tokens to suppress\n " , params.suppress_regex .c_str ());
241244 fprintf (stderr, " --grammar GRAMMAR [%-7s] GBNF grammar to guide decoding\n " , params.grammar .c_str ());
242245 fprintf (stderr, " --grammar-rule RULE [%-7s] top-level GBNF grammar rule name\n " , params.grammar_rule .c_str ());
@@ -1128,6 +1131,8 @@ int main(int argc, char ** argv) {
11281131
11291132 wparams.no_timestamps = params.no_timestamps ;
11301133
1134+ wparams.suppress_nst = params.suppress_nst ;
1135+
11311136 whisper_print_user_data user_data = { &params, &pcmf32s, 0 };
11321137
11331138 const auto & grammar_parsed = params.grammar_parsed ;
0 commit comments