@@ -411,7 +411,7 @@ function Run-BenchMode {
411411 Write-Host " >>> BENCH ($Mode ) ..."
412412
413413 # Arguments only (exe is passed separately)
414- $benchArgs = @ (' -m' , $MODEL , ' -p' , $P_LEN , ' -n' , $N_TOK , ' -b' , $BATCH , ' -t' , $THREADS , ' -ngl' , $NGL )
414+ $benchArgs = @ (' -m' , $MODEL , ' -p' , $P_LEN , ' -n' , $N_TOK , ' -b' , $BATCH , ' -t' , $THREADS , ' -ngl' , $NGL , ' --flash-attn ' , 1 )
415415 if ($benchHasCtx ) { $benchArgs += @ (' -c' , $CTX ) }
416416 if ($UBATCH -and $benchHasUb ) { $benchArgs += @ (' -ub' , $UBATCH ) }
417417 if ($CTK -and $benchHasCTK ) { $benchArgs += @ (' -ctk' , $CTK ) }
@@ -439,7 +439,7 @@ function Run-PplMode {
439439 if ($Mode -eq ' on' ) { $env: LLAMA_XQ_NOBASE = ' 1' } else { Remove-Item Env:LLAMA_XQ_NOBASE - ErrorAction SilentlyContinue }
440440 Write-Host " >>> PPL ($Mode ) ..."
441441
442- $pplArgs = @ (' -m' , $MODEL , ' -f' , $PPL_FILE )
442+ $pplArgs = @ (' -m' , $MODEL , ' -f' , $PPL_FILE , ' --flash-attn ' , 1 )
443443 if ($pplHasCTK -and $CTK ) { $pplArgs += @ (' -ctk' , $CTK ) }
444444 if ($pplHasCTV -and $CTV ) { $pplArgs += @ (' -ctv' , $CTV ) }
445445 if ($pplHasCtx ) { $pplArgs += @ (' -c' , $CTX ) }
0 commit comments