@@ -42,7 +42,7 @@ struct whisper_params {
4242 bool print_energy = false ;
4343 bool no_timestamps = true ;
4444 bool use_gpu = true ;
45- bool flash_attn = false ;
45+ bool flash_attn = true ;
4646
4747 std::string language = " en" ;
4848 std::string model = " models/ggml-base.en.bin" ;
@@ -66,28 +66,29 @@ static bool whisper_params_parse(int argc, char ** argv, whisper_params & params
6666 whisper_print_usage (argc, argv, params);
6767 exit (0 );
6868 }
69- else if (arg == " -t" || arg == " --threads" ) { params.n_threads = std::stoi (argv[++i]); }
70- else if (arg == " -pms" || arg == " --prompt-ms" ) { params.prompt_ms = std::stoi (argv[++i]); }
71- else if (arg == " -cms" || arg == " --command-ms" ) { params.command_ms = std::stoi (argv[++i]); }
72- else if (arg == " -c" || arg == " --capture" ) { params.capture_id = std::stoi (argv[++i]); }
73- else if (arg == " -mt" || arg == " --max-tokens" ) { params.max_tokens = std::stoi (argv[++i]); }
74- else if (arg == " -ac" || arg == " --audio-ctx" ) { params.audio_ctx = std::stoi (argv[++i]); }
75- else if (arg == " -vth" || arg == " --vad-thold" ) { params.vad_thold = std::stof (argv[++i]); }
76- else if (arg == " -fth" || arg == " --freq-thold" ) { params.freq_thold = std::stof (argv[++i]); }
77- else if (arg == " -tr" || arg == " --translate" ) { params.translate = true ; }
78- else if (arg == " -ps" || arg == " --print-special" ) { params.print_special = true ; }
79- else if (arg == " -pe" || arg == " --print-energy" ) { params.print_energy = true ; }
80- else if (arg == " -ng" || arg == " --no-gpu" ) { params.use_gpu = false ; }
81- else if (arg == " -fa" || arg == " --flash-attn" ) { params.flash_attn = true ; }
82- else if (arg == " -l" || arg == " --language" ) { params.language = argv[++i]; }
83- else if (arg == " -m" || arg == " --model" ) { params.model = argv[++i]; }
84- else if (arg == " -f" || arg == " --file" ) { params.fname_out = argv[++i]; }
85- else if (arg == " -cmd" || arg == " --commands" ) { params.commands = argv[++i]; }
86- else if (arg == " -p" || arg == " --prompt" ) { params.prompt = argv[++i]; }
87- else if (arg == " -ctx" || arg == " --context" ) { params.context = argv[++i]; }
88- else if ( arg == " --grammar" ) { params.grammar = argv[++i]; }
89- else if ( arg == " --grammar-penalty" ) { params.grammar_penalty = std::stof (argv[++i]); }
90- else if ( arg == " --suppress-regex" ) { params.suppress_regex = argv[++i]; }
69+ else if (arg == " -t" || arg == " --threads" ) { params.n_threads = std::stoi (argv[++i]); }
70+ else if (arg == " -pms" || arg == " --prompt-ms" ) { params.prompt_ms = std::stoi (argv[++i]); }
71+ else if (arg == " -cms" || arg == " --command-ms" ) { params.command_ms = std::stoi (argv[++i]); }
72+ else if (arg == " -c" || arg == " --capture" ) { params.capture_id = std::stoi (argv[++i]); }
73+ else if (arg == " -mt" || arg == " --max-tokens" ) { params.max_tokens = std::stoi (argv[++i]); }
74+ else if (arg == " -ac" || arg == " --audio-ctx" ) { params.audio_ctx = std::stoi (argv[++i]); }
75+ else if (arg == " -vth" || arg == " --vad-thold" ) { params.vad_thold = std::stof (argv[++i]); }
76+ else if (arg == " -fth" || arg == " --freq-thold" ) { params.freq_thold = std::stof (argv[++i]); }
77+ else if (arg == " -tr" || arg == " --translate" ) { params.translate = true ; }
78+ else if (arg == " -ps" || arg == " --print-special" ) { params.print_special = true ; }
79+ else if (arg == " -pe" || arg == " --print-energy" ) { params.print_energy = true ; }
80+ else if (arg == " -ng" || arg == " --no-gpu" ) { params.use_gpu = false ; }
81+ else if (arg == " -fa" || arg == " --flash-attn" ) { params.flash_attn = true ; }
82+ else if (arg == " -nfa" || arg == " --no-flash-attn" ) { params.flash_attn = false ; }
83+ else if (arg == " -l" || arg == " --language" ) { params.language = argv[++i]; }
84+ else if (arg == " -m" || arg == " --model" ) { params.model = argv[++i]; }
85+ else if (arg == " -f" || arg == " --file" ) { params.fname_out = argv[++i]; }
86+ else if (arg == " -cmd" || arg == " --commands" ) { params.commands = argv[++i]; }
87+ else if (arg == " -p" || arg == " --prompt" ) { params.prompt = argv[++i]; }
88+ else if (arg == " -ctx" || arg == " --context" ) { params.context = argv[++i]; }
89+ else if ( arg == " --grammar" ) { params.grammar = argv[++i]; }
90+ else if ( arg == " --grammar-penalty" ) { params.grammar_penalty = std::stof (argv[++i]); }
91+ else if ( arg == " --suppress-regex" ) { params.suppress_regex = argv[++i]; }
9192 else {
9293 fprintf (stderr, " error: unknown argument: %s\n " , arg.c_str ());
9394 whisper_print_usage (argc, argv, params);
@@ -116,7 +117,8 @@ void whisper_print_usage(int /*argc*/, char ** argv, const whisper_params & para
116117 fprintf (stderr, " -ps, --print-special [%-7s] print special tokens\n " , params.print_special ? " true" : " false" );
117118 fprintf (stderr, " -pe, --print-energy [%-7s] print sound energy (for debugging)\n " , params.print_energy ? " true" : " false" );
118119 fprintf (stderr, " -ng, --no-gpu [%-7s] disable GPU\n " , params.use_gpu ? " false" : " true" );
119- fprintf (stderr, " -fa, --flash-attn [%-7s] flash attention\n " , params.flash_attn ? " true" : " false" );
120+ fprintf (stderr, " -fa, --flash-attn [%-7s] enable flash attention\n " , params.flash_attn ? " true" : " false" );
121+ fprintf (stderr, " -nfa, --no-flash-attn [%-7s] disable flash attention\n " , params.flash_attn ? " false" : " true" );
120122 fprintf (stderr, " -l LANG, --language LANG [%-7s] spoken language\n " , params.language .c_str ());
121123 fprintf (stderr, " -m FNAME, --model FNAME [%-7s] model path\n " , params.model .c_str ());
122124 fprintf (stderr, " -f FNAME, --file FNAME [%-7s] text output file name\n " , params.fname_out .c_str ());
0 commit comments