@@ -42,7 +42,7 @@ struct whisper_params {
42
42
bool print_energy = false ;
43
43
bool no_timestamps = true ;
44
44
bool use_gpu = true ;
45
- bool flash_attn = false ;
45
+ bool flash_attn = true ;
46
46
47
47
std::string language = " en" ;
48
48
std::string model = " models/ggml-base.en.bin" ;
@@ -66,28 +66,29 @@ static bool whisper_params_parse(int argc, char ** argv, whisper_params & params
66
66
whisper_print_usage (argc, argv, params);
67
67
exit (0 );
68
68
}
69
- else if (arg == " -t" || arg == " --threads" ) { params.n_threads = std::stoi (argv[++i]); }
70
- else if (arg == " -pms" || arg == " --prompt-ms" ) { params.prompt_ms = std::stoi (argv[++i]); }
71
- else if (arg == " -cms" || arg == " --command-ms" ) { params.command_ms = std::stoi (argv[++i]); }
72
- else if (arg == " -c" || arg == " --capture" ) { params.capture_id = std::stoi (argv[++i]); }
73
- else if (arg == " -mt" || arg == " --max-tokens" ) { params.max_tokens = std::stoi (argv[++i]); }
74
- else if (arg == " -ac" || arg == " --audio-ctx" ) { params.audio_ctx = std::stoi (argv[++i]); }
75
- else if (arg == " -vth" || arg == " --vad-thold" ) { params.vad_thold = std::stof (argv[++i]); }
76
- else if (arg == " -fth" || arg == " --freq-thold" ) { params.freq_thold = std::stof (argv[++i]); }
77
- else if (arg == " -tr" || arg == " --translate" ) { params.translate = true ; }
78
- else if (arg == " -ps" || arg == " --print-special" ) { params.print_special = true ; }
79
- else if (arg == " -pe" || arg == " --print-energy" ) { params.print_energy = true ; }
80
- else if (arg == " -ng" || arg == " --no-gpu" ) { params.use_gpu = false ; }
81
- else if (arg == " -fa" || arg == " --flash-attn" ) { params.flash_attn = true ; }
82
- else if (arg == " -l" || arg == " --language" ) { params.language = argv[++i]; }
83
- else if (arg == " -m" || arg == " --model" ) { params.model = argv[++i]; }
84
- else if (arg == " -f" || arg == " --file" ) { params.fname_out = argv[++i]; }
85
- else if (arg == " -cmd" || arg == " --commands" ) { params.commands = argv[++i]; }
86
- else if (arg == " -p" || arg == " --prompt" ) { params.prompt = argv[++i]; }
87
- else if (arg == " -ctx" || arg == " --context" ) { params.context = argv[++i]; }
88
- else if ( arg == " --grammar" ) { params.grammar = argv[++i]; }
89
- else if ( arg == " --grammar-penalty" ) { params.grammar_penalty = std::stof (argv[++i]); }
90
- else if ( arg == " --suppress-regex" ) { params.suppress_regex = argv[++i]; }
69
+ else if (arg == " -t" || arg == " --threads" ) { params.n_threads = std::stoi (argv[++i]); }
70
+ else if (arg == " -pms" || arg == " --prompt-ms" ) { params.prompt_ms = std::stoi (argv[++i]); }
71
+ else if (arg == " -cms" || arg == " --command-ms" ) { params.command_ms = std::stoi (argv[++i]); }
72
+ else if (arg == " -c" || arg == " --capture" ) { params.capture_id = std::stoi (argv[++i]); }
73
+ else if (arg == " -mt" || arg == " --max-tokens" ) { params.max_tokens = std::stoi (argv[++i]); }
74
+ else if (arg == " -ac" || arg == " --audio-ctx" ) { params.audio_ctx = std::stoi (argv[++i]); }
75
+ else if (arg == " -vth" || arg == " --vad-thold" ) { params.vad_thold = std::stof (argv[++i]); }
76
+ else if (arg == " -fth" || arg == " --freq-thold" ) { params.freq_thold = std::stof (argv[++i]); }
77
+ else if (arg == " -tr" || arg == " --translate" ) { params.translate = true ; }
78
+ else if (arg == " -ps" || arg == " --print-special" ) { params.print_special = true ; }
79
+ else if (arg == " -pe" || arg == " --print-energy" ) { params.print_energy = true ; }
80
+ else if (arg == " -ng" || arg == " --no-gpu" ) { params.use_gpu = false ; }
81
+ else if (arg == " -fa" || arg == " --flash-attn" ) { params.flash_attn = true ; }
82
+ else if (arg == " -nfa" || arg == " --no-flash-attn" ) { params.flash_attn = false ; }
83
+ else if (arg == " -l" || arg == " --language" ) { params.language = argv[++i]; }
84
+ else if (arg == " -m" || arg == " --model" ) { params.model = argv[++i]; }
85
+ else if (arg == " -f" || arg == " --file" ) { params.fname_out = argv[++i]; }
86
+ else if (arg == " -cmd" || arg == " --commands" ) { params.commands = argv[++i]; }
87
+ else if (arg == " -p" || arg == " --prompt" ) { params.prompt = argv[++i]; }
88
+ else if (arg == " -ctx" || arg == " --context" ) { params.context = argv[++i]; }
89
+ else if ( arg == " --grammar" ) { params.grammar = argv[++i]; }
90
+ else if ( arg == " --grammar-penalty" ) { params.grammar_penalty = std::stof (argv[++i]); }
91
+ else if ( arg == " --suppress-regex" ) { params.suppress_regex = argv[++i]; }
91
92
else {
92
93
fprintf (stderr, " error: unknown argument: %s\n " , arg.c_str ());
93
94
whisper_print_usage (argc, argv, params);
@@ -116,7 +117,8 @@ void whisper_print_usage(int /*argc*/, char ** argv, const whisper_params & para
116
117
fprintf (stderr, " -ps, --print-special [%-7s] print special tokens\n " , params.print_special ? " true" : " false" );
117
118
fprintf (stderr, " -pe, --print-energy [%-7s] print sound energy (for debugging)\n " , params.print_energy ? " true" : " false" );
118
119
fprintf (stderr, " -ng, --no-gpu [%-7s] disable GPU\n " , params.use_gpu ? " false" : " true" );
119
- fprintf (stderr, " -fa, --flash-attn [%-7s] flash attention\n " , params.flash_attn ? " true" : " false" );
120
+ fprintf (stderr, " -fa, --flash-attn [%-7s] enable flash attention\n " , params.flash_attn ? " true" : " false" );
121
+ fprintf (stderr, " -nfa, --no-flash-attn [%-7s] disable flash attention\n " , params.flash_attn ? " false" : " true" );
120
122
fprintf (stderr, " -l LANG, --language LANG [%-7s] spoken language\n " , params.language .c_str ());
121
123
fprintf (stderr, " -m FNAME, --model FNAME [%-7s] model path\n " , params.model .c_str ());
122
124
fprintf (stderr, " -f FNAME, --file FNAME [%-7s] text output file name\n " , params.fname_out .c_str ());
0 commit comments