@@ -98,26 +98,27 @@ c++ -I. -I./examples -O3 -std=c++11 -pthread examples/main/main.cpp whisper.o gg
98
98
usage: ./main [options] file0.wav file1.wav ...
99
99
100
100
options:
101
- -h, --help show this help message and exit
102
- -t N, --threads N number of threads to use during computation (default: 4)
103
- -p N, --processors N number of processors to use during computation (default: 1)
104
- -ot N, --offset-t N time offset in milliseconds (default: 0)
105
- -on N, --offset-n N segment index offset (default: 0)
106
- -mc N, --max-context N maximum number of text context tokens to store (default: max)
107
- -ml N, --max-len N maximum segment length in characters (default: 0)
108
- -wt N, --word-thold N word timestamp probability threshold (default: 0.010000)
109
- -v, --verbose verbose output
110
- --translate translate from source language to english
111
- -otxt, --output-txt output result in a text file
112
- -ovtt, --output-vtt output result in a vtt file
113
- -osrt, --output-srt output result in a srt file
114
- -owts, --output-words output script for generating karaoke video
115
- -ps, --print_special print special tokens
116
- -pc, --print_colors print colors
117
- -nt, --no_timestamps do not print timestamps
118
- -l LANG, --language LANG spoken language (default: en)
119
- -m FNAME, --model FNAME model path (default: models/ggml-base.en.bin)
120
- -f FNAME, --file FNAME input WAV file path
101
+ -h, --help [default] show this help message and exit
102
+ -t N, --threads N [4] number of threads to use during computation
103
+ -p N, --processors N [1] number of processors to use during computation
104
+ -ot N, --offset-t N [0] time offset in milliseconds
105
+ -on N, --offset-n N [0] segment index offset
106
+ -d N, --duration N [0] duration of audio to process in milliseconds
107
+ -mc N, --max-context N [-1] maximum number of text context tokens to store
108
+ -ml N, --max-len N [0] maximum segment length in characters
109
+ -wt N, --word-thold N [0.01] word timestamp probability threshold
110
+ -su, --speed-up [false] speed up audio by x2 (reduced accuracy)
111
+ -tr, --translate [false] translate from source language to english
112
+ -otxt, --output-txt [false] output result in a text file
113
+ -ovtt, --output-vtt [false] output result in a vtt file
114
+ -osrt, --output-srt [false] output result in a srt file
115
+ -owts, --output-words [false] output script for generating karaoke video
116
+ -ps, --print-special [false] print special tokens
117
+ -pc, --print-colors [false] print colors
118
+ -nt, --no-timestamps [true] do not print timestamps
119
+ -l LANG, --language LANG [en] spoken language
120
+ -m FNAME, --model FNAME [models/ggml-base.en.bin] model path
121
+ -f FNAME, --file FNAME [] input WAV file path
121
122
122
123
bash ./models/download-ggml-model.sh base.en
123
124
Downloading ggml model base.en ...
@@ -149,13 +150,13 @@ whisper_model_load: n_text_layer = 6
149
150
whisper_model_load: n_mels = 80
150
151
whisper_model_load: f16 = 1
151
152
whisper_model_load: type = 2
152
- whisper_model_load: mem_required = 670.00 MB
153
153
whisper_model_load: adding 1607 extra tokens
154
- whisper_model_load: ggml ctx size = 140.60 MB
155
- whisper_model_load: memory size = 22.83 MB
156
- whisper_model_load: model size = 140.54 MB
154
+ whisper_model_load: mem_required = 506.00 MB
155
+ whisper_model_load: ggml ctx size = 140.60 MB
156
+ whisper_model_load: memory size = 22.83 MB
157
+ whisper_model_load: model size = 140.54 MB
157
158
158
- system_info: n_threads = 4 / 10 | AVX2 = 0 | AVX512 = 0 | NEON = 1 | FP16_VA = 1 | WASM_SIMD = 0 | BLAS = 1 |
159
+ system_info: n_threads = 4 / 10 | AVX = 0 | AVX2 = 0 | AVX512 = 0 | NEON = 1 | FP16_VA = 1 | WASM_SIMD = 0 | BLAS = 1 |
159
160
160
161
main: processing 'samples/jfk.wav' (176000 samples, 11.0 sec), 4 threads, 1 processors, lang = en, task = transcribe, timestamps = 1 ...
161
162
0 commit comments