

better documentation, help message and logging prints
@54634f008ee362a3986327738407297766d9ce96
--- README.md
+++ README.md
... | ... | @@ -183,7 +183,7 @@ |
183 | 183 |
|
184 | 184 |
### Server -- real-time from mic |
185 | 185 |
|
186 |
-`whisper_online_server.py` has the same model options as `whisper_online.py`, plus `--host` and `--port` of the TCP connection. See help message (`-h` option). |
|
186 |
+`whisper_online_server.py` has the same model options as `whisper_online.py`, plus `--host` and `--port` for the TCP connection and `--warmup-file`. See the help message (`-h` option). |
|
187 | 187 |
|
188 | 188 |
Client example: |
189 | 189 |
|
--- whisper_online.py
+++ whisper_online.py
... | ... | @@ -625,7 +625,7 @@ |
625 | 625 |
# load the audio into the LRU cache before we start the timer |
626 | 626 |
a = load_audio_chunk(audio_path,0,1) |
627 | 627 |
|
628 |
- # warm up the ASR, because the very first transcribe takes much more time than the other |
|
628 |
+ # warm up the ASR because the very first transcribe takes much more time than the others |
|
629 | 629 |
asr.transcribe(a) |
630 | 630 |
|
631 | 631 |
beg = args.start_at |
--- whisper_online_server.py
+++ whisper_online_server.py
... | ... | @@ -10,8 +10,8 @@ |
10 | 10 |
# server options |
11 | 11 |
parser.add_argument("--host", type=str, default='localhost') |
12 | 12 |
parser.add_argument("--port", type=int, default=43007) |
13 |
- |
|
14 |
-parser.add_argument("--warmup-file", type=str, dest="warmup_file") |
|
13 |
+parser.add_argument("--warmup-file", type=str, dest="warmup_file", |
|
14 |
+ help="The path to a speech audio wav file to warm up Whisper so that the very first chunk processing is fast. It can be e.g. https://github.com/ggerganov/whisper.cpp/raw/master/samples/jfk.wav .") |
|
15 | 15 |
|
16 | 16 |
|
17 | 17 |
# options from whisper_online |
... | ... | @@ -41,19 +41,18 @@ |
41 | 41 |
tokenizer = None |
42 | 42 |
online = OnlineASRProcessor(asr,tokenizer,buffer_trimming=(args.buffer_trimming, args.buffer_trimming_sec)) |
43 | 43 |
|
44 |
- |
|
45 |
- |
|
46 |
-if args.warmup_file and os.path.exists(args.warmup_file): |
|
47 |
- # load the audio into the LRU cache before we start the timer |
|
48 |
- a = load_audio_chunk(args.warmup_file,0,1) |
|
49 |
- |
|
50 |
- # TODO: it should be tested whether it's meaningful |
|
51 |
- # warm up the ASR, because the very first transcribe takes much more time than the other |
|
52 |
- asr.transcribe(a) |
|
44 |
+# warm up the ASR because the very first transcribe takes more time than the others. |
|
45 |
+# Test results in https://github.com/ufal/whisper_streaming/pull/81 |
|
46 |
+msg = "Whisper is not warmed up. The first chunk processing may take longer." |
|
47 |
+if args.warmup_file: |
|
48 |
+ if os.path.isfile(args.warmup_file): |
|
49 |
+ a = load_audio_chunk(args.warmup_file,0,1) |
|
50 |
+ asr.transcribe(a) |
|
51 |
+ print("INFO: Whisper is warmed up.",file=sys.stderr) |
|
52 |
+ else: |
|
53 |
+ print("WARNING: The warm up file is not available. "+msg,file=sys.stderr) |
|
53 | 54 |
else: |
54 |
- print("Whisper is not warmed up",file=sys.stderr) |
|
55 |
- |
|
56 |
- |
|
55 |
+ print("WARNING: " + msg, file=sys.stderr) |
|
57 | 56 |
|
58 | 57 |
|
59 | 58 |
######### Server objects |
Add a comment
Delete comment
Once you delete this comment, you won't be able to recover it. Are you sure you want to delete this comment?