Dominik Macháček 2024-11-15
Merge branch 'main' of github.com:promet99/whisper_streaming into promet99-main
@c42dc8bafff91a9a4d7e2a78280f981d2f340caf
whisper_online.py
--- whisper_online.py
+++ whisper_online.py
@@ -192,17 +192,17 @@
 
         o = []
         for word in segments.words:
-            start = word.get("start")
-            end = word.get("end")
+            start = word.start
+            end = word.end
             if any(s[0] <= start <= s[1] for s in no_speech_segments):
                 # print("Skipping word", word.get("word"), "because it's in a no-speech segment")
                 continue
-            o.append((start, end, word.get("word")))
+            o.append((start, end, word.word))
         return o
 
 
     def segments_end_ts(self, res):
-        return [s["end"] for s in res.words]
+        return [s.end for s in res.words]
 
     def transcribe(self, audio_data, prompt=None, *args, **kwargs):
         # Write the audio data to a buffer
Add a comment
List