Spaces:

langtech-innovation
/

WhisperLiveKitDiarization

Paused

App Files Files Community

qfuxa commited on May 28

Commit

3ccfa18

1 Parent(s): f86e733

correct error when using VAC

Browse files

Files changed (1) hide show

whisperlivekit/whisper_streaming_custom/online_asr.py +10 -9

whisperlivekit/whisper_streaming_custom/online_asr.py CHANGED Viewed

@@ -343,15 +343,15 @@ class OnlineASRProcessor:
                 )
                 sentences.append(sentence)
         return sentences
-    def finish(self) -> Transcript:
         """
         Flush the remaining transcript when processing ends.
         """
         remaining_tokens = self.transcript_buffer.buffer
-        final_transcript = self.concatenate_tokens(remaining_tokens)
-        logger.debug(f"Final non-committed transcript: {final_transcript}")
         self.buffer_time_offset += len(self.audio_buffer) / self.SAMPLING_RATE
-        return final_transcript
     def concatenate_tokens(
         self,
@@ -384,7 +384,8 @@ class VACOnlineASRProcessor:
     def __init__(self, online_chunk_size: float, *args, **kwargs):
         self.online_chunk_size = online_chunk_size
         self.online = OnlineASRProcessor(*args, **kwargs)
         # Load a VAD model (e.g. Silero VAD)
         import torch
         model, _ = torch.hub.load(repo_or_dir="snakers4/silero-vad", model="silero_vad")
@@ -455,7 +456,7 @@ class VACOnlineASRProcessor:
                 self.buffer_offset += max(0, len(self.audio_buffer) - self.SAMPLING_RATE)
                 self.audio_buffer = self.audio_buffer[-self.SAMPLING_RATE:]
-    def process_iter(self) -> Transcript:
         """
         Depending on the VAD status and the amount of accumulated audio,
         process the current audio chunk.
@@ -467,9 +468,9 @@ class VACOnlineASRProcessor:
             return self.online.process_iter()
         else:
             logger.debug("No online update, only VAD")
-            return Transcript(None, None, "")
-    def finish(self) -> Transcript:
         """Finish processing by flushing any remaining text."""
         result = self.online.finish()
         self.current_online_chunk_buffer_size = 0
@@ -480,4 +481,4 @@ class VACOnlineASRProcessor:
         """
         Get the unvalidated buffer in string format.
         """
-        return self.online.concatenate_tokens(self.online.transcript_buffer.buffer).text

                 )
                 sentences.append(sentence)
         return sentences
+    def finish(self) -> List[ASRToken]:
         """
         Flush the remaining transcript when processing ends.
         """
         remaining_tokens = self.transcript_buffer.buffer
+        logger.debug(f"Final non-committed tokens: {remaining_tokens}")
         self.buffer_time_offset += len(self.audio_buffer) / self.SAMPLING_RATE
+        return remaining_tokens
     def concatenate_tokens(
         self,
     def __init__(self, online_chunk_size: float, *args, **kwargs):
         self.online_chunk_size = online_chunk_size
         self.online = OnlineASRProcessor(*args, **kwargs)
+        self.asr = self.online.asr
         # Load a VAD model (e.g. Silero VAD)
         import torch
         model, _ = torch.hub.load(repo_or_dir="snakers4/silero-vad", model="silero_vad")
                 self.buffer_offset += max(0, len(self.audio_buffer) - self.SAMPLING_RATE)
                 self.audio_buffer = self.audio_buffer[-self.SAMPLING_RATE:]
+    def process_iter(self) -> List[ASRToken]:
         """
         Depending on the VAD status and the amount of accumulated audio,
         process the current audio chunk.
             return self.online.process_iter()
         else:
             logger.debug("No online update, only VAD")
+            return []
+    def finish(self) -> List[ASRToken]:
         """Finish processing by flushing any remaining text."""
         result = self.online.finish()
         self.current_online_chunk_buffer_size = 0
         """
         Get the unvalidated buffer in string format.
         """
+        return self.online.concatenate_tokens(self.online.transcript_buffer.buffer)