From d38b8027063851287a8ca7e59f82de43c26b265e Mon Sep 17 00:00:00 2001
From: Gregory Ecock
Date: Thu, 20 Jun 2024 10:53:20 -0400
Subject: [PATCH] concat all interim results

Signed-off-by: Gregory Ecock
---
Note: hunk re-flowed by hand (debug comments dropped, bare except
narrowed); the blob/commit hashes below still name the original revision.

 transcribe.py | 19 ++++++++++++++++---
 1 file changed, 16 insertions(+), 3 deletions(-)

diff --git a/transcribe.py b/transcribe.py
index 7134704..dfd546c 100644
--- a/transcribe.py
+++ b/transcribe.py
@@ -48,12 +48,25 @@ def __init__(self, audio_file_name:str, transcriptions:Transcriptions):
 
     def on_data(self, data):
+        """Append the transcript text found in ``data`` to this file's entry.
+
+        Concatenates the first alternative of every item in
+        ``data['results']`` and stores it under ``self.audio_file_name``,
+        separated by a single space from any text already stored for that
+        file.  Any failure is logged and swallowed.
+        """
         #print(json.dumps(data, indent=2))
         try:
             transcription = ""
             for result in data['results']:
                 transcription += result["alternatives"][0]["transcript"]
-            #print(transcription)
-            self.transcriptions.add(self.audio_file_name, transcription)
-        except:
+            # Look the stored data up once and prefix whatever is already
+            # there, so each call extends the entry for this file.
+            # NOTE(review): every call is appended as-is; if the service also
+            # delivers non-final hypotheses they will be repeated - confirm.
+            stored = self.transcriptions.getData()
+            if self.audio_file_name in stored:
+                transcription = stored[self.audio_file_name] + " " + transcription
+            self.transcriptions.add(self.audio_file_name, transcription)
+        except Exception:
             logging.exception(f"{self.audio_file_name} - No transcription found")
 