From 115cf8fab99f377b9ac5f1ac5b26115ac0ea5508 Mon Sep 17 00:00:00 2001 From: misygauziya Date: Fri, 11 Aug 2023 01:53:11 +0900 Subject: [PATCH] =?UTF-8?q?[Update]=20=E9=9F=B3=E5=A3=B0=E8=AA=8D=E8=AD=98?= =?UTF-8?q?=E3=81=AEtranscribe=5Faudio=5Fqueue=E9=96=A2=E6=95=B0=E3=82=B3?= =?UTF-8?q?=E3=83=BC=E3=83=AB=E6=99=82=E3=81=ABlanguage=E3=82=92=E8=A8=AD?= =?UTF-8?q?=E5=AE=9A=E3=81=99=E3=82=8B=E3=82=88=E3=81=86=E3=81=AB=E5=A4=89?= =?UTF-8?q?=E6=9B=B4?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- VRCT.py | 6 ++---- audio_transcriber.py | 7 +++---- 2 files changed, 5 insertions(+), 8 deletions(-) diff --git a/VRCT.py b/VRCT.py index b3d3cd92..647d088c 100644 --- a/VRCT.py +++ b/VRCT.py @@ -467,12 +467,11 @@ class App(CTk): self.mic_transcriber = AudioTranscriber( speaker=False, source=self.mic_audio_recorder.source, - language=transcription_lang[self.INPUT_MIC_VOICE_LANGUAGE], phrase_timeout=self.INPUT_MIC_PHRASE_TIMEOUT, max_phrases=self.INPUT_MIC_MAX_PHRASES, ) def mic_transcript_to_chatbox(): - self.mic_transcriber.transcribe_audio_queue(self.mic_audio_queue) + self.mic_transcriber.transcribe_audio_queue(self.mic_audio_queue, transcription_lang[self.INPUT_MIC_VOICE_LANGUAGE]) message = self.mic_transcriber.get_transcript() if len(message) > 0: # word filter @@ -566,13 +565,12 @@ class App(CTk): self.spk_transcriber = AudioTranscriber( speaker=True, source=self.spk_audio_recorder.source, - language=transcription_lang[self.INPUT_SPEAKER_VOICE_LANGUAGE], phrase_timeout=self.INPUT_SPEAKER_PHRASE_TIMEOUT, max_phrases=self.INPUT_SPEAKER_MAX_PHRASES, ) def spk_transcript_to_textbox(): - self.spk_transcriber.transcribe_audio_queue(self.spk_audio_queue) + self.spk_transcriber.transcribe_audio_queue(self.spk_audio_queue, transcription_lang[self.INPUT_SPEAKER_VOICE_LANGUAGE]) message = self.spk_transcriber.get_transcript() if len(message) > 0: # translate diff --git a/audio_transcriber.py b/audio_transcriber.py index aadd6adf..94c858e7 100644 --- a/audio_transcriber.py +++ b/audio_transcriber.py @@ -9,9 +9,8 @@ PHRASE_TIMEOUT = 3 MAX_PHRASES = 10 class AudioTranscriber: - def __init__(self, speaker, source, language, phrase_timeout, max_phrases): + def __init__(self, speaker, source, phrase_timeout, max_phrases): self.speaker = speaker - self.language = language self.phrase_timeout = phrase_timeout self.max_phrases = max_phrases self.transcript_data = [] @@ -27,7 +26,7 @@ class AudioTranscriber: "process_data_func": self.process_speaker_data if speaker else self.process_speaker_data } - def transcribe_audio_queue(self, audio_queue): + def transcribe_audio_queue(self, audio_queue, language): # while True: audio, time_spoken = audio_queue.get() self.update_last_sample_and_phrase_status(audio, time_spoken) @@ -37,7 +36,7 @@ class AudioTranscriber: # fd, path = tempfile.mkstemp(suffix=".wav") # os.close(fd) audio_data = self.audio_sources["process_data_func"]() - text = self.audio_recognizer.recognize_google(audio_data, language=self.language) + text = self.audio_recognizer.recognize_google(audio_data, language=language) except Exception as e: pass finally: