[Update] 音声認識のtranscribe_audio_queue関数コール時にlanguageを設定するように変更
This commit is contained in:
6
VRCT.py
6
VRCT.py
@@ -467,12 +467,11 @@ class App(CTk):
|
||||
self.mic_transcriber = AudioTranscriber(
|
||||
speaker=False,
|
||||
source=self.mic_audio_recorder.source,
|
||||
language=transcription_lang[self.INPUT_MIC_VOICE_LANGUAGE],
|
||||
phrase_timeout=self.INPUT_MIC_PHRASE_TIMEOUT,
|
||||
max_phrases=self.INPUT_MIC_MAX_PHRASES,
|
||||
)
|
||||
def mic_transcript_to_chatbox():
|
||||
self.mic_transcriber.transcribe_audio_queue(self.mic_audio_queue)
|
||||
self.mic_transcriber.transcribe_audio_queue(self.mic_audio_queue, transcription_lang[self.INPUT_MIC_VOICE_LANGUAGE])
|
||||
message = self.mic_transcriber.get_transcript()
|
||||
if len(message) > 0:
|
||||
# word filter
|
||||
@@ -566,13 +565,12 @@ class App(CTk):
|
||||
self.spk_transcriber = AudioTranscriber(
|
||||
speaker=True,
|
||||
source=self.spk_audio_recorder.source,
|
||||
language=transcription_lang[self.INPUT_SPEAKER_VOICE_LANGUAGE],
|
||||
phrase_timeout=self.INPUT_SPEAKER_PHRASE_TIMEOUT,
|
||||
max_phrases=self.INPUT_SPEAKER_MAX_PHRASES,
|
||||
)
|
||||
|
||||
def spk_transcript_to_textbox():
|
||||
self.spk_transcriber.transcribe_audio_queue(self.spk_audio_queue)
|
||||
self.spk_transcriber.transcribe_audio_queue(self.spk_audio_queue, transcription_lang[self.INPUT_SPEAKER_VOICE_LANGUAGE])
|
||||
message = self.spk_transcriber.get_transcript()
|
||||
if len(message) > 0:
|
||||
# translate
|
||||
|
||||
@@ -9,9 +9,8 @@ PHRASE_TIMEOUT = 3
|
||||
MAX_PHRASES = 10
|
||||
|
||||
class AudioTranscriber:
|
||||
def __init__(self, speaker, source, language, phrase_timeout, max_phrases):
|
||||
def __init__(self, speaker, source, phrase_timeout, max_phrases):
|
||||
self.speaker = speaker
|
||||
self.language = language
|
||||
self.phrase_timeout = phrase_timeout
|
||||
self.max_phrases = max_phrases
|
||||
self.transcript_data = []
|
||||
@@ -27,7 +26,7 @@ class AudioTranscriber:
|
||||
"process_data_func": self.process_speaker_data if speaker else self.process_speaker_data
|
||||
}
|
||||
|
||||
def transcribe_audio_queue(self, audio_queue):
|
||||
def transcribe_audio_queue(self, audio_queue, language):
|
||||
# while True:
|
||||
audio, time_spoken = audio_queue.get()
|
||||
self.update_last_sample_and_phrase_status(audio, time_spoken)
|
||||
@@ -37,7 +36,7 @@ class AudioTranscriber:
|
||||
# fd, path = tempfile.mkstemp(suffix=".wav")
|
||||
# os.close(fd)
|
||||
audio_data = self.audio_sources["process_data_func"]()
|
||||
text = self.audio_recognizer.recognize_google(audio_data, language=self.language)
|
||||
text = self.audio_recognizer.recognize_google(audio_data, language=language)
|
||||
except Exception as e:
|
||||
pass
|
||||
finally:
|
||||
|
||||
Reference in New Issue
Block a user