add SelectedMicEnergyRecorder, SelectedSpeakeEnergyRecorder

This commit is contained in:
misygauziya
2023-07-11 00:40:39 +09:00
parent 41df105bab
commit 14d3a4a33e
2 changed files with 108 additions and 48 deletions

View File

@@ -21,7 +21,7 @@ class BaseRecorder:
def record_into_queue(self, audio_queue): def record_into_queue(self, audio_queue):
def record_callback(_, audio): def record_callback(_, audio):
audio_queue.put((audio.get_raw_data(), datetime.now())) audio_queue.put((audio[0].get_raw_data(), audio[1], datetime.now()))
self.stop = self.recorder.listen_in_background(self.source, record_callback, phrase_time_limit=self.record_timeout) self.stop = self.recorder.listen_in_background(self.source, record_callback, phrase_time_limit=self.record_timeout)
@@ -44,4 +44,48 @@ class SelectedSpeakerRecorder(BaseRecorder):
channels=device["maxInputChannels"] channels=device["maxInputChannels"]
) )
super().__init__(source=source, energy_threshold=energy_threshold, dynamic_energy_threshold=dynamic_energy_threshold, record_timeout=record_timeout) super().__init__(source=source, energy_threshold=energy_threshold, dynamic_energy_threshold=dynamic_energy_threshold, record_timeout=record_timeout)
self.adjust_for_noise()
class BaseEnergyRecorder:
def __init__(self, source):
self.recorder = Recognizer()
self.recorder.energy_threshold = 0
self.recorder.dynamic_energy_threshold = False
self.record_timeout = 0
self.stop = None
if source is None:
raise ValueError("audio source can't be None")
self.source = source
def adjust_for_noise(self):
with self.source:
self.recorder.adjust_for_ambient_noise(self.source)
def record_into_queue(self, energy_queue):
def record_callback(_, energy):
energy_queue.put(energy)
self.stop = self.recorder.listen_energy_in_background(self.source, record_callback)
class SelectedMicEnergyRecorder(BaseEnergyRecorder):
def __init__(self, device):
source=Microphone(
device_index=device['index'],
sample_rate=int(device["defaultSampleRate"]),
)
super().__init__(source=source)
self.adjust_for_noise()
class SelectedSpeakeEnergyRecorder(BaseEnergyRecorder):
def __init__(self, device):
source = Microphone(speaker=True,
device_index= device["index"],
sample_rate=int(device["defaultSampleRate"]),
chunk_size=get_sample_size(paInt16),
channels=device["maxInputChannels"]
)
super().__init__(source=source)
self.adjust_for_noise() self.adjust_for_noise()

View File

@@ -1,4 +1,5 @@
from time import sleep from time import sleep
from queue import Queue
from os import path as os_path from os import path as os_path
from tkinter import DoubleVar, IntVar from tkinter import DoubleVar, IntVar
from tkinter import font as tk_font from tkinter import font as tk_font
@@ -8,12 +9,11 @@ from flashtext import KeywordProcessor
from utils import save_json, print_textbox, thread_fnc from utils import save_json, print_textbox, thread_fnc
from audio_utils import get_input_device_list, get_output_device_list from audio_utils import get_input_device_list, get_output_device_list
from audio_recorder import SelectedMicRecorder, SelectedSpeakerRecorder from audio_recorder import SelectedMicEnergyRecorder, SelectedSpeakeEnergyRecorder
from languages import translation_lang, transcription_lang from languages import translation_lang, transcription_lang
class ToplevelWindowConfig(CTkToplevel): class ToplevelWindowConfig(CTkToplevel):
def __init__(self, parent, *args, **kwargs): def __init__(self, parent, *args, **kwargs):
super().__init__(parent, *args, **kwargs) super().__init__(parent, *args, **kwargs)
self.parent = parent self.parent = parent
@@ -27,7 +27,7 @@ class ToplevelWindowConfig(CTkToplevel):
# init parameter # init parameter
self.MAX_MIC_ENERGY_THRESHOLD = 2000 self.MAX_MIC_ENERGY_THRESHOLD = 2000
self.MAX_SPEAKER_ENERGY_THRESHOLD = 4000 self.MAX_SPEAKER_ENERGY_THRESHOLD = 2000
self.last_mic_device_name = None self.last_mic_device_name = None
self.last_speaker_device_name = None self.last_speaker_device_name = None
@@ -283,11 +283,21 @@ class ToplevelWindowConfig(CTkToplevel):
corner_radius=0 corner_radius=0
) )
self.progressBar_input_mic_energy_threshold.grid(row=row, column=1, columnspan=1, padx=5, pady=(5,0), sticky="nsew") self.progressBar_input_mic_energy_threshold.grid(row=row, column=1, columnspan=1, padx=5, pady=(5,0), sticky="nsew")
self.th_progressBar_input_mic_energy_threshold_recorder = thread_fnc(fnc=self.progressBar_input_mic_energy_threshold_recorder)
self.th_progressBar_input_mic_energy_threshold_recorder.daemon = True self.mic_energy_queue = Queue()
self.th_progressBar_input_mic_energy_threshold_recorder.start() mic_device = [device for device in get_input_device_list() if device["name"] == self.parent.CHOICE_MIC_DEVICE][0]
try:
self.mic_energy_recorder = SelectedMicEnergyRecorder(mic_device)
self.mic_energy_recorder.record_into_queue(self.mic_energy_queue)
except Exception as e:
print(e)
sleep(2) sleep(2)
self.mic_energy_plot_progressbar = thread_fnc(self.progressBar_input_mic_energy_plot)
self.mic_energy_plot_progressbar.daemon = True
self.mic_energy_plot_progressbar.start()
row +=1 row +=1
self.slider_input_mic_energy_threshold = customtkinter.CTkSlider( self.slider_input_mic_energy_threshold = customtkinter.CTkSlider(
self.tabview_config.tab("Transcription"), self.tabview_config.tab("Transcription"),
@@ -446,9 +456,19 @@ class ToplevelWindowConfig(CTkToplevel):
corner_radius=0 corner_radius=0
) )
self.progressBar_input_speaker_energy_threshold.grid(row=row, column=1, columnspan=1, padx=5, pady=(5,0), sticky="nsew") self.progressBar_input_speaker_energy_threshold.grid(row=row, column=1, columnspan=1, padx=5, pady=(5,0), sticky="nsew")
self.th_progressBar_input_speaker_energy_threshold_recorder = thread_fnc(fnc=self.progressBar_input_speaker_energy_threshold_recorder)
self.th_progressBar_input_speaker_energy_threshold_recorder.daemon=True self.speaker_energy_queue = Queue()
self.th_progressBar_input_speaker_energy_threshold_recorder.start() speaker_device = [device for device in get_output_device_list() if device["name"] == self.parent.CHOICE_SPEAKER_DEVICE][0]
try:
self.speaker_energy_recorder = SelectedSpeakeEnergyRecorder(speaker_device)
self.speaker_energy_recorder.record_into_queue(self.speaker_energy_queue)
except Exception as e:
print(e)
sleep(2)
self.speaker_energy_plot_progressbar = thread_fnc(self.progressBar_input_speaker_energy_plot)
self.speaker_energy_plot_progressbar.daemon = True
self.speaker_energy_plot_progressbar.start()
row +=1 row +=1
self.slider_input_speaker_energy_threshold = customtkinter.CTkSlider( self.slider_input_speaker_energy_threshold = customtkinter.CTkSlider(
@@ -772,25 +792,25 @@ class ToplevelWindowConfig(CTkToplevel):
self.parent.CHOICE_MIC_DEVICE = choice self.parent.CHOICE_MIC_DEVICE = choice
save_json(self.parent.PATH_CONFIG, "CHOICE_MIC_DEVICE", self.parent.CHOICE_MIC_DEVICE) save_json(self.parent.PATH_CONFIG, "CHOICE_MIC_DEVICE", self.parent.CHOICE_MIC_DEVICE)
self.mic_energy_recorder.stop()
self.mic_energy_recorder.stop = None
sleep(2)
try:
mic_device = [device for device in get_input_device_list() if device["name"] == self.parent.CHOICE_MIC_DEVICE][0]
self.mic_energy_recorder = SelectedMicEnergyRecorder(mic_device)
self.mic_energy_recorder.record_into_queue(self.mic_energy_queue)
except Exception as e:
print(e)
def optionmenu_input_mic_voice_language_callback(self, choice): def optionmenu_input_mic_voice_language_callback(self, choice):
self.parent.INPUT_MIC_VOICE_LANGUAGE = choice self.parent.INPUT_MIC_VOICE_LANGUAGE = choice
save_json(self.parent.PATH_CONFIG, "INPUT_MIC_VOICE_LANGUAGE", self.parent.INPUT_MIC_VOICE_LANGUAGE) save_json(self.parent.PATH_CONFIG, "INPUT_MIC_VOICE_LANGUAGE", self.parent.INPUT_MIC_VOICE_LANGUAGE)
def progressBar_input_mic_energy_threshold_recorder(self): def progressBar_input_mic_energy_plot(self):
self.last_mic_device_name = self.parent.CHOICE_MIC_DEVICE if self.mic_energy_queue.empty() is False:
mic_device = [device for device in get_input_device_list() if device["name"] == self.last_mic_device_name][0] energy = self.mic_energy_queue.get()
re = SelectedMicRecorder(mic_device, energy_threshold=0, dynamic_energy_threshold=False, record_timeout=0) self.progressBar_input_mic_energy_threshold.set(energy/self.MAX_MIC_ENERGY_THRESHOLD)
try: sleep(0.01)
while True:
if self.last_mic_device_name != self.parent.CHOICE_MIC_DEVICE:
break
with re.source as source:
energy = re.recorder.listen_energy(source)
self.progressBar_input_mic_energy_threshold.set(energy/self.MAX_MIC_ENERGY_THRESHOLD)
sleep(0.05)
except:
pass
sleep(5)
def slider_input_mic_energy_threshold_callback(self, value): def slider_input_mic_energy_threshold_callback(self, value):
self.parent.INPUT_MIC_ENERGY_THRESHOLD = int(value) self.parent.INPUT_MIC_ENERGY_THRESHOLD = int(value)
@@ -824,25 +844,25 @@ class ToplevelWindowConfig(CTkToplevel):
self.parent.CHOICE_SPEAKER_DEVICE = choice self.parent.CHOICE_SPEAKER_DEVICE = choice
save_json(self.parent.PATH_CONFIG, "CHOICE_SPEAKER_DEVICE", self.parent.CHOICE_SPEAKER_DEVICE) save_json(self.parent.PATH_CONFIG, "CHOICE_SPEAKER_DEVICE", self.parent.CHOICE_SPEAKER_DEVICE)
self.speaker_energy_recorder.stop()
self.speaker_energy_recorder.stop = None
sleep(2)
try:
speaker_device = [device for device in get_output_device_list() if device["name"] == self.parent.CHOICE_SPEAKER_DEVICE][0]
self.speaker_energy_recorder = SelectedSpeakeEnergyRecorder(speaker_device)
self.speaker_energy_recorder.record_into_queue(self.speaker_energy_queue)
except Exception as e:
print(e)
def optionmenu_input_speaker_voice_language_callback(self, choice): def optionmenu_input_speaker_voice_language_callback(self, choice):
self.parent.INPUT_SPEAKER_VOICE_LANGUAGE = choice self.parent.INPUT_SPEAKER_VOICE_LANGUAGE = choice
save_json(self.parent.PATH_CONFIG, "INPUT_SPEAKER_VOICE_LANGUAGE", self.parent.INPUT_SPEAKER_VOICE_LANGUAGE) save_json(self.parent.PATH_CONFIG, "INPUT_SPEAKER_VOICE_LANGUAGE", self.parent.INPUT_SPEAKER_VOICE_LANGUAGE)
def progressBar_input_speaker_energy_threshold_recorder(self): def progressBar_input_speaker_energy_plot(self):
self.last_speaker_device_name = self.parent.CHOICE_SPEAKER_DEVICE if self.speaker_energy_queue.empty() is False:
speaker_device = [device for device in get_output_device_list() if device["name"] == self.last_speaker_device_name][0] energy = self.speaker_energy_queue.get()
re = SelectedSpeakerRecorder(speaker_device, energy_threshold=0, dynamic_energy_threshold=False, record_timeout=0) self.progressBar_input_speaker_energy_threshold.set(energy/self.MAX_SPEAKER_ENERGY_THRESHOLD)
try: sleep(0.01)
while True:
if self.last_speaker_device_name != self.parent.CHOICE_SPEAKER_DEVICE:
break
with re.source as source:
energy = re.recorder.listen_energy(source)
self.progressBar_input_speaker_energy_threshold.set(energy/self.MAX_SPEAKER_ENERGY_THRESHOLD)
sleep(0.05)
except:
pass
sleep(5)
def slider_input_speaker_energy_threshold_callback(self, value): def slider_input_speaker_energy_threshold_callback(self, value):
self.parent.INPUT_SPEAKER_ENERGY_THRESHOLD = int(value) self.parent.INPUT_SPEAKER_ENERGY_THRESHOLD = int(value)
@@ -885,15 +905,11 @@ class ToplevelWindowConfig(CTkToplevel):
pass pass
def delete_window(self): def delete_window(self):
self.mic_energy_recorder.stop()
if isinstance(self.th_progressBar_input_mic_energy_threshold_recorder, thread_fnc): self.mic_energy_plot_progressbar.stop()
self.th_progressBar_input_mic_energy_threshold_recorder.stop() self.speaker_energy_recorder.stop()
self.last_mic_device_name = None self.speaker_energy_plot_progressbar.stop()
if isinstance(self.th_progressBar_input_speaker_energy_threshold_recorder, thread_fnc):
self.th_progressBar_input_speaker_energy_threshold_recorder.stop()
self.last_speaker_device_name = None
self.parent.checkbox_translation.configure(state="normal") self.parent.checkbox_translation.configure(state="normal")
self.parent.checkbox_transcription_send.configure(state="normal") self.parent.checkbox_transcription_send.configure(state="normal")
self.parent.checkbox_transcription_receive.configure(state="normal") self.parent.checkbox_transcription_receive.configure(state="normal")