47 lines
2.0 KiB
Python
47 lines
2.0 KiB
Python
import custom_speech_recognition as sr
|
|
import pyaudiowpatch as pyaudio
|
|
from datetime import datetime
|
|
|
|
class BaseRecorder:
|
|
def __init__(self, source, energy_threshold, dynamic_energy_threshold, record_timeout):
|
|
self.recorder = sr.Recognizer()
|
|
self.recorder.energy_threshold = energy_threshold
|
|
self.recorder.dynamic_energy_threshold = dynamic_energy_threshold
|
|
self.record_timeout = record_timeout
|
|
self.stop = None
|
|
|
|
if source is None:
|
|
raise ValueError("audio source can't be None")
|
|
|
|
self.source = source
|
|
|
|
def adjust_for_noise(self):
|
|
with self.source:
|
|
self.recorder.adjust_for_ambient_noise(self.source)
|
|
|
|
def record_into_queue(self, audio_queue):
|
|
def record_callback(_, audio:sr.AudioData) -> None:
|
|
audio_queue.put((audio.get_raw_data(), datetime.now()))
|
|
|
|
self.stop = self.recorder.listen_in_background(self.source, record_callback, phrase_time_limit=self.record_timeout)
|
|
|
|
class SelectedMicRecorder(BaseRecorder):
|
|
def __init__(self, device, energy_threshold, dynamic_energy_threshold, record_timeout):
|
|
source=sr.Microphone(
|
|
device_index=device['index'],
|
|
sample_rate=int(device["defaultSampleRate"]),
|
|
)
|
|
super().__init__(source=source, energy_threshold=energy_threshold, dynamic_energy_threshold=dynamic_energy_threshold, record_timeout=record_timeout)
|
|
self.adjust_for_noise()
|
|
|
|
class SelectedSpeakerRecorder(BaseRecorder):
|
|
def __init__(self, device, energy_threshold, dynamic_energy_threshold, record_timeout):
|
|
|
|
source = sr.Microphone(speaker=True,
|
|
device_index= device["index"],
|
|
sample_rate=int(device["defaultSampleRate"]),
|
|
chunk_size=pyaudio.get_sample_size(pyaudio.paInt16),
|
|
channels=device["maxInputChannels"]
|
|
)
|
|
super().__init__(source=source, energy_threshold=energy_threshold, dynamic_energy_threshold=dynamic_energy_threshold, record_timeout=record_timeout)
|
|
self.adjust_for_noise() |