import os import json import threading import customtkinter from PIL import Image import utils import translation import transcription import osc_tools import window_config import window_information class App(customtkinter.CTk): def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) # init config self.PATH_CONFIG = "./config.json" ## main window self.ENABLE_TRANSLATION = False self.ENABLE_TRANSCRIPTION = False self.ENABLE_FOREGROUND = False ## UI self.TRANSPARENCY = 100 self.APPEARANCE_THEME = "System" self.UI_SCALING = "100%" self.FONT_FAMILY = "Yu Gothic UI" ## Translation self.CHOICE_TRANSLATOR = "DeepL(web)" self.INPUT_SOURCE_LANG = "JA" self.INPUT_TARGET_LANG = "EN" self.OUTPUT_SOURCE_LANG = "JA" self.OUTPUT_TARGET_LANG = "EN" ## Transcription self.CHOICE_MIC_DEVICE = None self.INPUT_MIC_VOICE_LANGUAGE = "ja-JP" self.ENABLE_MIC_IS_DYNAMIC = False self.MIC_THRESHOLD = 300 self.CHOICE_SPEAKER_DEVICE = None self.INPUT_SPEAKER_VOICE_LANGUAGE = "ja-JP" self.ENABLE_SPEAKER_IS_DYNAMIC = False self.SPEAKER_THRESHOLD = 300 ## Parameter self.OSC_IP_ADDRESS = "127.0.0.1" self.OSC_PORT = 9000 self.AUTH_KEYS = { "DeepL(web)": None, "DeepL(auth)": None, "Bing(web)": None, "Google(web)": None, } self.MESSAGE_FORMAT = "[message]([translation])" # load config if os.path.isfile(self.PATH_CONFIG) is not False: with open(self.PATH_CONFIG, 'r') as fp: config = json.load(fp) # main window if "ENABLE_TRANSLATION" in config.keys(): self.ENABLE_TRANSLATION = config["ENABLE_TRANSLATION"] if "ENABLE_TRANSCRIPTION" in config.keys(): self.ENABLE_TRANSCRIPTION = config["ENABLE_TRANSCRIPTION"] if "ENABLE_FOREGROUND" in config.keys(): self.ENABLE_FOREGROUND = config["ENABLE_FOREGROUND"] # tab ui if "TRANSPARENCY" in config.keys(): self.TRANSPARENCY = config["TRANSPARENCY"] if "APPEARANCE_THEME" in config.keys(): self.APPEARANCE_THEME = config["APPEARANCE_THEME"] if "UI_SCALING" in config.keys(): self.UI_SCALING = config["UI_SCALING"] if "FONT_FAMILY" in config.keys(): self.FONT_FAMILY = config["FONT_FAMILY"] # translation if "CHOICE_TRANSLATOR" in config.keys(): self.CHOICE_TRANSLATOR = config["CHOICE_TRANSLATOR"] if "INPUT_SOURCE_LANG" in config.keys(): self.INPUT_SOURCE_LANG = config["INPUT_SOURCE_LANG"] if "INPUT_TARGET_LANG" in config.keys(): self.INPUT_TARGET_LANG = config["INPUT_TARGET_LANG"] if "OUTPUT_SOURCE_LANG" in config.keys(): self.OUTPUT_SOURCE_LANG = config["OUTPUT_SOURCE_LANG"] if "OUTPUT_TARGET_LANG" in config.keys(): self.OUTPUT_TARGET_LANG = config["OUTPUT_TARGET_LANG"] # Transcription if "CHOICE_MIC_DEVICE" in config.keys(): self.CHOICE_MIC_DEVICE = config["CHOICE_MIC_DEVICE"] if "INPUT_MIC_VOICE_LANGUAGE" in config.keys(): self.INPUT_MIC_VOICE_LANGUAGE = config["INPUT_MIC_VOICE_LANGUAGE"] if "ENABLE_MIC_IS_DYNAMIC" in config.keys(): self.ENABLE_MIC_IS_DYNAMIC = config["ENABLE_MIC_IS_DYNAMIC"] if "MIC_THRESHOLD" in config.keys(): self.MIC_THRESHOLD = config["MIC_THRESHOLD"] if "CHOICE_SPEAKER_DEVICE" in config.keys(): self.CHOICE_SPEAKER_DEVICE = config["CHOICE_SPEAKER_DEVICE"] if "INPUT_SPEAKER_VOICE_LANGUAGE" in config.keys(): self.INPUT_SPEAKER_VOICE_LANGUAGE = config["INPUT_SPEAKER_VOICE_LANGUAGE"] if "ENABLE_SPEAKER_IS_DYNAMIC" in config.keys(): self.ENABLE_SPEAKER_IS_DYNAMIC = config["ENABLE_SPEAKER_IS_DYNAMIC"] if "SPEAKER_THRESHOLD" in config.keys(): self.SPEAKER_THRESHOLD = config["SPEAKER_THRESHOLD"] # Parameter if "OSC_IP_ADDRESS" in config.keys(): self.OSC_IP_ADDRESS = config["OSC_IP_ADDRESS"] if "OSC_PORT" in config.keys(): self.OSC_PORT = config["OSC_PORT"] if "AUTH_KEYS" in config.keys(): self.AUTH_KEYS = config["AUTH_KEYS"] if "MESSAGE_FORMAT" in config.keys(): self.MESSAGE_FORMAT = config["MESSAGE_FORMAT"] with open(self.PATH_CONFIG, 'w') as fp: config = { "ENABLE_TRANSLATION": self.ENABLE_TRANSLATION, "ENABLE_TRANSCRIPTION": self.ENABLE_TRANSCRIPTION, "ENABLE_FOREGROUND": self.ENABLE_FOREGROUND, "TRANSPARENCY": self.TRANSPARENCY, "APPEARANCE_THEME": self.APPEARANCE_THEME, "UI_SCALING": self.UI_SCALING, "FONT_FAMILY": self.FONT_FAMILY, "CHOICE_TRANSLATOR": self.CHOICE_TRANSLATOR, "INPUT_SOURCE_LANG": self.INPUT_SOURCE_LANG, "INPUT_TARGET_LANG": self.INPUT_TARGET_LANG, "OUTPUT_SOURCE_LANG": self.OUTPUT_SOURCE_LANG, "OUTPUT_TARGET_LANG": self.OUTPUT_TARGET_LANG, "CHOICE_MIC_DEVICE": self.CHOICE_MIC_DEVICE, "INPUT_MIC_VOICE_LANGUAGE": self.INPUT_MIC_VOICE_LANGUAGE, "ENABLE_MIC_IS_DYNAMIC": self.ENABLE_MIC_IS_DYNAMIC, "MIC_THRESHOLD": self.MIC_THRESHOLD, "CHOICE_SPEAKER_DEVICE": self.CHOICE_SPEAKER_DEVICE, "INPUT_SPEAKER_VOICE_LANGUAGE": self.INPUT_SPEAKER_VOICE_LANGUAGE, "ENABLE_SPEAKER_IS_DYNAMIC": self.ENABLE_SPEAKER_IS_DYNAMIC, "SPEAKER_THRESHOLD": self.SPEAKER_THRESHOLD, "OSC_IP_ADDRESS": self.OSC_IP_ADDRESS, "OSC_PORT": self.OSC_PORT, "AUTH_KEYS": self.AUTH_KEYS, "MESSAGE_FORMAT": self.MESSAGE_FORMAT, } json.dump(config, fp, indent=4) # init main window self.iconbitmap(os.path.join(os.path.dirname(__file__), "img", "app.ico")) self.title("VRCT") self.geometry(f"{400}x{140}") self.minsize(400, 140) self.grid_columnconfigure(1, weight=1) self.grid_rowconfigure(0, weight=1) # add sidebar left self.sidebar_frame = customtkinter.CTkFrame(self, corner_radius=0) self.sidebar_frame.grid(row=0, column=0, rowspan=4, sticky="nsw") self.sidebar_frame.grid_rowconfigure(5, weight=1) # add checkbox translation self.checkbox_translation = customtkinter.CTkCheckBox( self.sidebar_frame, text="Translation", onvalue=True, offvalue=False, command=self.checkbox_translation_callback, font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.checkbox_translation.grid(row=0, column=0, columnspan=2 ,padx=10, pady=(5, 5), sticky="we") # add checkbox transcription self.checkbox_transcription = customtkinter.CTkCheckBox( self.sidebar_frame, text="Transcription", onvalue=True, offvalue=False, command=self.checkbox_transcription_callback, font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.checkbox_transcription.grid(row=1, column=0, columnspan=2 ,padx=10, pady=(5, 5), sticky="we") # add checkbox foreground self.checkbox_foreground = customtkinter.CTkCheckBox( self.sidebar_frame, text="Foreground", onvalue=True, offvalue=False, command=self.checkbox_foreground_callback, font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.checkbox_foreground.grid(row=2, column=0, columnspan=2 ,padx=10, pady=(5, 5), sticky="we") # add button information self.button_information = customtkinter.CTkButton( self.sidebar_frame, text="", width=25, command=self.button_information_callback, image=customtkinter.CTkImage(Image.open(os.path.join(os.path.dirname(__file__), "img", "info-icon-white.png"))) ) self.button_information.grid(row=5, column=0, padx=(10, 5), pady=(5, 5), sticky="wse") self.information_window = None # add button config self.button_config = customtkinter.CTkButton( self.sidebar_frame, text="", width=25, command=self.button_config_callback, image=customtkinter.CTkImage(Image.open(os.path.join(os.path.dirname(__file__), "img", "config-icon-white.png"))) ) self.button_config.grid(row=5, column=1, padx=(5, 10), pady=(5, 5), sticky="wse") self.config_window = None # add tabview textbox self.tabview_logs = customtkinter.CTkTabview(master=self) self.tabview_logs.add("send") self.tabview_logs.add("receive") self.tabview_logs.grid(row=0, column=1, padx=5, pady=0, sticky="nsew") self.tabview_logs._segmented_button.grid(sticky="W") self.tabview_logs.tab("send").grid_rowconfigure(0, weight=1) self.tabview_logs.tab("send").grid_columnconfigure(0, weight=1) self.tabview_logs.tab("receive").grid_rowconfigure(0, weight=1) self.tabview_logs.tab("receive").grid_columnconfigure(0, weight=1) self.tabview_logs.configure(state='disabled') # add textbox message log self.textbox_message_log = customtkinter.CTkTextbox( self.tabview_logs.tab("send"), font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.textbox_message_log.grid(row=0, column=0, padx=0, pady=0, sticky="nsew") self.textbox_message_log.configure(state='disabled') # add textbox message log self.textbox_message_receive_log = customtkinter.CTkTextbox( self.tabview_logs.tab("receive"), font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.textbox_message_receive_log.grid(row=0, column=0, padx=0, pady=0, sticky="nsew") self.textbox_message_receive_log.configure(state='disabled') # add entry message box self.entry_message_box = customtkinter.CTkEntry( self, placeholder_text="message", font=customtkinter.CTkFont(family=self.FONT_FAMILY) ) self.entry_message_box.grid(row=1, column=1, columnspan=2, padx=(10, 10), pady=(5, 10), sticky="nsew") # set default values ## set translator instance self.translator = translation.Translator() if self.translator.authentication(self.CHOICE_TRANSLATOR, self.AUTH_KEYS[self.CHOICE_TRANSLATOR]) is False: # error update Auth key self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[ERROR] Auth Keyを設定してないか間違っています\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") ## set transcription instance self.vr = transcription.VoiceRecognizer() self.CHOICE_MIC_DEVICE = self.CHOICE_MIC_DEVICE if self.CHOICE_MIC_DEVICE is not None else list(self.vr.input_device_dict.keys())[0] ## set checkbox enable translation if self.ENABLE_TRANSLATION: self.checkbox_translation.select() self.checkbox_translation_callback() else: self.checkbox_translation.deselect() ## set checkbox enable transcription if self.ENABLE_TRANSCRIPTION: self.checkbox_transcription.select() else: self.checkbox_transcription.deselect() self.checkbox_transcription_callback() ## set set checkbox enable foreground if self.ENABLE_FOREGROUND: self.checkbox_foreground.select() else: self.checkbox_foreground.deselect() self.checkbox_foreground_callback() ## set bind entry message box self.entry_message_box.bind("", self.entry_message_box_press_key_enter) self.entry_message_box.bind("", self.entry_message_box_press_key_any) self.entry_message_box.bind("", self.entry_message_box_leave) ## set transparency for main window self.wm_attributes("-alpha", self.TRANSPARENCY/100) ## set UI scale new_scaling_float = int(self.UI_SCALING.replace("%", "")) / 100 customtkinter.set_widget_scaling(new_scaling_float) ## set UI theme customtkinter.set_appearance_mode(self.APPEARANCE_THEME) customtkinter.set_default_color_theme("blue") def button_config_callback(self): if self.config_window is None or not self.config_window.winfo_exists(): self.config_window = window_config.ToplevelWindowConfig(self) self.config_window.focus() def button_information_callback(self): if self.information_window is None or not self.information_window.winfo_exists(): self.information_window = window_information.ToplevelWindowInformation(self) self.information_window.focus() def checkbox_translation_callback(self): self.ENABLE_TRANSLATION = self.checkbox_translation.get() self.textbox_message_log.configure(state='normal') if self.ENABLE_TRANSLATION: self.textbox_message_log.insert("end", f"[INFO] start translation\n") else: self.textbox_message_log.insert("end", f"[INFO] stop translation\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") utils.save_json(self.PATH_CONFIG, "ENABLE_TRANSLATION", self.ENABLE_TRANSLATION) def checkbox_transcription_callback(self): self.ENABLE_TRANSCRIPTION = self.checkbox_transcription.get() if self.ENABLE_TRANSCRIPTION is True: # start threading th = threading.Thread(target = self.voice_input) th.start() utils.save_json(self.PATH_CONFIG, "ENABLE_TRANSCRIPTION", self.ENABLE_TRANSCRIPTION) def voice_input(self): self.vr.set_mic(self.CHOICE_MIC_DEVICE) self.vr.init_mic(threshold=self.MIC_THRESHOLD, is_dynamic=self.ENABLE_MIC_IS_DYNAMIC) # start voice_input if self.checkbox_transcription.get() is True: self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[INFO] start transcription\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") while self.checkbox_transcription.get() is True: message = self.vr.listen_voice(language=self.INPUT_MIC_VOICE_LANGUAGE) if len(message) > 0: # translate if self.checkbox_translation.get() is False: chat_message = f"{message}" elif (self.translator.translator_status[self.CHOICE_TRANSLATOR] is False) or (self.INPUT_SOURCE_LANG == "None") or (self.INPUT_TARGET_LANG == "None"): self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[ERROR] Auth Keyもしくは言語の設定が間違っています\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") chat_message = f"{message}" else: result = self.translator.translate( translator_name=self.CHOICE_TRANSLATOR, source_language=self.INPUT_SOURCE_LANG, target_language=self.INPUT_TARGET_LANG, message=message ) chat_message = self.MESSAGE_FORMAT.replace("[message]", message).replace("[translation]", result) # send OSC message osc_tools.send_message(chat_message, self.OSC_IP_ADDRESS, self.OSC_PORT) # update textbox message log self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[VOICE] {chat_message}\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[INFO] stop transcription\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") def checkbox_foreground_callback(self): self.ENABLE_FOREGROUND = self.checkbox_foreground.get() if self.ENABLE_FOREGROUND: self.attributes("-topmost", True) else: self.attributes("-topmost", False) utils.save_json(self.PATH_CONFIG, "ENABLE_FOREGROUND", self.ENABLE_FOREGROUND) def entry_message_box_press_key_enter(self, event): # send OSC typing osc_tools.send_typing(False, self.OSC_IP_ADDRESS, self.OSC_PORT) if self.ENABLE_FOREGROUND: self.attributes("-topmost", True) message = self.entry_message_box.get() if len(message) > 0: # translate if self.checkbox_translation.get() is False: chat_message = f"{message}" elif (self.translator.translator_status[self.CHOICE_TRANSLATOR] is False) or (self.INPUT_SOURCE_LANG == "None") or (self.INPUT_TARGET_LANG == "None"): self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[ERROR] Auth Keyもしくは言語の設定が間違っています\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") chat_message = f"{message}" else: result = self.translator.translate( translator_name=self.CHOICE_TRANSLATOR, source_language=self.INPUT_SOURCE_LANG, target_language=self.INPUT_TARGET_LANG, message=message ) chat_message = self.MESSAGE_FORMAT.replace("[message]", message).replace("[translation]", result) # send OSC message osc_tools.send_message(chat_message, self.OSC_IP_ADDRESS, self.OSC_PORT) # update textbox message log self.textbox_message_log.configure(state='normal') self.textbox_message_log.insert("end", f"[CHAT] {chat_message}\n") self.textbox_message_log.configure(state='disabled') self.textbox_message_log.see("end") # delete message in entry message box # self.entry_message_box.delete(0, customtkinter.END) def entry_message_box_press_key_any(self, event): # send OSC typing osc_tools.send_typing(True, self.OSC_IP_ADDRESS, self.OSC_PORT) if self.ENABLE_FOREGROUND: self.attributes("-topmost", False) def entry_message_box_leave(self, event): # send OSC typing osc_tools.send_typing(False, self.OSC_IP_ADDRESS, self.OSC_PORT) if self.ENABLE_FOREGROUND: self.attributes("-topmost", True) if __name__ == "__main__": app = App() app.mainloop()