feat: Implement translation prompt history injection for Chat/Mic/Speaker

- Added a history management system in model.py to store and retrieve recent messages from Chat, Mic, and Speaker.
- Updated controller.py to automatically add messages to the translation history after processing.
- Enhanced translation clients (OpenAI, Gemini, Groq, etc.) to accept and utilize context history for improved translation quality.
- Introduced YAML configuration options for enabling history injection and customizing its behavior across different translation models.
- Ensured that only original messages are stored in history to optimize token usage during translation.
2025-12-15 01:15:47 +09:00
parent 9e88cff889
commit dac903e07c
18 changed files with 734 additions and 7 deletions
--- a/src-python/models/translation/translation_openai.py
+++ b/src-python/models/translation/translation_openai.py
@@ -72,6 +72,16 @@ class OpenAIClient:
        prompt_config = loadTranslatePromptConfig(root_path, "translation_openai.yml")
        self.supported_languages = list(translation_lang["OpenAI_API"]["source"].keys())
        self.prompt_template = prompt_config["system_prompt"]
+        # history config (optional)
+        self.history_cfg = prompt_config.get("history", {
+            "use_history": False,
+            "sources": [],
+            "max_messages": 0,
+            "max_chars": 0,
+            "header_template": "",
+            "item_template": "[{source}] {role}: {text}",
+        })
+        self._context_history: list[dict] = []

        self.openai_llm = None

@@ -105,12 +115,62 @@ class OpenAIClient:
            streaming=False,
        )

+    def setContextHistory(self, history_items: list[dict]) -> None:
+        """Replace the history used for prompt injection (falsy input -> []).
+
+        Kept by reference, newest last. Each item should be a dict containing:
+        - source: "chat" | "mic" | "speaker" (filtered by config "sources")
+        - text: message string (NOTE(review): default item_template also wants {role})
+        - timestamp: ISO format datetime string (shown as HH:MM, "" if invalid)
+        """
+        self._context_history = history_items or []
+
    def translate(self, text: str, input_lang: str, output_lang: str) -> str:
        system_prompt = self.prompt_template.format(
            supported_languages=self.supported_languages,
            input_lang=input_lang,
            output_lang=output_lang,
        )
+
+        # Inject recent conversation history if enabled by YAML config
+        if self.history_cfg.get("use_history"):
+            allowed_sources = set(self.history_cfg.get("sources", []))
+            max_messages = int(self.history_cfg.get("max_messages", 0))
+            max_chars = int(self.history_cfg.get("max_chars", 0))
+            item_tmpl = self.history_cfg.get("item_template", "[{source}] {role}: {text}")
+            header_tmpl = self.history_cfg.get("header_template", "{history}")
+
+            # filter by source and take newest N
+            filtered = [h for h in self._context_history if h.get("source") in allowed_sources]
+            recent = filtered[-max_messages:] if max_messages > 0 else filtered
+            # format items
+            formatted_items = []
+            for h in recent:
+                # Format timestamp as HH:MM to save tokens
+                timestamp_str = ''
+                if 'timestamp' in h:
+                    from datetime import datetime
+                    try:
+                        ts = datetime.fromisoformat(h['timestamp'])
+                        timestamp_str = ts.strftime('%H:%M')
+                    except:
+                        timestamp_str = ''
+                formatted_items.append(
+                    item_tmpl.format(
+                        timestamp=timestamp_str,
+                        source=h.get("source", ""),
+                        text=h.get("text", ""),
+                    )
+                )
+            history_blob = "\n".join(formatted_items).strip()
+            # truncate by char limit to mitigate token use
+            if max_chars and len(history_blob) > max_chars:
+                history_blob = history_blob[-max_chars:]
+            # assemble header and append to system prompt
+            history_header = header_tmpl.format(max_messages=max_messages, history=history_blob)
+            if history_header:
+                system_prompt = f"{system_prompt}\n\n{history_header}"
+
        messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": text},