Files
VRCT/src-python/models/translation/translation_ollama.py
misyaguziya dac903e07c feat: Implement translation prompt history injection for Chat/Mic/Speaker
- Added a history management system in model.py to store and retrieve recent messages from Chat, Mic, and Speaker.
- Updated controller.py to automatically add messages to the translation history after processing.
- Enhanced translation clients (OpenAI, Gemini, Groq, etc.) to accept and utilize context history for improved translation quality.
- Introduced YAML configuration options for enabling history injection and customizing its behavior across different translation models.
- Ensured that only original messages are stored in history to optimize token usage during translation.
2025-12-15 01:15:47 +09:00

169 lines
6.1 KiB
Python

import requests
from langchain_ollama import ChatOllama
try:
from .translation_languages import translation_lang
from .translation_utils import loadTranslatePromptConfig
except Exception:
import sys
from os import path as os_path
sys.path.append(os_path.dirname(os_path.abspath(__file__)))
from translation_languages import translation_lang, loadTranslationLanguages
from translation_utils import loadTranslatePromptConfig
translation_lang = loadTranslationLanguages(path=".", force=True)
def _authentication_check(base_url: str | None = None) -> bool:
"""Check authentication for Ollama API.
"""
try:
response = requests.get(f"{base_url}", timeout=0.2)
if response.status_code == 200:
return True
else:
return False
except Exception:
return False
def _get_available_text_models(base_url: str | None = None) -> list[str]:
"""Extract available text models from Ollama.
"""
try:
response = requests.get(f"{base_url}/api/tags")
models = response.json()["models"]
except Exception:
models = []
allowed_models = []
for model in models:
allowed_models.append(model["name"])
allowed_models.sort()
return allowed_models
class OllamaClient:
"""Ollama Translation simple wrapper.
prompt/translation_ollama.yml から system_prompt / supported_languages を読み込む。
"""
def __init__(self, root_path: str = None):
self.model = None
self.base_url = "http://localhost:11434"
prompt_config = loadTranslatePromptConfig(root_path, "translation_ollama.yml")
self.supported_languages = list(translation_lang["Ollama"]["source"].keys())
self.prompt_template = prompt_config["system_prompt"]
# history config (optional)
self.history_cfg = prompt_config.get("history", {
"use_history": False,
"sources": [],
"max_messages": 0,
"max_chars": 0,
"header_template": "",
"item_template": "[{source}] {role}: {text}",
})
self._context_history: list[dict] = []
self.openai_llm = None
def authenticationCheck(self) -> bool:
return _authentication_check(self.base_url)
def getModelList(self) -> list[str]:
if self.authenticationCheck():
return _get_available_text_models(self.base_url)
return []
def getModel(self) -> str:
return self.model
def setModel(self, model: str) -> bool:
if model in self.getModelList():
self.model = model
return True
else:
return False
def updateClient(self) -> None:
self.openai_llm = ChatOllama(
base_url=self.base_url,
model=self.model,
streaming=False,
)
def setContextHistory(self, history_items: list[dict]) -> None:
"""Set recent conversation history for prompt injection.
Each item should be a dict containing:
- source: "chat" | "mic" | "speaker"
- text: message string
- timestamp: ISO format datetime string
"""
self._context_history = history_items or []
def translate(self, text: str, input_lang: str, output_lang: str) -> str:
system_prompt = self.prompt_template.format(
supported_languages=self.supported_languages,
input_lang=input_lang,
output_lang=output_lang,
)
# Inject recent conversation history if enabled by YAML config
if self.history_cfg.get("use_history"):
allowed_sources = set(self.history_cfg.get("sources", []))
max_messages = int(self.history_cfg.get("max_messages", 0))
max_chars = int(self.history_cfg.get("max_chars", 0))
item_tmpl = self.history_cfg.get("item_template", "[{source}] {role}: {text}")
header_tmpl = self.history_cfg.get("header_template", "{history}")
filtered = [h for h in self._context_history if h.get("source") in allowed_sources]
recent = filtered[-max_messages:] if max_messages > 0 else filtered
formatted_items = []
for h in recent:
# Format timestamp as HH:MM to save tokens
timestamp_str = ''
if 'timestamp' in h:
from datetime import datetime
try:
ts = datetime.fromisoformat(h['timestamp'])
timestamp_str = ts.strftime('%H:%M')
except:
timestamp_str = ''
formatted_items.append(
item_tmpl.format(
timestamp=timestamp_str,
source=h.get("source", ""),
text=h.get("text", ""),
)
)
history_blob = "\n".join(formatted_items).strip()
if max_chars and len(history_blob) > max_chars:
history_blob = history_blob[-max_chars:]
history_header = header_tmpl.format(max_messages=max_messages, history=history_blob)
if history_header:
system_prompt = f"{system_prompt}\n\n{history_header}"
messages = [
{"role": "system", "content": system_prompt},
{"role": "user", "content": text},
]
resp = self.openai_llm.invoke(messages)
content = ""
if isinstance(resp.content, str):
content = resp.content
elif isinstance(resp.content, list):
for part in resp.content:
if isinstance(part, str):
content += part
elif isinstance(part, dict) and "content" in part and isinstance(part["content"], str):
content += part["content"]
return content.strip()
if __name__ == "__main__":
client = OllamaClient()
models = client.getModelList()
if models:
print("Available models:", models)
model = input("Select a model: ")
client.setModel(model)
client.updateClient()
print(client.translate("こんにちは世界", "Japanese", "English"))