From 202e459aadef0c806e86347213e05e014f2b9701 Mon Sep 17 00:00:00 2001 From: misyaguziya Date: Mon, 4 Mar 2024 17:18:28 +0900 Subject: [PATCH] =?UTF-8?q?=F0=9F=90=9B[bugifx]=20Model:=20=E4=B8=AD?= =?UTF-8?q?=E5=9B=BD=E8=AA=9E=E3=80=81=E7=B9=81=E4=BD=93=E5=AD=97=E3=81=8C?= =?UTF-8?q?=E8=A1=A8=E7=A4=BA=E3=81=95=E3=82=8C=E3=81=AA=E3=81=84=E3=81=9A?= =?UTF-8?q?=E3=80=81=E5=85=A8=E9=83=A8=E7=B0=A1=E4=BD=93=E5=AD=97=E3=81=AB?= =?UTF-8?q?=E3=81=AA=E3=81=A3=E3=81=A6=E3=82=8B=E5=95=8F=E9=A1=8C=E3=82=92?= =?UTF-8?q?=E4=BF=AE=E6=AD=A3?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../transcription/transcription_languages.py | 12 +- models/translation/translation_languages.py | 311 +++++++++--------- 2 files changed, 166 insertions(+), 157 deletions(-) diff --git a/models/transcription/transcription_languages.py b/models/transcription/transcription_languages.py index 63d92568..c2cfa914 100644 --- a/models/transcription/transcription_languages.py +++ b/models/transcription/transcription_languages.py @@ -85,20 +85,22 @@ transcription_lang = { "Whisper": "ca", }, }, - "Chinese":{ - "Mandarin (Simplified, China)":{ + "Chinese Simplified":{ + "China":{ "Google": "cmn-Hans-CN", "Whisper": "zh", }, - "Mandarin (Simplified, Hong Kong)":{ + "Hong Kong":{ "Google": "cmn-Hans-HK", "Whisper": "zh", }, - "Mandarin (Traditional, Taiwan)":{ + }, + "Chinese Traditional":{ + "Taiwan":{ "Google": "cmn-Hant-TW", "Whisper": "zh", }, - "Cantonese (Traditional Hong Kong)":{ + "Hong Kong":{ "Google": "yue-Hant-HK", "Whisper": "yue", }, diff --git a/models/translation/translation_languages.py b/models/translation/translation_languages.py index 44051f8a..a697960b 100644 --- a/models/translation/translation_languages.py +++ b/models/translation/translation_languages.py @@ -1,40 +1,41 @@ translation_lang = {} dict_deepl_languages = { - 'Arabic':'ar', - 'Bulgarian':'bg', - 'Czech':'cs', - 'Danish':'da', - 'German':'de', - 'Greek':'el', - 'English':'en', - 'Spanish':'es', - 'Estonian':'et', - 'Finnish':'fi', - 'French':'fr', - 'Irish':'ga', - 'Croatian':'hr', - 'Hungarian':'hu', - 'Indonesian':'id', - 'Icelandic':'is', - 'Italian':'it', - 'Japanese':'ja', - 'Korean':'ko', - 'Lithuanian':'lt', - 'Latvian':'lv', - 'Maltese':'mt', - 'Bokmal':'nb', - 'Dutch':'nl', - 'Norwegian':'no', - 'Polish':'pl', - 'Portuguese':'pt', - 'Romanian':'ro', - 'Russian':'ru', - 'Slovak':'sk', - 'Slovenian':'sl', - 'Swedish':'sv', - 'Turkish':'tr', - 'Ukrainian':'uk', - 'Chinese':'zh', + "Arabic":"ar", + "Bulgarian":"bg", + "Czech":"cs", + "Danish":"da", + "German":"de", + "Greek":"el", + "English":"en", + "Spanish":"es", + "Estonian":"et", + "Finnish":"fi", + "French":"fr", + "Irish":"ga", + "Croatian":"hr", + "Hungarian":"hu", + "Indonesian":"id", + "Icelandic":"is", + "Italian":"it", + "Japanese":"ja", + "Korean":"ko", + "Lithuanian":"lt", + "Latvian":"lv", + "Maltese":"mt", + "Bokmal":"nb", + "Dutch":"nl", + "Norwegian":"no", + "Polish":"pl", + "Portuguese":"pt", + "Romanian":"ro", + "Russian":"ru", + "Slovak":"sk", + "Slovenian":"sl", + "Swedish":"sv", + "Turkish":"tr", + "Ukrainian":"uk", + "Chinese Simplified":"zh", + "Chinese Traditional":"zh" } translation_lang["DeepL"] = { "source":dict_deepl_languages, @@ -70,7 +71,8 @@ dict_deepl_api_source_languages = { "Swedish":"sv", "Turkish":"tr", "Ukrainian":"uk", - "Chinese":"zh" + "Chinese Simplified":"zh", + "Chinese Traditional":"zh" } dict_deepl_api_target_languages = { "Japanese":"ja", @@ -104,7 +106,8 @@ dict_deepl_api_target_languages = { "Swedish":"sv", "Turkish":"tr", "Ukrainian":"uk", - "Chinese":"zh" + "Chinese Simplified":"zh", + "Chinese Traditional":"zh" } translation_lang["DeepL_API"] = { "source": dict_deepl_api_source_languages, @@ -114,7 +117,8 @@ translation_lang["DeepL_API"] = { dict_google_languages = { "Japanese":"ja", "English":"en", - "Chinese":"zh", + "Chinese Simplified":"zh", + "Chinese Traditional":"zh-TW", "Arabic":"ar", "Russian":"ru", "French":"fr", @@ -183,7 +187,8 @@ translation_lang["Google"] = { dict_bing_languages = { "Japanese":"ja", "English":"en", - "Chinese":"zh", + "Chinese Simplified":"zh", + "Chinese Traditional":"zh-Hant", "Arabic":"ar", "Russian":"ru", "French":"fr", @@ -248,20 +253,21 @@ translation_lang["Bing"] = { } dict_papago_languages = { - 'German': 'de', - 'English': 'en', - 'Spanish':'es', - 'French': 'fr', - 'Hindi': 'hi', - 'Indonesian': 'id', - 'Italian': 'it', - 'Japanese': 'ja', - 'Korean': 'ko', - 'Portuguese': 'pt', - 'Russian': 'ru', - 'Thai': 'th', - 'Vietnamese': 'vi', - 'Chinese':'zh-CN', + "German": "de", + "English": "en", + "Spanish":"es", + "French": "fr", + "Hindi": "hi", + "Indonesian": "id", + "Italian": "it", + "Japanese": "ja", + "Korean": "ko", + "Portuguese": "pt", + "Russian": "ru", + "Thai": "th", + "Vietnamese": "vi", + "Chinese Simplified":"zh-CN", + "Chinese Traditional":"zh-TW", } translation_lang["Papago"] = { @@ -270,105 +276,106 @@ translation_lang["Papago"] = { } dict_ctranslate2_languages = { - 'English': 'en', - 'Chinese': 'zh', - 'German': 'de', - 'Spanish': 'es', - 'Russian': 'ru', - 'Korean': 'ko', - 'French': 'fr', - 'Japanese': 'ja', - 'Portuguese': 'pt', - 'Turkish': 'tr', - 'Polish': 'pl', - 'Catalan': 'ca', - 'Dutch': 'nl', - 'Arabic': 'ar', - 'Swedish': 'sv', - 'Italian': 'it', - 'Indonesian': 'id', - 'Hindi': 'hi', - 'Finnish': 'fi', - 'Vietnamese': 'vi', - 'Hebrew': 'he', - 'Ukrainian': 'uk', - 'Greek': 'el', - 'Malay': 'ms', - 'Czech': 'cs', - 'Romanian': 'ro', - 'Danish': 'da', - 'Hungarian': 'hu', - 'Tamil': 'ta', - 'Norwegian': 'no', - 'Thai': 'th', - 'Urdu': 'ur', - 'Croatian': 'hr', - 'Bulgarian': 'bg', - 'Lithuanian': 'lt', - 'Latin': 'la', - 'Maori': 'mi', - 'Malayalam': 'ml', - 'Welsh': 'cy', - 'Slovak': 'sk', - 'Telugu': 'te', - 'Persian': 'fa', - 'Latvian': 'lv', - 'Bengali': 'bn', - 'Serbian': 'sr', - 'Azerbaijani': 'az', - 'Slovenian': 'sl', - 'Kannada': 'kn', - 'Estonian': 'et', - 'Macedonian': 'mk', - 'Breton': 'br', - 'Basque': 'eu', - 'Icelandic': 'is', - 'Armenian': 'hy', - 'Nepali': 'ne', - 'Mongolian': 'mn', - 'Bosnian': 'bs', - 'Kazakh': 'kk', - 'Albanian': 'sq', - 'Swahili': 'sw', - 'Galician': 'gl', - 'Marathi': 'mr', - 'Punjabi': 'pa', - 'Sinhala': 'si', - 'Khmer': 'km', - 'Shona': 'sn', - 'Yoruba': 'yo', - 'Somali': 'so', - 'Afrikaans': 'af', - 'Occitan': 'oc', - 'Georgian': 'ka', - 'Belarusian': 'be', - 'Tajik': 'tg', - 'Sindhi': 'sd', - 'Gujarati': 'gu', - 'Amharic': 'am', - 'Yiddish': 'yi', - 'Lao': 'lo', - 'Uzbek': 'uz', - 'Faroese': 'fo', - 'Haitian creole': 'ht', - 'Pashto': 'ps', - 'Turkmen': 'tk', - 'Nynorsk': 'nn', - 'Maltese': 'mt', - 'Sanskrit': 'sa', - 'Luxembourgish': 'lb', - 'Myanmar': 'my', - 'Tibetan': 'bo', - 'Filipino': 'tl', - 'Malagasy': 'mg', - 'Assamese': 'as', - 'Tatar': 'tt', - 'Hawaiian': 'haw', - 'Lingala': 'ln', - 'Hausa': 'ha', - 'Bashkir': 'ba', - 'Javanese': 'jw', - 'Sundanese': 'su' + "English": "en", + "Chinese Simplified": "zh", + "Chinese Traditional":"zh", + "German": "de", + "Spanish": "es", + "Russian": "ru", + "Korean": "ko", + "French": "fr", + "Japanese": "ja", + "Portuguese": "pt", + "Turkish": "tr", + "Polish": "pl", + "Catalan": "ca", + "Dutch": "nl", + "Arabic": "ar", + "Swedish": "sv", + "Italian": "it", + "Indonesian": "id", + "Hindi": "hi", + "Finnish": "fi", + "Vietnamese": "vi", + "Hebrew": "he", + "Ukrainian": "uk", + "Greek": "el", + "Malay": "ms", + "Czech": "cs", + "Romanian": "ro", + "Danish": "da", + "Hungarian": "hu", + "Tamil": "ta", + "Norwegian": "no", + "Thai": "th", + "Urdu": "ur", + "Croatian": "hr", + "Bulgarian": "bg", + "Lithuanian": "lt", + "Latin": "la", + "Maori": "mi", + "Malayalam": "ml", + "Welsh": "cy", + "Slovak": "sk", + "Telugu": "te", + "Persian": "fa", + "Latvian": "lv", + "Bengali": "bn", + "Serbian": "sr", + "Azerbaijani": "az", + "Slovenian": "sl", + "Kannada": "kn", + "Estonian": "et", + "Macedonian": "mk", + "Breton": "br", + "Basque": "eu", + "Icelandic": "is", + "Armenian": "hy", + "Nepali": "ne", + "Mongolian": "mn", + "Bosnian": "bs", + "Kazakh": "kk", + "Albanian": "sq", + "Swahili": "sw", + "Galician": "gl", + "Marathi": "mr", + "Punjabi": "pa", + "Sinhala": "si", + "Khmer": "km", + "Shona": "sn", + "Yoruba": "yo", + "Somali": "so", + "Afrikaans": "af", + "Occitan": "oc", + "Georgian": "ka", + "Belarusian": "be", + "Tajik": "tg", + "Sindhi": "sd", + "Gujarati": "gu", + "Amharic": "am", + "Yiddish": "yi", + "Lao": "lo", + "Uzbek": "uz", + "Faroese": "fo", + "Haitian creole": "ht", + "Pashto": "ps", + "Turkmen": "tk", + "Nynorsk": "nn", + "Maltese": "mt", + "Sanskrit": "sa", + "Luxembourgish": "lb", + "Myanmar": "my", + "Tibetan": "bo", + "Filipino": "tl", + "Malagasy": "mg", + "Assamese": "as", + "Tatar": "tt", + "Hawaiian": "haw", + "Lingala": "ln", + "Hausa": "ha", + "Bashkir": "ba", + "Javanese": "jw", + "Sundanese": "su" } translation_lang["CTranslate2"] = {