From 70efd85d85a087cf0a791139ee5d3732ee9217d9 Mon Sep 17 00:00:00 2001 From: misyaguziya Date: Wed, 5 Jun 2024 18:48:07 +0900 Subject: [PATCH] =?UTF-8?q?=F0=9F=91=8D=EF=B8=8F[Update]=20Model=20:=20?= =?UTF-8?q?=E4=BB=A5=E4=B8=8B=E3=81=AE=E3=83=AA=E3=83=B3=E3=82=AF=E3=81=AB?= =?UTF-8?q?=E5=9F=BA=E3=81=A5=E3=81=8D=E3=80=81=E6=96=87=E5=AD=97=E8=B5=B7?= =?UTF-8?q?=E3=81=93=E3=81=97=E3=81=AE=E8=A8=80=E8=AA=9E=E3=82=92=E8=BF=BD?= =?UTF-8?q?=E5=8A=A0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit https://cloud.google.com/speech-to-text/docs/speech-to-text-supported-languages?hl=ja --- .../transcription/transcription_languages.py | 332 ++++++++++++++++-- 1 file changed, 308 insertions(+), 24 deletions(-) diff --git a/models/transcription/transcription_languages.py b/models/transcription/transcription_languages.py index dd333424..12625df7 100644 --- a/models/transcription/transcription_languages.py +++ b/models/transcription/transcription_languages.py @@ -5,6 +5,18 @@ transcription_lang = { "Whisper": "af", }, }, + "Albanian":{ + "Albania":{ + "Google": "sq-AL", + "Whisper": "sq", + }, + }, + "Amharic":{ + "Ethiopia":{ + "Google": "am-ET", + "Whisper": "am", + }, + }, "Arabic":{ "Algeria":{ "Google": "ar-DZ", @@ -38,6 +50,10 @@ transcription_lang = { "Google": "ar-LB", "Whisper": "ar", }, + "Mauritania":{ + "Google": "ar-MR", + "Whisper": "ar", + }, "Morocco":{ "Google": "ar-MA", "Whisper": "ar", @@ -46,10 +62,6 @@ transcription_lang = { "Google": "ar-OM", "Whisper": "ar", }, - "State of Palestine":{ - "Google": "ar-PS", - "Whisper": "ar", - }, "Qatar":{ "Google": "ar-QA", "Whisper": "ar", @@ -58,6 +70,14 @@ transcription_lang = { "Google": "ar-SA", "Whisper": "ar", }, + "Palestine":{ + "Google": "ar-PS", + "Whisper": "ar", + }, + "Syria":{ + "Google": "ar-SY", + "Whisper": "ar", + }, "Tunisia":{ "Google": "ar-TN", "Whisper": "ar", @@ -66,6 +86,22 @@ transcription_lang = { "Google": "ar-AE", "Whisper": "ar", }, + "Yemen":{ + 
"Google": "ar-YE", + "Whisper": "ar", + }, + }, + "Armenian": { + "Armenia": { + "Google": "hy-AM", + "Whisper": "hy", + }, + }, + "Azerbaijani": { + "Azerbaijan": { + "Google": "az-AZ", + "Whisper": "az", + }, }, "Basque":{ "Spain":{ @@ -73,12 +109,34 @@ transcription_lang = { "Whisper": "eu", }, }, + "Bengali":{ + "Bangladesh":{ + "Google": "bn-BD", + "Whisper": "bn", + }, + "India":{ + "Google": "bn-IN", + "Whisper": "bn", + }, + }, + "Bosnian":{ + "Bosnia and Herzegovina":{ + "Google": "bs-BA", + "Whisper": "bs", + } + }, "Bulgarian":{ "Bulgaria":{ "Google": "bg-BG", "Whisper": "bg", }, }, + "Burmese":{ + "Myanmar":{ + "Google": "my-MM", + "Whisper": "my", + }, + }, "Catalan":{ "Spain":{ "Google": "ca-ES", @@ -124,20 +182,16 @@ transcription_lang = { }, }, "Dutch":{ + "Belgium":{ + "Google": "nl-BE", + "Whisper": "nl", + }, "Netherlands":{ "Google": "nl-NL", "Whisper": "nl", }, }, "English": { - "United States":{ - "Google": "en-US", - "Whisper": "en", - }, - "United Kingdom":{ - "Google": "en-GB", - "Whisper": "en", - }, "Australia":{ "Google": "en-AU", "Whisper": "en", @@ -146,6 +200,14 @@ transcription_lang = { "Google": "en-CA", "Whisper": "en", }, + "Ghana":{ + "Google": "en-GH", + "Whisper": "en", + }, + "Hong Kong":{ + "Google": "en-HK", + "Whisper": "en", + }, "India":{ "Google": "en-IN", "Whisper": "en", @@ -154,18 +216,42 @@ transcription_lang = { "Google": "en-IE", "Whisper": "en", }, + "Kenya":{ + "Google": "en-KE", + "Whisper": "en", + }, "New Zealand":{ "Google": "en-NZ", "Whisper": "en", }, + "Nigeria":{ + "Google": "en-NG", + "Whisper": "en", + }, "Philippines":{ "Google": "en-PH", "Whisper": "en", }, + "Singapore":{ + "Google": "en-SG", + "Whisper": "en", + }, "South Africa":{ "Google": "en-ZA", "Whisper": "en", }, + "Tanzania":{ + "Google": "en-TZ", + "Whisper": "en", + }, + "United Kingdom":{ + "Google": "en-GB", + "Whisper": "en", + }, + "United States":{ + "Google": "en-US", + "Whisper": "en", + }, }, "Estonian":{ "Estonia":{ @@ -186,10 
+272,22 @@ transcription_lang = { }, }, "French":{ + "Belgium":{ + "Google": "fr-BE", + "Whisper": "fr", + }, + "Canada":{ + "Google": "fr-CA", + "Whisper": "fr", + }, "France":{ "Google": "fr-FR", "Whisper": "fr", }, + "Switzerland":{ + "Google": "fr-CH", + "Whisper": "fr", + }, }, "Galician":{ "Spain":{ @@ -197,11 +295,25 @@ transcription_lang = { "Whisper": "gl", }, }, + "Georgian":{ + "Georgia":{ + "Google": "ka-GE", + "Whisper": "ka", + }, + }, "German":{ + "Austria":{ + "Google": "de-AT", + "Whisper": "de", + }, "Germany":{ "Google": "de-DE", "Whisper": "de", }, + "Switzerland":{ + "Google": "de-CH", + "Whisper": "de", + }, }, "Greek":{ "Greece":{ @@ -209,9 +321,15 @@ transcription_lang = { "Whisper": "el", }, }, + "Gujarati":{ + "India":{ + "Google": "gu-IN", + "Whisper": "gu", + }, + }, "Hebrew":{ "Israel":{ - "Google": "he-IL", + "Google": "iw-IL", "Whisper": "he", }, }, @@ -227,18 +345,18 @@ transcription_lang = { "Whisper": "hu", }, }, - "Indonesian":{ - "Indonesia":{ - "Google": "id-ID", - "Whisper": "id", - }, - }, "Icelandic":{ "Iceland":{ "Google": "is-IS", "Whisper": "is", }, }, + "Indonesian":{ + "Indonesia":{ + "Google": "id-ID", + "Whisper": "id", + }, + }, "Italian":{ "Italy":{ "Google": "it-IT", @@ -255,27 +373,91 @@ transcription_lang = { "Whisper": "ja", }, }, + # "Javanese":{ + # "Indonesia":{ + # "Google": "jv-ID", + # }, + # }, + "Kannada":{ + "India":{ + "Google": "kn-IN", + "Whisper": "kn", + }, + }, + "Kazakh":{ + "Kazakhstan":{ + "Google": "kk-KZ", + "Whisper": "kk", + }, + }, + "Khmer":{ + "Cambodia":{ + "Google": "km-KH", + "Whisper": "km", + }, + }, + # "Kinyarwanda":{ + # "rwanda":{ + # "Google": "rw-RW", + # }, + # }, "Korean":{ "South Korea":{ "Google": "ko-KR", "Whisper": "ko", }, }, + "Lao":{ + "Laos":{ + "Google": "lo-LA", + "Whisper": "lo", + }, + }, + "Latvian":{ + "Latvia":{ + "Google": "lv-LV", + "Whisper": "lv", + }, + }, "Lithuanian":{ "Lithuania":{ "Google": "lt-LT", "Whisper": "lt", }, }, + "Macedonian":{ + "North 
Macedonia":{ + "Google": "mk-MK", + "Whisper": "mk", + }, + }, "Malay":{ "Malaysia":{ "Google": "ms-MY", "Whisper": "ms", }, }, + "Malayalam":{ + "India":{ + "Google": "ml-IN", + "Whisper": "ml", + }, + }, + "Mongolian":{ + "Mongolia":{ + "Google": "mn-MN", + "Whisper": "mn", + }, + }, + "Nepali":{ + "Nepal":{ + "Google": "ne-NP", + "Whisper": "ne", + }, + }, "Norwegian":{ "Norway":{ - "Google": "nb-NO", + "Google": "no-NO", "Whisper": "no", }, }, @@ -301,6 +483,11 @@ transcription_lang = { "Whisper": "pt", }, }, + # "Punjabi":{ + # "India":{ + # "Google": "pa-Guru-IN", + # }, + # }, "Romanian":{ "Romania":{ "Google": "ro-RO", @@ -319,6 +506,12 @@ transcription_lang = { "Whisper": "sr", }, }, + "Sinhala":{ + "Sri Lanka":{ + "Google": "si-LK", + "Whisper": "si", + }, + }, "Slovak":{ "Slovakia":{ "Google": "sk-SK", @@ -331,6 +524,11 @@ transcription_lang = { "Whisper": "sl", }, }, + # "Sesotho":{ + # "South Africa":{ + # "Google": "st-ZA", + # }, + # }, "Spanish":{ "Argentina":{ "Google": "es-AR", @@ -400,31 +598,86 @@ transcription_lang = { "Google": "es-ES", "Whisper": "es", }, - "Uruguay":{ - "Google": "es-UY", - "Whisper": "es", - }, "United States":{ "Google": "es-US", "Whisper": "es", }, + "Uruguay":{ + "Google": "es-UY", + "Whisper": "es", + }, "Venezuela":{ "Google": "es-VE", "Whisper": "es", }, }, + "Sundanese":{ + "Indonesia":{ + "Google": "su-ID", + "Whisper": "su", + }, + }, + "Swahili":{ + "Kenya":{ + "Google": "sw-KE", + "Whisper": "sw", + }, + "Tanzania":{ + "Google": "sw-TZ", + "Whisper": "sw", + }, + }, + # "Swazi":{ + # "Eswatini":{ + # "Google": "ss-Latn-ZA", + # }, + # }, "Swedish":{ "Sweden":{ "Google": "sv-SE", "Whisper": "sv", }, }, + "Tamil":{ + "India":{ + "Google": "ta-IN", + "Whisper": "ta", + }, + "Malaysia":{ + "Google": "ta-MY", + "Whisper": "ta", + }, + "Singapore":{ + "Google": "ta-SG", + "Whisper": "ta", + }, + "Sri Lanka":{ + "Google": "ta-LK", + "Whisper": "ta", + }, + }, + "Telugu":{ + "India":{ + "Google": "te-IN", + "Whisper": 
"te", + }, + }, "Thai":{ "Thailand":{ "Google": "th-TH", "Whisper": "th", }, }, + # "Tsonga":{ + # "South Africa":{ + # "Google": "ts-ZA", + # }, + # }, + # "Setswana":{ + # "South Africa":{ + # "Google": "tn-Latn-ZA", + # }, + # }, "Turkish":{ "Turkey":{ "Google": "tr-TR", @@ -437,10 +690,41 @@ transcription_lang = { "Whisper": "uk", }, }, + "Urdu":{ + "India":{ + "Google": "ur-IN", + "Whisper": "ur", + }, + "Pakistan":{ + "Google": "ur-PK", + "Whisper": "ur", + }, + }, + "Uzbek":{ + "Uzbekistan":{ + "Google": "uz-UZ", + "Whisper": "uz", + }, + }, + # "Venda":{ + # "South Africa":{ + # "Google": "ve-ZA", + # }, + # }, "Vietnamese":{ "Vietnam":{ "Google": "vi-VN", "Whisper": "vi", }, }, + # "Xhosa":{ + # "South Africa":{ + # "Google": "xh-ZA", + # }, + # }, + # "Zulu":{ + # "South Africa":{ + # "Google": "zu-ZA", + # }, + # }, } \ No newline at end of file