From 7ef711a2d08a7d9ef9e24844e374b1f8985d7694 Mon Sep 17 00:00:00 2001 From: Konstantin Date: Fri, 3 Feb 2023 20:42:53 +0100 Subject: Comments --- Tools/CompressShaders/LanguageCodes.cs | 4 +- WhisperNet/API/eLanguage.cs | 200 +++++++++++++++++---------------- 2 files changed, 104 insertions(+), 100 deletions(-) diff --git a/Tools/CompressShaders/LanguageCodes.cs b/Tools/CompressShaders/LanguageCodes.cs index 71a9909..0843fc7 100644 --- a/Tools/CompressShaders/LanguageCodes.cs +++ b/Tools/CompressShaders/LanguageCodes.cs @@ -71,6 +71,8 @@ namespace CompressShaders namespace Whisper { /// Supported languages + /// The values of this enum are zero-padded ASCII strings.
+ /// It seems OpenAI tried to implement ISO 639-1, but they used the version of the standard from 1988.
public enum eLanguage: uint {" ); @@ -79,7 +81,7 @@ namespace Whisper string tc = row.name.titleCase(); stm.WriteLine( " /// {0}", tc ); tc = Regex.Replace( tc, @"\s+", string.Empty ); - stm.WriteLine( " {0} = 0x{1:X},", tc, row.keyValue ); + stm.WriteLine( " {0} = 0x{1:X}, // \"{2}\"", tc, row.keyValue, row.keySource ); } stm.Write( @" } }" ); diff --git a/WhisperNet/API/eLanguage.cs b/WhisperNet/API/eLanguage.cs index 1241077..e78b81c 100644 --- a/WhisperNet/API/eLanguage.cs +++ b/WhisperNet/API/eLanguage.cs @@ -2,205 +2,207 @@ namespace Whisper { /// Supported languages + /// The values of this enum are zero-padded ASCII strings.
+ /// It seems OpenAI tried to implement ISO 639-1, but they used the version of the standard from 1988.
public enum eLanguage: uint { /// Afrikaans - Afrikaans = 0x6661, + Afrikaans = 0x6661, // "af" /// Albanian - Albanian = 0x7173, + Albanian = 0x7173, // "sq" /// Amharic - Amharic = 0x6D61, + Amharic = 0x6D61, // "am" /// Arabic - Arabic = 0x7261, + Arabic = 0x7261, // "ar" /// Armenian - Armenian = 0x7968, + Armenian = 0x7968, // "hy" /// Assamese - Assamese = 0x7361, + Assamese = 0x7361, // "as" /// Azerbaijani - Azerbaijani = 0x7A61, + Azerbaijani = 0x7A61, // "az" /// Bashkir - Bashkir = 0x6162, + Bashkir = 0x6162, // "ba" /// Basque - Basque = 0x7565, + Basque = 0x7565, // "eu" /// Belarusian - Belarusian = 0x6562, + Belarusian = 0x6562, // "be" /// Bengali - Bengali = 0x6E62, + Bengali = 0x6E62, // "bn" /// Bosnian - Bosnian = 0x7362, + Bosnian = 0x7362, // "bs" /// Breton - Breton = 0x7262, + Breton = 0x7262, // "br" /// Bulgarian - Bulgarian = 0x6762, + Bulgarian = 0x6762, // "bg" /// Catalan - Catalan = 0x6163, + Catalan = 0x6163, // "ca" /// Chinese - Chinese = 0x687A, + Chinese = 0x687A, // "zh" /// Croatian - Croatian = 0x7268, + Croatian = 0x7268, // "hr" /// Czech - Czech = 0x7363, + Czech = 0x7363, // "cs" /// Danish - Danish = 0x6164, + Danish = 0x6164, // "da" /// Dutch - Dutch = 0x6C6E, + Dutch = 0x6C6E, // "nl" /// English - English = 0x6E65, + English = 0x6E65, // "en" /// Estonian - Estonian = 0x7465, + Estonian = 0x7465, // "et" /// Faroese - Faroese = 0x6F66, + Faroese = 0x6F66, // "fo" /// Finnish - Finnish = 0x6966, + Finnish = 0x6966, // "fi" /// French - French = 0x7266, + French = 0x7266, // "fr" /// Galician - Galician = 0x6C67, + Galician = 0x6C67, // "gl" /// Georgian - Georgian = 0x616B, + Georgian = 0x616B, // "ka" /// German - German = 0x6564, + German = 0x6564, // "de" /// Greek - Greek = 0x6C65, + Greek = 0x6C65, // "el" /// Gujarati - Gujarati = 0x7567, + Gujarati = 0x7567, // "gu" /// Haitian Creole - HaitianCreole = 0x7468, + HaitianCreole = 0x7468, // "ht" /// Hausa - Hausa = 0x6168, + Hausa = 0x6168, // "ha" /// Hawaiian - Hawaiian = 0x776168, + Hawaiian = 0x776168, // "haw" /// Hebrew - Hebrew = 0x7769, + Hebrew = 0x7769, // "iw" /// Hindi - Hindi = 0x6968, + Hindi = 0x6968, // "hi" /// Hungarian - Hungarian = 0x7568, + Hungarian = 0x7568, // "hu" /// Icelandic - Icelandic = 0x7369, + Icelandic = 0x7369, // "is" /// Indonesian - Indonesian = 0x6469, + Indonesian = 0x6469, // "id" /// Italian - Italian = 0x7469, + Italian = 0x7469, // "it" /// Japanese - Japanese = 0x616A, + Japanese = 0x616A, // "ja" /// Javanese - Javanese = 0x776A, + Javanese = 0x776A, // "jw" /// Kannada - Kannada = 0x6E6B, + Kannada = 0x6E6B, // "kn" /// Kazakh - Kazakh = 0x6B6B, + Kazakh = 0x6B6B, // "kk" /// Khmer - Khmer = 0x6D6B, + Khmer = 0x6D6B, // "km" /// Korean - Korean = 0x6F6B, + Korean = 0x6F6B, // "ko" /// Lao - Lao = 0x6F6C, + Lao = 0x6F6C, // "lo" /// Latin - Latin = 0x616C, + Latin = 0x616C, // "la" /// Latvian - Latvian = 0x766C, + Latvian = 0x766C, // "lv" /// Lingala - Lingala = 0x6E6C, + Lingala = 0x6E6C, // "ln" /// Lithuanian - Lithuanian = 0x746C, + Lithuanian = 0x746C, // "lt" /// Luxembourgish - Luxembourgish = 0x626C, + Luxembourgish = 0x626C, // "lb" /// Macedonian - Macedonian = 0x6B6D, + Macedonian = 0x6B6D, // "mk" /// Malagasy - Malagasy = 0x676D, + Malagasy = 0x676D, // "mg" /// Malay - Malay = 0x736D, + Malay = 0x736D, // "ms" /// Malayalam - Malayalam = 0x6C6D, + Malayalam = 0x6C6D, // "ml" /// Maltese - Maltese = 0x746D, + Maltese = 0x746D, // "mt" /// Maori - Maori = 0x696D, + Maori = 0x696D, // "mi" /// Marathi - Marathi = 0x726D, + Marathi = 0x726D, // "mr" /// Mongolian - Mongolian = 0x6E6D, + Mongolian = 0x6E6D, // "mn" /// Myanmar - Myanmar = 0x796D, + Myanmar = 0x796D, // "my" /// Nepali - Nepali = 0x656E, + Nepali = 0x656E, // "ne" /// Norwegian - Norwegian = 0x6F6E, + Norwegian = 0x6F6E, // "no" /// Nynorsk - Nynorsk = 0x6E6E, + Nynorsk = 0x6E6E, // "nn" /// Occitan - Occitan = 0x636F, + Occitan = 0x636F, // "oc" /// Pashto - Pashto = 0x7370, + Pashto = 0x7370, // "ps" /// Persian - Persian = 0x6166, + Persian = 0x6166, // "fa" /// Polish - Polish = 0x6C70, + Polish = 0x6C70, // "pl" /// Portuguese - Portuguese = 0x7470, + Portuguese = 0x7470, // "pt" /// Punjabi - Punjabi = 0x6170, + Punjabi = 0x6170, // "pa" /// Romanian - Romanian = 0x6F72, + Romanian = 0x6F72, // "ro" /// Russian - Russian = 0x7572, + Russian = 0x7572, // "ru" /// Sanskrit - Sanskrit = 0x6173, + Sanskrit = 0x6173, // "sa" /// Serbian - Serbian = 0x7273, + Serbian = 0x7273, // "sr" /// Shona - Shona = 0x6E73, + Shona = 0x6E73, // "sn" /// Sindhi - Sindhi = 0x6473, + Sindhi = 0x6473, // "sd" /// Sinhala - Sinhala = 0x6973, + Sinhala = 0x6973, // "si" /// Slovak - Slovak = 0x6B73, + Slovak = 0x6B73, // "sk" /// Slovenian - Slovenian = 0x6C73, + Slovenian = 0x6C73, // "sl" /// Somali - Somali = 0x6F73, + Somali = 0x6F73, // "so" /// Spanish - Spanish = 0x7365, + Spanish = 0x7365, // "es" /// Sundanese - Sundanese = 0x7573, + Sundanese = 0x7573, // "su" /// Swahili - Swahili = 0x7773, + Swahili = 0x7773, // "sw" /// Swedish - Swedish = 0x7673, + Swedish = 0x7673, // "sv" /// Tagalog - Tagalog = 0x6C74, + Tagalog = 0x6C74, // "tl" /// Tajik - Tajik = 0x6774, + Tajik = 0x6774, // "tg" /// Tamil - Tamil = 0x6174, + Tamil = 0x6174, // "ta" /// Tatar - Tatar = 0x7474, + Tatar = 0x7474, // "tt" /// Telugu - Telugu = 0x6574, + Telugu = 0x6574, // "te" /// Thai - Thai = 0x6874, + Thai = 0x6874, // "th" /// Tibetan - Tibetan = 0x6F62, + Tibetan = 0x6F62, // "bo" /// Turkish - Turkish = 0x7274, + Turkish = 0x7274, // "tr" /// Turkmen - Turkmen = 0x6B74, + Turkmen = 0x6B74, // "tk" /// Ukrainian - Ukrainian = 0x6B75, + Ukrainian = 0x6B75, // "uk" /// Urdu - Urdu = 0x7275, + Urdu = 0x7275, // "ur" /// Uzbek - Uzbek = 0x7A75, + Uzbek = 0x7A75, // "uz" /// Vietnamese - Vietnamese = 0x6976, + Vietnamese = 0x6976, // "vi" /// Welsh - Welsh = 0x7963, + Welsh = 0x7963, // "cy" /// Yiddish - Yiddish = 0x6979, + Yiddish = 0x6979, // "yi" /// Yoruba - Yoruba = 0x6F79, + Yoruba = 0x6F79, // "yo" } } \ No newline at end of file -- cgit v1.2.3