dockerwiki/content/inc/Utf8/tables/romanization.php
2021-10-26 13:02:53 +02:00

1459 lines
34 KiB
PHP
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?php
/**
* Romanization lookup table
*
* This lookup table provides a way to transform strings written in a language
* different from the ones based upon Latin letters into plain ASCII.
*
* Please note: this is not a scientific transliteration table. It only works
* one way, from non-Latin to ASCII, and it works by simple character replacement
* only. Specialities of each language are not supported.
*
* @todo some keys are used multiple times
* @todo remove or integrate commented pairs
*
* @author Andreas Gohr <andi@splitbrain.org>
* @author Vitaly Blokhin <vitinfo@vitn.com>
* @author Bisqwit <bisqwit@iki.fi>
* @author Arthit Suriyawongkul <arthit@gmail.com>
* @author Denis Scheither <amorphis@uni-bremen.de>
* @author Eivind Morland <eivind.morland@gmail.com>
* @link http://www.uconv.com/translit.htm
* @link http://kanjidict.stc.cx/hiragana.php?src=2
* @link http://www.translatum.gr/converter/greek-transliteration.htm
* @link http://en.wikipedia.org/wiki/Royal_Thai_General_System_of_Transcription
* @link http://www.btranslations.com/resources/romanization/korean.asp
*/
return [
// scandinavian - differs from what we do in deaccent
'å' => 'a',
'Å' => 'A',
'ä' => 'a',
'Ä' => 'A',
'ö' => 'o',
'Ö' => 'O',
//russian cyrillic
'а' => 'a',
'А' => 'A',
'б' => 'b',
'Б' => 'B',
'в' => 'v',
'В' => 'V',
'г' => 'g',
'Г' => 'G',
'д' => 'd',
'Д' => 'D',
'е' => 'e',
'Е' => 'E',
'ё' => 'jo',
'Ё' => 'Jo',
'ж' => 'zh',
'Ж' => 'Zh',
'з' => 'z',
'З' => 'Z',
'и' => 'i',
'И' => 'I',
'й' => 'j',
'Й' => 'J',
'к' => 'k',
'К' => 'K',
'л' => 'l',
'Л' => 'L',
'м' => 'm',
'М' => 'M',
'н' => 'n',
'Н' => 'N',
'о' => 'o',
'О' => 'O',
'п' => 'p',
'П' => 'P',
'р' => 'r',
'Р' => 'R',
'с' => 's',
'С' => 'S',
'т' => 't',
'Т' => 'T',
'у' => 'u',
'У' => 'U',
'ф' => 'f',
'Ф' => 'F',
'х' => 'x',
'Х' => 'X',
'ц' => 'c',
'Ц' => 'C',
'ч' => 'ch',
'Ч' => 'Ch',
'ш' => 'sh',
'Ш' => 'Sh',
'щ' => 'sch',
'Щ' => 'Sch',
'ъ' => '',
'Ъ' => '',
'ы' => 'y',
'Ы' => 'Y',
'ь' => '',
'Ь' => '',
'э' => 'eh',
'Э' => 'Eh',
'ю' => 'ju',
'Ю' => 'Ju',
'я' => 'ja',
'Я' => 'Ja',
// Ukrainian cyrillic
'Ґ' => 'Gh',
'ґ' => 'gh',
'Є' => 'Je',
'є' => 'je',
'І' => 'I',
'і' => 'i',
'Ї' => 'Ji',
'ї' => 'ji',
// Georgian
'ა' => 'a',
'ბ' => 'b',
'გ' => 'g',
'დ' => 'd',
'ე' => 'e',
'ვ' => 'v',
'ზ' => 'z',
'თ' => 'th',
'ი' => 'i',
// kan is a "k" sound; it used to share 'p' with 'პ' (par) below
'კ' => 'k',
'ლ' => 'l',
'მ' => 'm',
'ნ' => 'n',
'ო' => 'o',
'პ' => 'p',
'ჟ' => 'zh',
'რ' => 'r',
'ს' => 's',
'ტ' => 't',
'უ' => 'u',
'ფ' => 'ph',
'ქ' => 'kh',
'ღ' => 'gh',
// qar (U+10E7); the key used to be an empty string, which can never match input
'ყ' => 'q',
'შ' => 'sh',
'ჩ' => 'ch',
'ც' => 'c',
'ძ' => 'dh',
'წ' => 'w',
'ჭ' => 'j',
'ხ' => 'x',
'ჯ' => 'jh',
'ჰ' => 'xh',
//Sanskrit
'अ' => 'a',
'आ' => 'ah',
'इ' => 'i',
'ई' => 'ih',
'उ' => 'u',
'ऊ' => 'uh',
'ऋ' => 'ry',
'ॠ' => 'ryh',
'ऌ' => 'ly',
'ॡ' => 'lyh',
'ए' => 'e',
'ऐ' => 'ay',
'ओ' => 'o',
'औ' => 'aw',
'अं' => 'amh',
'अः' => 'aq',
'क' => 'k',
'ख' => 'kh',
'ग' => 'g',
'घ' => 'gh',
'ङ' => 'nh',
'च' => 'c',
'छ' => 'ch',
'ज' => 'j',
'झ' => 'jh',
'ञ' => 'ny',
'ट' => 'tq',
'ठ' => 'tqh',
'ड' => 'dq',
'ढ' => 'dqh',
'ण' => 'nq',
'त' => 't',
'थ' => 'th',
'द' => 'd',
'ध' => 'dh',
'न' => 'n',
'प' => 'p',
'फ' => 'ph',
'ब' => 'b',
'भ' => 'bh',
'म' => 'm',
'य' => 'z',
'र' => 'r',
'ल' => 'l',
'व' => 'v',
'श' => 'sh',
'ष' => 'sqh',
'स' => 's',
'ह' => 'x',
//Sanskrit diacritics
'Ā' => 'A',
'Ī' => 'I',
'Ū' => 'U',
'Ṛ' => 'R',
'Ṝ' => 'R',
'Ṅ' => 'N',
'Ñ' => 'N',
'Ṭ' => 'T',
'Ḍ' => 'D',
'Ṇ' => 'N',
'Ś' => 'S',
'Ṣ' => 'S',
'Ṁ' => 'M',
'Ṃ' => 'M',
'Ḥ' => 'H',
'Ḷ' => 'L',
'Ḹ' => 'L',
'ā' => 'a',
'ī' => 'i',
'ū' => 'u',
'ṛ' => 'r',
'ṝ' => 'r',
'ṅ' => 'n',
'ñ' => 'n',
'ṭ' => 't',
'ḍ' => 'd',
'ṇ' => 'n',
'ś' => 's',
'ṣ' => 's',
'ṁ' => 'm',
'ṃ' => 'm',
'ḥ' => 'h',
'ḷ' => 'l',
'ḹ' => 'l',
//Hebrew
'א' => 'a',
'ב' => 'b',
'ג' => 'g',
'ד' => 'd',
'ה' => 'h',
'ו' => 'v',
'ז' => 'z',
'ח' => 'kh',
'ט' => 'th',
'י' => 'y',
'ך' => 'h',
'כ' => 'k',
'ל' => 'l',
'ם' => 'm',
'מ' => 'm',
'ן' => 'n',
'נ' => 'n',
'ס' => 's',
'ע' => 'ah',
'ף' => 'f',
'פ' => 'p',
'ץ' => 'c',
'צ' => 'c',
'ק' => 'q',
'ר' => 'r',
'ש' => 'sh',
'ת' => 't',
//Arabic
'ا' => 'a',
'ب' => 'b',
'ت' => 't',
'ث' => 'th',
'ج' => 'g',
'ح' => 'xh',
'خ' => 'x',
'د' => 'd',
'ذ' => 'dh',
'ر' => 'r',
'ز' => 'z',
'س' => 's',
'ش' => 'sh',
'ص' => 's\'',
'ض' => 'd\'',
'ط' => 't\'',
'ظ' => 'z\'',
'ع' => 'y',
'غ' => 'gh',
'ف' => 'f',
'ق' => 'q',
'ك' => 'k',
'ل' => 'l',
'م' => 'm',
'ن' => 'n',
'ه' => 'x\'',
'و' => 'u',
'ي' => 'i',
// Japanese characters (last update: 2008-05-09)
// Japanese hiragana
// 3 character syllables, っ doubles the consonant after
'っちゃ' => 'ccha',
'っちぇ' => 'cche',
'っちょ' => 'ccho',
'っちゅ' => 'cchu',
'っびゃ' => 'bbya',
'っびぇ' => 'bbye',
'っびぃ' => 'bbyi',
'っびょ' => 'bbyo',
'っびゅ' => 'bbyu',
'っぴゃ' => 'ppya',
'っぴぇ' => 'ppye',
'っぴぃ' => 'ppyi',
'っぴょ' => 'ppyo',
'っぴゅ' => 'ppyu',
'っちゃ' => 'ccha',
'っちぇ' => 'cche',
'っち' => 'cchi',
'っちょ' => 'ccho',
'っちゅ' => 'cchu',
// 'っひゃ'=>'hya',
// 'っひぇ'=>'hye',
// 'っひぃ'=>'hyi',
// 'っひょ'=>'hyo',
// 'っひゅ'=>'hyu',
'っきゃ' => 'kkya',
'っきぇ' => 'kkye',
'っきぃ' => 'kkyi',
'っきょ' => 'kkyo',
'っきゅ' => 'kkyu',
'っぎゃ' => 'ggya',
'っぎぇ' => 'ggye',
'っぎぃ' => 'ggyi',
'っぎょ' => 'ggyo',
'っぎゅ' => 'ggyu',
'っみゃ' => 'mmya',
'っみぇ' => 'mmye',
'っみぃ' => 'mmyi',
'っみょ' => 'mmyo',
'っみゅ' => 'mmyu',
'っにゃ' => 'nnya',
'っにぇ' => 'nnye',
'っにぃ' => 'nnyi',
'っにょ' => 'nnyo',
'っにゅ' => 'nnyu',
'っりゃ' => 'rrya',
'っりぇ' => 'rrye',
'っりぃ' => 'rryi',
'っりょ' => 'rryo',
'っりゅ' => 'rryu',
'っしゃ' => 'ssha',
'っしぇ' => 'sshe',
'っし' => 'sshi',
'っしょ' => 'ssho',
'っしゅ' => 'sshu',
// separate hiragana 'n' ('n' + 'i' != 'ni', normally we would write "kon'nichi wa" but the
// apostrophe would be converted to _ anyway)
'んあ' => 'n_a',
'んえ' => 'n_e',
'んい' => 'n_i',
'んお' => 'n_o',
'んう' => 'n_u',
'んや' => 'n_ya',
'んよ' => 'n_yo',
'んゆ' => 'n_yu',
// 2 character syllables - normal
'ふぁ' => 'fa',
'ふぇ' => 'fe',
'ふぃ' => 'fi',
'ふぉ' => 'fo',
'ちゃ' => 'cha',
'ちぇ' => 'che',
'ち' => 'chi',
'ちょ' => 'cho',
'ちゅ' => 'chu',
'ひゃ' => 'hya',
'ひぇ' => 'hye',
'ひぃ' => 'hyi',
'ひょ' => 'hyo',
'ひゅ' => 'hyu',
'びゃ' => 'bya',
'びぇ' => 'bye',
'びぃ' => 'byi',
'びょ' => 'byo',
'びゅ' => 'byu',
'ぴゃ' => 'pya',
'ぴぇ' => 'pye',
'ぴぃ' => 'pyi',
'ぴょ' => 'pyo',
'ぴゅ' => 'pyu',
'きゃ' => 'kya',
'きぇ' => 'kye',
'きぃ' => 'kyi',
'きょ' => 'kyo',
'きゅ' => 'kyu',
'ぎゃ' => 'gya',
'ぎぇ' => 'gye',
'ぎぃ' => 'gyi',
'ぎょ' => 'gyo',
'ぎゅ' => 'gyu',
'みゃ' => 'mya',
'みぇ' => 'mye',
'みぃ' => 'myi',
'みょ' => 'myo',
'みゅ' => 'myu',
'にゃ' => 'nya',
'にぇ' => 'nye',
'にぃ' => 'nyi',
'にょ' => 'nyo',
'にゅ' => 'nyu',
'りゃ' => 'rya',
'りぇ' => 'rye',
'りぃ' => 'ryi',
'りょ' => 'ryo',
'りゅ' => 'ryu',
'しゃ' => 'sha',
'しぇ' => 'she',
'し' => 'shi',
'しょ' => 'sho',
'しゅ' => 'shu',
'じゃ' => 'ja',
'じぇ' => 'je',
'じょ' => 'jo',
'じゅ' => 'ju',
'うぇ' => 'we',
'うぃ' => 'wi',
'いぇ' => 'ye',
// 2 character syllables, っ doubles the consonant after
'っば' => 'bba',
'っべ' => 'bbe',
'っび' => 'bbi',
'っぼ' => 'bbo',
'っぶ' => 'bbu',
'っぱ' => 'ppa',
'っぺ' => 'ppe',
'っぴ' => 'ppi',
'っぽ' => 'ppo',
'っぷ' => 'ppu',
'った' => 'tta',
'って' => 'tte',
'っち' => 'cchi',
'っと' => 'tto',
'っつ' => 'ttsu',
'っだ' => 'dda',
'っで' => 'dde',
'っぢ' => 'ddi',
'っど' => 'ddo',
'っづ' => 'ddu',
'っが' => 'gga',
'っげ' => 'gge',
'っぎ' => 'ggi',
'っご' => 'ggo',
'っぐ' => 'ggu',
'っか' => 'kka',
'っけ' => 'kke',
'っき' => 'kki',
'っこ' => 'kko',
'っく' => 'kku',
'っま' => 'mma',
'っめ' => 'mme',
'っみ' => 'mmi',
'っも' => 'mmo',
'っむ' => 'mmu',
'っな' => 'nna',
'っね' => 'nne',
'っに' => 'nni',
'っの' => 'nno',
'っぬ' => 'nnu',
'っら' => 'rra',
'っれ' => 'rre',
'っり' => 'rri',
'っろ' => 'rro',
'っる' => 'rru',
'っさ' => 'ssa',
'っせ' => 'sse',
'っし' => 'sshi',
'っそ' => 'sso',
'っす' => 'ssu',
'っざ' => 'zza',
'っぜ' => 'zze',
'っじ' => 'jji',
'っぞ' => 'zzo',
'っず' => 'zzu',
// 1 character syllables
'あ' => 'a',
'え' => 'e',
'い' => 'i',
'お' => 'o',
'う' => 'u',
'ん' => 'n',
'は' => 'ha',
'へ' => 'he',
'ひ' => 'hi',
'ほ' => 'ho',
'ふ' => 'fu',
'ば' => 'ba',
'べ' => 'be',
'び' => 'bi',
'ぼ' => 'bo',
'ぶ' => 'bu',
'ぱ' => 'pa',
'ぺ' => 'pe',
'ぴ' => 'pi',
'ぽ' => 'po',
'ぷ' => 'pu',
'た' => 'ta',
'て' => 'te',
'ち' => 'chi',
'と' => 'to',
'つ' => 'tsu',
'だ' => 'da',
'で' => 'de',
'ぢ' => 'di',
'ど' => 'do',
'づ' => 'du',
'が' => 'ga',
'げ' => 'ge',
'ぎ' => 'gi',
'ご' => 'go',
'ぐ' => 'gu',
'か' => 'ka',
'け' => 'ke',
'き' => 'ki',
'こ' => 'ko',
'く' => 'ku',
'ま' => 'ma',
'め' => 'me',
'み' => 'mi',
'も' => 'mo',
'む' => 'mu',
'な' => 'na',
'ね' => 'ne',
'に' => 'ni',
'の' => 'no',
'ぬ' => 'nu',
'ら' => 'ra',
'れ' => 're',
'り' => 'ri',
'ろ' => 'ro',
'る' => 'ru',
'さ' => 'sa',
'せ' => 'se',
'し' => 'shi',
'そ' => 'so',
'す' => 'su',
'わ' => 'wa',
'を' => 'wo',
'ざ' => 'za',
'ぜ' => 'ze',
'じ' => 'ji',
'ぞ' => 'zo',
'ず' => 'zu',
'や' => 'ya',
'よ' => 'yo',
'ゆ' => 'yu',
// old characters
'ゑ' => 'we',
'ゐ' => 'wi',
// convert what's left (probably only kicks in when something's missing above)
// 'ぁ'=>'a','ぇ'=>'e','ぃ'=>'i','ぉ'=>'o','ぅ'=>'u',
// 'ゃ'=>'ya','ょ'=>'yo','ゅ'=>'yu',
// never seen one of those (disabled for the moment)
// 'ヴぁ'=>'va','ヴぇ'=>'ve','ヴぃ'=>'vi','ヴぉ'=>'vo','ヴ'=>'vu',
// 'でゃ'=>'dha','でぇ'=>'dhe','でぃ'=>'dhi','でょ'=>'dho','でゅ'=>'dhu',
// 'どぁ'=>'dwa','どぇ'=>'dwe','どぃ'=>'dwi','どぉ'=>'dwo','どぅ'=>'dwu',
// 'ぢゃ'=>'dya','ぢぇ'=>'dye','ぢぃ'=>'dyi','ぢょ'=>'dyo','ぢゅ'=>'dyu',
// 'ふぁ'=>'fwa','ふぇ'=>'fwe','ふぃ'=>'fwi','ふぉ'=>'fwo','ふぅ'=>'fwu',
// 'ふゃ'=>'fya','ふぇ'=>'fye','ふぃ'=>'fyi','ふょ'=>'fyo','ふゅ'=>'fyu',
// 'すぁ'=>'swa','すぇ'=>'swe','すぃ'=>'swi','すぉ'=>'swo','すぅ'=>'swu',
// 'てゃ'=>'tha','てぇ'=>'the','てぃ'=>'thi','てょ'=>'tho','てゅ'=>'thu',
// 'つゃ'=>'tsa','つぇ'=>'tse','つぃ'=>'tsi','つょ'=>'tso','つ'=>'tsu',
// 'とぁ'=>'twa','とぇ'=>'twe','とぃ'=>'twi','とぉ'=>'two','とぅ'=>'twu',
// 'ヴゃ'=>'vya','ヴぇ'=>'vye','ヴぃ'=>'vyi','ヴょ'=>'vyo','ヴゅ'=>'vyu',
// 'うぁ'=>'wha','うぇ'=>'whe','うぃ'=>'whi','うぉ'=>'who','うぅ'=>'whu',
// 'じゃ'=>'zha','じぇ'=>'zhe','じぃ'=>'zhi','じょ'=>'zho','じゅ'=>'zhu',
// 'じゃ'=>'zya','じぇ'=>'zye','じぃ'=>'zyi','じょ'=>'zyo','じゅ'=>'zyu',
// 'spare' characters from other romanization systems
// 'だ'=>'da','で'=>'de','ぢ'=>'di','ど'=>'do','づ'=>'du',
// 'ら'=>'la','れ'=>'le','り'=>'li','ろ'=>'lo','る'=>'lu',
// 'さ'=>'sa','せ'=>'se','し'=>'si','そ'=>'so','す'=>'su',
// 'ちゃ'=>'cya','ちぇ'=>'cye','ちぃ'=>'cyi','ちょ'=>'cyo','ちゅ'=>'cyu',
//'じゃ'=>'jya','じぇ'=>'jye','じぃ'=>'jyi','じょ'=>'jyo','じゅ'=>'jyu',
//'りゃ'=>'lya','りぇ'=>'lye','りぃ'=>'lyi','りょ'=>'lyo','りゅ'=>'lyu',
//'しゃ'=>'sya','しぇ'=>'sye','しぃ'=>'syi','しょ'=>'syo','しゅ'=>'syu',
//'ちゃ'=>'tya','ちぇ'=>'tye','ちぃ'=>'tyi','ちょ'=>'tyo','ちゅ'=>'tyu',
//'し'=>'ci',,い'=>'yi','ぢ'=>'dzi',
//'っじゃ'=>'jja','っじぇ'=>'jje','っじ'=>'jji','っじょ'=>'jjo','っじゅ'=>'jju',
// Japanese katakana
// 4 character syllables: ッ doubles the consonant after, ー doubles the vowel before
// (usually written with macron, but we don't want that in our URLs)
'ッビャー' => 'bbyaa',
'ッビェー' => 'bbyee',
'ッビィー' => 'bbyii',
'ッビョー' => 'bbyoo',
'ッビュー' => 'bbyuu',
'ッピャー' => 'ppyaa',
'ッピェー' => 'ppyee',
'ッピィー' => 'ppyii',
'ッピョー' => 'ppyoo',
'ッピュー' => 'ppyuu',
'ッキャー' => 'kkyaa',
'ッキェー' => 'kkyee',
'ッキィー' => 'kkyii',
'ッキョー' => 'kkyoo',
'ッキュー' => 'kkyuu',
'ッギャー' => 'ggyaa',
'ッギェー' => 'ggyee',
'ッギィー' => 'ggyii',
'ッギョー' => 'ggyoo',
'ッギュー' => 'ggyuu',
'ッミャー' => 'mmyaa',
'ッミェー' => 'mmyee',
'ッミィー' => 'mmyii',
'ッミョー' => 'mmyoo',
'ッミュー' => 'mmyuu',
'ッニャー' => 'nnyaa',
'ッニェー' => 'nnyee',
'ッニィー' => 'nnyii',
'ッニョー' => 'nnyoo',
'ッニュー' => 'nnyuu',
'ッリャー' => 'rryaa',
'ッリェー' => 'rryee',
'ッリィー' => 'rryii',
'ッリョー' => 'rryoo',
'ッリュー' => 'rryuu',
'ッシャー' => 'sshaa',
'ッシェー' => 'sshee',
'ッシー' => 'sshii',
'ッショー' => 'sshoo',
'ッシュー' => 'sshuu',
'ッチャー' => 'cchaa',
'ッチェー' => 'cchee',
'ッチー' => 'cchii',
'ッチョー' => 'cchoo',
'ッチュー' => 'cchuu',
'ッティー' => 'ttii',
'ッヂィー' => 'ddii',
// 3 character syllables - doubled vowels
// f-row with a long vowel. 'フェー' and 'フィー' are listed only once: the repeated
// keys ('fyee'/'fyii') silently replaced these values and disagreed with the
// short forms 'フェ' => 'fe' and 'フィ' => 'fi'.
'ファー' => 'faa',
'フェー' => 'fee',
'フィー' => 'fii',
'フォー' => 'foo',
'フャー' => 'fyaa',
'フョー' => 'fyoo',
'フュー' => 'fyuu',
'ヒャー' => 'hyaa',
'ヒェー' => 'hyee',
'ヒィー' => 'hyii',
'ヒョー' => 'hyoo',
'ヒュー' => 'hyuu',
'ビャー' => 'byaa',
'ビェー' => 'byee',
'ビィー' => 'byii',
'ビョー' => 'byoo',
'ビュー' => 'byuu',
'ピャー' => 'pyaa',
'ピェー' => 'pyee',
'ピィー' => 'pyii',
'ピョー' => 'pyoo',
'ピュー' => 'pyuu',
'キャー' => 'kyaa',
'キェー' => 'kyee',
'キィー' => 'kyii',
'キョー' => 'kyoo',
'キュー' => 'kyuu',
'ギャー' => 'gyaa',
'ギェー' => 'gyee',
'ギィー' => 'gyii',
'ギョー' => 'gyoo',
'ギュー' => 'gyuu',
'ミャー' => 'myaa',
'ミェー' => 'myee',
'ミィー' => 'myii',
'ミョー' => 'myoo',
'ミュー' => 'myuu',
'ニャー' => 'nyaa',
'ニェー' => 'nyee',
'ニィー' => 'nyii',
'ニョー' => 'nyoo',
'ニュー' => 'nyuu',
'リャー' => 'ryaa',
'リェー' => 'ryee',
'リィー' => 'ryii',
'リョー' => 'ryoo',
'リュー' => 'ryuu',
'シャー' => 'shaa',
'シェー' => 'shee',
'シー' => 'shii',
'ショー' => 'shoo',
'シュー' => 'shuu',
'ジャー' => 'jaa',
'ジェー' => 'jee',
'ジー' => 'jii',
'ジョー' => 'joo',
'ジュー' => 'juu',
'スァー' => 'swaa',
'スェー' => 'swee',
'スィー' => 'swii',
'スォー' => 'swoo',
'スゥー' => 'swuu',
'デァー' => 'daa',
'デェー' => 'dee',
'ディー' => 'dii',
'デォー' => 'doo',
'デゥー' => 'duu',
'チャー' => 'chaa',
'チェー' => 'chee',
'チー' => 'chii',
'チョー' => 'choo',
'チュー' => 'chuu',
'ヂャー' => 'dyaa',
'ヂェー' => 'dyee',
'ヂィー' => 'dyii',
'ヂョー' => 'dyoo',
'ヂュー' => 'dyuu',
'ツャー' => 'tsaa',
'ツェー' => 'tsee',
'ツィー' => 'tsii',
'ツョー' => 'tsoo',
'ツー' => 'tsuu',
'トァー' => 'twaa',
'トェー' => 'twee',
'トィー' => 'twii',
'トォー' => 'twoo',
'トゥー' => 'twuu',
'ドァー' => 'dwaa',
'ドェー' => 'dwee',
'ドィー' => 'dwii',
'ドォー' => 'dwoo',
'ドゥー' => 'dwuu',
'ウァー' => 'whaa',
'ウェー' => 'whee',
'ウィー' => 'whii',
'ウォー' => 'whoo',
'ウゥー' => 'whuu',
'ヴャー' => 'vyaa',
'ヴェー' => 'vyee',
'ヴィー' => 'vyii',
'ヴョー' => 'vyoo',
'ヴュー' => 'vyuu',
'ヴァー' => 'vaa',
'ヴェー' => 'vee',
'ヴィー' => 'vii',
'ヴォー' => 'voo',
'ヴー' => 'vuu',
'ウェー' => 'wee',
'ウィー' => 'wii',
'イェー' => 'yee',
'ティー' => 'tii',
'ヂィー' => 'dii',
// 3 character syllables - doubled consonants
'ッビャ' => 'bbya',
'ッビェ' => 'bbye',
'ッビィ' => 'bbyi',
'ッビョ' => 'bbyo',
'ッビュ' => 'bbyu',
'ッピャ' => 'ppya',
'ッピェ' => 'ppye',
'ッピィ' => 'ppyi',
'ッピョ' => 'ppyo',
'ッピュ' => 'ppyu',
'ッキャ' => 'kkya',
'ッキェ' => 'kkye',
'ッキィ' => 'kkyi',
'ッキョ' => 'kkyo',
'ッキュ' => 'kkyu',
'ッギャ' => 'ggya',
'ッギェ' => 'ggye',
'ッギィ' => 'ggyi',
'ッギョ' => 'ggyo',
'ッギュ' => 'ggyu',
'ッミャ' => 'mmya',
'ッミェ' => 'mmye',
'ッミィ' => 'mmyi',
'ッミョ' => 'mmyo',
'ッミュ' => 'mmyu',
'ッニャ' => 'nnya',
'ッニェ' => 'nnye',
'ッニィ' => 'nnyi',
'ッニョ' => 'nnyo',
'ッニュ' => 'nnyu',
'ッリャ' => 'rrya',
'ッリェ' => 'rrye',
'ッリィ' => 'rryi',
'ッリョ' => 'rryo',
'ッリュ' => 'rryu',
'ッシャ' => 'ssha',
'ッシェ' => 'sshe',
'ッシ' => 'sshi',
'ッショ' => 'ssho',
'ッシュ' => 'sshu',
'ッチャ' => 'ccha',
'ッチェ' => 'cche',
'ッチ' => 'cchi',
'ッチョ' => 'ccho',
'ッチュ' => 'cchu',
'ッティ' => 'tti',
'ッヂィ' => 'ddi',
// 3 character syllables - doubled vowel and consonants
'ッバー' => 'bbaa',
'ッベー' => 'bbee',
'ッビー' => 'bbii',
'ッボー' => 'bboo',
'ッブー' => 'bbuu',
'ッパー' => 'ppaa',
'ッペー' => 'ppee',
'ッピー' => 'ppii',
'ッポー' => 'ppoo',
'ップー' => 'ppuu',
'ッケー' => 'kkee',
'ッキー' => 'kkii',
'ッコー' => 'kkoo',
'ックー' => 'kkuu',
'ッカー' => 'kkaa',
'ッガー' => 'ggaa',
'ッゲー' => 'ggee',
'ッギー' => 'ggii',
'ッゴー' => 'ggoo',
'ッグー' => 'gguu',
// ッ doubles the following consonant, so the m-row needs "mm" like every other row
'ッマー' => 'mmaa',
'ッメー' => 'mmee',
'ッミー' => 'mmii',
'ッモー' => 'mmoo',
'ッムー' => 'mmuu',
'ッナー' => 'nnaa',
'ッネー' => 'nnee',
'ッニー' => 'nnii',
'ッノー' => 'nnoo',
'ッヌー' => 'nnuu',
'ッラー' => 'rraa',
'ッレー' => 'rree',
'ッリー' => 'rrii',
'ッロー' => 'rroo',
'ッルー' => 'rruu',
'ッサー' => 'ssaa',
'ッセー' => 'ssee',
'ッシー' => 'sshii',
'ッソー' => 'ssoo',
'ッスー' => 'ssuu',
'ッザー' => 'zzaa',
'ッゼー' => 'zzee',
'ッジー' => 'jjii',
'ッゾー' => 'zzoo',
'ッズー' => 'zzuu',
'ッター' => 'ttaa',
'ッテー' => 'ttee',
// this key also appears earlier as 'cchii'; as the later duplicate this value
// wins, so it must carry the doubled consonant too
'ッチー' => 'cchii',
'ットー' => 'ttoo',
'ッツー' => 'ttsuu',
'ッダー' => 'ddaa',
'ッデー' => 'ddee',
'ッヂー' => 'ddii',
'ッドー' => 'ddoo',
'ッヅー' => 'dduu',
// 2 character syllables - normal
'ファ' => 'fa',
'フェ' => 'fe',
'フィ' => 'fi',
'フォ' => 'fo',
'フゥ' => 'fu',
// 'フャ'=>'fya',
// 'フェ'=>'fye',
// 'フィ'=>'fyi',
// 'フョ'=>'fyo',
// 'フュ'=>'fyu',
'フャ' => 'fa',
'フェ' => 'fe',
'フィ' => 'fi',
'フョ' => 'fo',
'フュ' => 'fu',
'ヒャ' => 'hya',
'ヒェ' => 'hye',
'ヒィ' => 'hyi',
'ヒョ' => 'hyo',
'ヒュ' => 'hyu',
'ビャ' => 'bya',
'ビェ' => 'bye',
'ビィ' => 'byi',
'ビョ' => 'byo',
'ビュ' => 'byu',
'ピャ' => 'pya',
'ピェ' => 'pye',
'ピィ' => 'pyi',
'ピョ' => 'pyo',
'ピュ' => 'pyu',
'キャ' => 'kya',
'キェ' => 'kye',
'キィ' => 'kyi',
'キョ' => 'kyo',
'キュ' => 'kyu',
'ギャ' => 'gya',
'ギェ' => 'gye',
'ギィ' => 'gyi',
'ギョ' => 'gyo',
'ギュ' => 'gyu',
'ミャ' => 'mya',
'ミェ' => 'mye',
'ミィ' => 'myi',
'ミョ' => 'myo',
'ミュ' => 'myu',
'ニャ' => 'nya',
'ニェ' => 'nye',
'ニィ' => 'nyi',
'ニョ' => 'nyo',
'ニュ' => 'nyu',
'リャ' => 'rya',
'リェ' => 'rye',
'リィ' => 'ryi',
'リョ' => 'ryo',
'リュ' => 'ryu',
'シャ' => 'sha',
'シェ' => 'she',
'ショ' => 'sho',
'シュ' => 'shu',
'ジャ' => 'ja',
'ジェ' => 'je',
'ジョ' => 'jo',
'ジュ' => 'ju',
'スァ' => 'swa',
'スェ' => 'swe',
'スィ' => 'swi',
'スォ' => 'swo',
'スゥ' => 'swu',
'デァ' => 'da',
'デェ' => 'de',
'ディ' => 'di',
'デォ' => 'do',
'デゥ' => 'du',
'チャ' => 'cha',
'チェ' => 'che',
'チ' => 'chi',
'チョ' => 'cho',
'チュ' => 'chu',
// 'ヂャ'=>'dya',
// 'ヂェ'=>'dye',
// 'ヂィ'=>'dyi',
// 'ヂョ'=>'dyo',
// 'ヂュ'=>'dyu',
'ツャ' => 'tsa',
'ツェ' => 'tse',
'ツィ' => 'tsi',
'ツョ' => 'tso',
'ツ' => 'tsu',
'トァ' => 'twa',
'トェ' => 'twe',
'トィ' => 'twi',
'トォ' => 'two',
'トゥ' => 'twu',
'ドァ' => 'dwa',
'ドェ' => 'dwe',
'ドィ' => 'dwi',
'ドォ' => 'dwo',
'ドゥ' => 'dwu',
'ウァ' => 'wha',
'ウェ' => 'whe',
'ウィ' => 'whi',
'ウォ' => 'who',
'ウゥ' => 'whu',
'ヴャ' => 'vya',
'ヴェ' => 'vye',
'ヴィ' => 'vyi',
'ヴョ' => 'vyo',
'ヴュ' => 'vyu',
'ヴァ' => 'va',
'ヴェ' => 've',
'ヴィ' => 'vi',
'ヴォ' => 'vo',
'ヴ' => 'vu',
'ウェ' => 'we',
'ウィ' => 'wi',
'イェ' => 'ye',
'ティ' => 'ti',
'ヂィ' => 'di',
// 2 character syllables - doubled vowel
'アー' => 'aa',
'エー' => 'ee',
'イー' => 'ii',
'オー' => 'oo',
'ウー' => 'uu',
'ダー' => 'daa',
'デー' => 'dee',
'ヂー' => 'dii',
'ドー' => 'doo',
'ヅー' => 'duu',
'ハー' => 'haa',
'ヘー' => 'hee',
'ヒー' => 'hii',
'ホー' => 'hoo',
'フー' => 'fuu',
'バー' => 'baa',
'ベー' => 'bee',
'ビー' => 'bii',
'ボー' => 'boo',
'ブー' => 'buu',
'パー' => 'paa',
'ペー' => 'pee',
'ピー' => 'pii',
'ポー' => 'poo',
'プー' => 'puu',
'ケー' => 'kee',
'キー' => 'kii',
'コー' => 'koo',
'クー' => 'kuu',
'カー' => 'kaa',
'ガー' => 'gaa',
'ゲー' => 'gee',
'ギー' => 'gii',
'ゴー' => 'goo',
'グー' => 'guu',
'マー' => 'maa',
'メー' => 'mee',
'ミー' => 'mii',
'モー' => 'moo',
'ムー' => 'muu',
'ナー' => 'naa',
'ネー' => 'nee',
'ニー' => 'nii',
'ノー' => 'noo',
'ヌー' => 'nuu',
'ラー' => 'raa',
'レー' => 'ree',
'リー' => 'rii',
'ロー' => 'roo',
'ルー' => 'ruu',
'サー' => 'saa',
'セー' => 'see',
'シー' => 'shii',
'ソー' => 'soo',
'スー' => 'suu',
'ザー' => 'zaa',
'ゼー' => 'zee',
'ジー' => 'jii',
'ゾー' => 'zoo',
'ズー' => 'zuu',
'ター' => 'taa',
'テー' => 'tee',
'チー' => 'chii',
'トー' => 'too',
'ツー' => 'tsuu',
'ワー' => 'waa',
'ヲー' => 'woo',
'ヤー' => 'yaa',
'ヨー' => 'yoo',
'ユー' => 'yuu',
'ヵー' => 'kaa',
'ヶー' => 'kee',
// old characters
'ヱー' => 'wee',
'ヰー' => 'wii',
// separate katakana 'n'
'ンア' => 'n_a',
'ンエ' => 'n_e',
'ンイ' => 'n_i',
'ンオ' => 'n_o',
'ンウ' => 'n_u',
'ンヤ' => 'n_ya',
'ンヨ' => 'n_yo',
'ンユ' => 'n_yu',
// 2 character syllables - doubled consonants
'ッバ' => 'bba',
'ッベ' => 'bbe',
'ッビ' => 'bbi',
'ッボ' => 'bbo',
'ッブ' => 'bbu',
'ッパ' => 'ppa',
'ッペ' => 'ppe',
'ッピ' => 'ppi',
'ッポ' => 'ppo',
'ップ' => 'ppu',
'ッケ' => 'kke',
'ッキ' => 'kki',
'ッコ' => 'kko',
'ック' => 'kku',
'ッカ' => 'kka',
'ッガ' => 'gga',
'ッゲ' => 'gge',
'ッギ' => 'ggi',
'ッゴ' => 'ggo',
'ッグ' => 'ggu',
// ッ doubles the following consonant, so the m-row needs "mm" like every other row
'ッマ' => 'mma',
'ッメ' => 'mme',
'ッミ' => 'mmi',
'ッモ' => 'mmo',
'ッム' => 'mmu',
'ッナ' => 'nna',
'ッネ' => 'nne',
'ッニ' => 'nni',
'ッノ' => 'nno',
'ッヌ' => 'nnu',
'ッラ' => 'rra',
'ッレ' => 'rre',
'ッリ' => 'rri',
'ッロ' => 'rro',
'ッル' => 'rru',
'ッサ' => 'ssa',
'ッセ' => 'sse',
'ッシ' => 'sshi',
'ッソ' => 'sso',
'ッス' => 'ssu',
'ッザ' => 'zza',
'ッゼ' => 'zze',
'ッジ' => 'jji',
'ッゾ' => 'zzo',
'ッズ' => 'zzu',
'ッタ' => 'tta',
'ッテ' => 'tte',
'ッチ' => 'cchi',
'ット' => 'tto',
'ッツ' => 'ttsu',
'ッダ' => 'dda',
'ッデ' => 'dde',
'ッヂ' => 'ddi',
'ッド' => 'ddo',
'ッヅ' => 'ddu',
// 1 character syllables
'ア' => 'a',
'エ' => 'e',
'イ' => 'i',
'オ' => 'o',
'ウ' => 'u',
'ン' => 'n',
'ハ' => 'ha',
'ヘ' => 'he',
'ヒ' => 'hi',
'ホ' => 'ho',
'フ' => 'fu',
'バ' => 'ba',
'ベ' => 'be',
'ビ' => 'bi',
'ボ' => 'bo',
'ブ' => 'bu',
'パ' => 'pa',
'ペ' => 'pe',
'ピ' => 'pi',
'ポ' => 'po',
'プ' => 'pu',
'ケ' => 'ke',
'キ' => 'ki',
'コ' => 'ko',
'ク' => 'ku',
'カ' => 'ka',
'ガ' => 'ga',
'ゲ' => 'ge',
'ギ' => 'gi',
'ゴ' => 'go',
'グ' => 'gu',
'マ' => 'ma',
'メ' => 'me',
'ミ' => 'mi',
'モ' => 'mo',
'ム' => 'mu',
'ナ' => 'na',
'ネ' => 'ne',
'ニ' => 'ni',
// katakana "no" (U+30CE); the key used to be an empty string, which can never match input
'ノ' => 'no',
'ヌ' => 'nu',
'ラ' => 'ra',
'レ' => 're',
'リ' => 'ri',
'ロ' => 'ro',
'ル' => 'ru',
'サ' => 'sa',
'セ' => 'se',
'シ' => 'shi',
'ソ' => 'so',
'ス' => 'su',
'ザ' => 'za',
'ゼ' => 'ze',
'ジ' => 'ji',
'ゾ' => 'zo',
'ズ' => 'zu',
'タ' => 'ta',
'テ' => 'te',
'チ' => 'chi',
'ト' => 'to',
'ツ' => 'tsu',
'ダ' => 'da',
'デ' => 'de',
'ヂ' => 'di',
'ド' => 'do',
'ヅ' => 'du',
'ワ' => 'wa',
'ヲ' => 'wo',
'ヤ' => 'ya',
'ヨ' => 'yo',
'ユ' => 'yu',
'ヵ' => 'ka',
'ヶ' => 'ke',
// old characters
'ヱ' => 'we',
'ヰ' => 'wi',
// convert what's left (probably only kicks in when something's missing above)
'ァ' => 'a',
'ェ' => 'e',
'ィ' => 'i',
'ォ' => 'o',
'ゥ' => 'u',
'ャ' => 'ya',
'ョ' => 'yo',
'ュ' => 'yu',
// special characters
'・' => '_',
'、' => '_',
'ー' => '_',
// when used with hiragana (seldom), this character would not be converted otherwise
// 'ラ'=>'la',
// 'レ'=>'le',
// 'リ'=>'li',
// 'ロ'=>'lo',
// 'ル'=>'lu',
// 'チャ'=>'cya',
// 'チェ'=>'cye',
// 'チィ'=>'cyi',
// 'チョ'=>'cyo',
// 'チュ'=>'cyu',
// 'デャ'=>'dha',
// 'デェ'=>'dhe',
// 'ディ'=>'dhi',
// 'デョ'=>'dho',
// 'デュ'=>'dhu',
// 'リャ'=>'lya',
// 'リェ'=>'lye',
// 'リィ'=>'lyi',
// 'リョ'=>'lyo',
// 'リュ'=>'lyu',
// 'テャ'=>'tha',
// 'テェ'=>'the',
// 'ティ'=>'thi',
// 'テョ'=>'tho',
// 'テュ'=>'thu',
// 'ファ'=>'fwa',
// 'フェ'=>'fwe',
// 'フィ'=>'fwi',
// 'フォ'=>'fwo',
// 'フゥ'=>'fwu',
// 'チャ'=>'tya',
// 'チェ'=>'tye',
// 'チィ'=>'tyi',
// 'チョ'=>'tyo',
// 'チュ'=>'tyu',
// 'ジャ'=>'jya',
// 'ジェ'=>'jye',
// 'ジィ'=>'jyi',
// 'ジョ'=>'jyo',
// 'ジュ'=>'jyu',
// 'ジャ'=>'zha',
// 'ジェ'=>'zhe',
// 'ジィ'=>'zhi',
// 'ジョ'=>'zho',
// 'ジュ'=>'zhu',
// 'ジャ'=>'zya',
// 'ジェ'=>'zye',
// 'ジィ'=>'zyi',
// 'ジョ'=>'zyo',
// 'ジュ'=>'zyu',
// 'シャ'=>'sya',
// 'シェ'=>'sye',
// 'シィ'=>'syi',
// 'ショ'=>'syo',
// 'シュ'=>'syu',
// 'シ'=>'ci',
// 'フ'=>'hu',
// 'シ'=>'si',
// 'チ'=>'ti',
// 'ツ'=>'tu',
// 'イ'=>'yi',
// 'ヂ'=>'dzi',
// "Greeklish"
'Γ' => 'G',
// delta is a "d" sound; it was previously mapped to 'E'
'Δ' => 'D',
'Θ' => 'Th',
'Λ' => 'L',
'Ξ' => 'X',
'Π' => 'P',
'Σ' => 'S',
'Φ' => 'F',
'Ψ' => 'Ps',
'γ' => 'g',
// lowercase delta, kept in step with the uppercase entry above
'δ' => 'd',
'θ' => 'th',
'λ' => 'l',
'ξ' => 'x',
'π' => 'p',
'σ' => 's',
'φ' => 'f',
'ψ' => 'ps',
// Thai
'ก' => 'k',
'ข' => 'kh',
'ฃ' => 'kh',
'ค' => 'kh',
'ฅ' => 'kh',
'ฆ' => 'kh',
'ง' => 'ng',
'จ' => 'ch',
'ฉ' => 'ch',
'ช' => 'ch',
'ซ' => 's',
'ฌ' => 'ch',
'ญ' => 'y',
'ฎ' => 'd',
'ฏ' => 't',
'ฐ' => 'th',
'ฑ' => 'd',
'ฒ' => 'th',
'ณ' => 'n',
'ด' => 'd',
'ต' => 't',
'ถ' => 'th',
'ท' => 'th',
'ธ' => 'th',
'น' => 'n',
'บ' => 'b',
'ป' => 'p',
'ผ' => 'ph',
'ฝ' => 'f',
'พ' => 'ph',
'ฟ' => 'f',
'ภ' => 'ph',
'ม' => 'm',
'ย' => 'y',
'ร' => 'r',
'ฤ' => 'rue',
'ฤๅ' => 'rue',
'ล' => 'l',
'ฦ' => 'lue',
'ฦๅ' => 'lue',
'ว' => 'w',
'ศ' => 's',
'ษ' => 's',
'ส' => 's',
'ห' => 'h',
'ฬ' => 'l',
'ฮ' => 'h',
'ะ' => 'a',
'ั' => 'a',
'รร' => 'a',
'า' => 'a',
'ๅ' => 'a',
'ำ' => 'am',
'ํา' => 'am',
'ิ' => 'i',
'ี' => 'i',
'ึ' => 'ue',
// sara uee (U+0E37); this key used to repeat sara ii (U+0E35), which overrode
// the 'i' mapping above and left the standalone sara uee unmapped
'ื' => 'ue',
'ุ' => 'u',
'ู' => 'u',
'เ' => 'e',
'แ' => 'ae',
'โ' => 'o',
'อ' => 'o',
'ียะ' => 'ia',
'ีย' => 'ia',
'ือะ' => 'uea',
'ือ' => 'uea',
'ัวะ' => 'ua',
'ัว' => 'ua',
'ใ' => 'ai',
'ไ' => 'ai',
'ัย' => 'ai',
'าย' => 'ai',
'าว' => 'ao',
'ุย' => 'ui',
'อย' => 'oi',
'ือย' => 'ueai',
'วย' => 'uai',
'ิว' => 'io',
'็ว' => 'eo',
'ียว' => 'iao',
'่' => '',
'้' => '',
'๊' => '',
'๋' => '',
'็' => '',
'์' => '',
'๎' => '',
'ํ' => '',
'ฺ' => '',
'ๆ' => '2',
'๏' => 'o',
'ฯ' => '-',
'๚' => '-',
'๛' => '-',
// Thai digits; zero is U+0E50 (its key used to be an empty string, which can never match input)
'๐' => '0',
'๑' => '1',
'๒' => '2',
'๓' => '3',
'๔' => '4',
'๕' => '5',
'๖' => '6',
'๗' => '7',
'๘' => '8',
'๙' => '9',
// Korean (compatibility jamo only; precomposed syllable blocks are not listed here)
'ㄱ' => 'k',
'ㅋ' => 'kh',
'ㄲ' => 'kk',
'ㄷ' => 't',
'ㅌ' => 'th',
'ㄸ' => 'tt',
'ㅂ' => 'p',
'ㅍ' => 'ph',
'ㅃ' => 'pp',
'ㅈ' => 'c',
'ㅊ' => 'ch',
'ㅉ' => 'cc',
'ㅅ' => 's',
'ㅆ' => 'ss',
'ㅎ' => 'h',
'ㅇ' => 'ng',
'ㄴ' => 'n',
'ㄹ' => 'l',
'ㅁ' => 'm',
'ㅏ' => 'a',
'ㅓ' => 'e',
'ㅗ' => 'o',
'ㅜ' => 'wu',
'ㅡ' => 'u',
'ㅣ' => 'i',
'ㅐ' => 'ay',
'ㅔ' => 'ey',
'ㅚ' => 'oy',
'ㅘ' => 'wa',
'ㅝ' => 'we',
'ㅟ' => 'wi',
'ㅙ' => 'way',
'ㅞ' => 'wey',
'ㅢ' => 'uy',
'ㅑ' => 'ya',
'ㅕ' => 'ye',
// y + o, in line with 'ㅑ' => 'ya' and 'ㅠ' => 'yu'; 'oy' already belongs to 'ㅚ'
'ㅛ' => 'yo',
'ㅠ' => 'yu',
'ㅒ' => 'yay',
'ㅖ' => 'yey',
];