xref: /dokuwiki/inc/Utf8/tables/romanization.php (revision 55b5a0954cb543331f5901583987a6348972237f)
1<?php
2/**
3 * Romanization lookup table
4 *
5 * This lookup table provides a way to transform strings written in scripts
6 * that are not based on Latin letters into plain ASCII.
7 *
8 * Please note: this is not a scientific transliteration table. It only works
9 * one way, from non-Latin scripts to ASCII, and it works by simple character
10 * replacement only. Specialities of each language are not supported.
11 *
12 * @todo some keys are used multiple times
13 * @todo remove or integrate commented pairs
14 *
15 * @author Andreas Gohr <andi@splitbrain.org>
16 * @author Vitaly Blokhin <vitinfo@vitn.com>
17 * @author Bisqwit <bisqwit@iki.fi>
18 * @author Arthit Suriyawongkul <arthit@gmail.com>
19 * @author Denis Scheither <amorphis@uni-bremen.de>
20 * @author Eivind Morland <eivind.morland@gmail.com>
21 * @link   http://www.uconv.com/translit.htm
22 * @link   http://kanjidict.stc.cx/hiragana.php?src=2
23 * @link   http://www.translatum.gr/converter/greek-transliteration.htm
24 * @link   http://en.wikipedia.org/wiki/Royal_Thai_General_System_of_Transcription
25 * @link   http://www.btranslations.com/resources/romanization/korean.asp
26 */
27return [
28    // scandinavian - differs from what we do in deaccent
29    'å' => 'a',
30    'Å' => 'A',
31    'ä' => 'a',
32    'Ä' => 'A',
33    'ö' => 'o',
34    'Ö' => 'O',
35
36    //russian cyrillic
37    'а' => 'a',
38    'А' => 'A',
39    'б' => 'b',
40    'Б' => 'B',
41    'в' => 'v',
42    'В' => 'V',
43    'г' => 'g',
44    'Г' => 'G',
45    'д' => 'd',
46    'Д' => 'D',
47    'е' => 'e',
48    'Е' => 'E',
49    'ё' => 'jo',
50    'Ё' => 'Jo',
51    'ж' => 'zh',
52    'Ж' => 'Zh',
53    'з' => 'z',
54    'З' => 'Z',
55    'и' => 'i',
56    'И' => 'I',
57    'й' => 'j',
58    'Й' => 'J',
59    'к' => 'k',
60    'К' => 'K',
61    'л' => 'l',
62    'Л' => 'L',
63    'м' => 'm',
64    'М' => 'M',
65    'н' => 'n',
66    'Н' => 'N',
67    'о' => 'o',
68    'О' => 'O',
69    'п' => 'p',
70    'П' => 'P',
71    'р' => 'r',
72    'Р' => 'R',
73    'с' => 's',
74    'С' => 'S',
75    'т' => 't',
76    'Т' => 'T',
77    'у' => 'u',
78    'У' => 'U',
79    'ф' => 'f',
80    'Ф' => 'F',
81    'х' => 'x',
82    'Х' => 'X',
83    'ц' => 'c',
84    'Ц' => 'C',
85    'ч' => 'ch',
86    'Ч' => 'Ch',
87    'ш' => 'sh',
88    'Ш' => 'Sh',
89    'щ' => 'sch',
90    'Щ' => 'Sch',
91    'ъ' => '',
92    'Ъ' => '',
93    'ы' => 'y',
94    'Ы' => 'Y',
95    'ь' => '',
96    'Ь' => '',
97    'э' => 'eh',
98    'Э' => 'Eh',
99    'ю' => 'ju',
100    'Ю' => 'Ju',
101    'я' => 'ja',
102    'Я' => 'Ja',
103
104    // Ukrainian cyrillic
105    'Ґ' => 'Gh',
106    'ґ' => 'gh',
107    'Є' => 'Je',
108    'є' => 'je',
109    'І' => 'I',
110    'і' => 'i',
111    'Ї' => 'Ji',
112    'ї' => 'ji',
113
114    // Georgian (one ASCII replacement per letter; aspirated/ejective pairs are told apart by a trailing 'h')
115    'ა' => 'a',
116    'ბ' => 'b',
117    'გ' => 'g',
118    'დ' => 'd',
119    'ე' => 'e',
120    'ვ' => 'v',
121    'ზ' => 'z',
122    'თ' => 'th',
123    'ი' => 'i',
124    'კ' => 'k', // kan; was 'p', which collided with 'პ' (par) below
125    'ლ' => 'l',
126    'მ' => 'm',
127    'ნ' => 'n',
128    'ო' => 'o',
129    'პ' => 'p',
130    'ჟ' => 'zh',
131    'რ' => 'r',
132    'ს' => 's',
133    'ტ' => 't',
134    'უ' => 'u',
135    'ფ' => 'ph',
136    'ქ' => 'kh',
137    'ღ' => 'gh',
138    'ყ' => 'q',
139    'შ' => 'sh',
140    'ჩ' => 'ch',
141    'ც' => 'c',
142    'ძ' => 'dh',
143    'წ' => 'w',
144    'ჭ' => 'j',
145    'ხ' => 'x',
146    'ჯ' => 'jh',
147    'ჰ' => 'xh',
148
149    //Sanskrit
150    'अ' => 'a',
151    'आ' => 'ah',
152    'इ' => 'i',
153    'ई' => 'ih',
154    'उ' => 'u',
155    'ऊ' => 'uh',
156    'ऋ' => 'ry',
157    'ॠ' => 'ryh',
158    'ऌ' => 'ly',
159    'ॡ' => 'lyh',
160    'ए' => 'e',
161    'ऐ' => 'ay',
162    'ओ' => 'o',
163    'औ' => 'aw',
164    'अं' => 'amh',
165    'अः' => 'aq',
166    'क' => 'k',
167    'ख' => 'kh',
168    'ग' => 'g',
169    'घ' => 'gh',
170    'ङ' => 'nh',
171    'च' => 'c',
172    'छ' => 'ch',
173    'ज' => 'j',
174    'झ' => 'jh',
175    'ञ' => 'ny',
176    'ट' => 'tq',
177    'ठ' => 'tqh',
178    'ड' => 'dq',
179    'ढ' => 'dqh',
180    'ण' => 'nq',
181    'त' => 't',
182    'थ' => 'th',
183    'द' => 'd',
184    'ध' => 'dh',
185    'न' => 'n',
186    'प' => 'p',
187    'फ' => 'ph',
188    'ब' => 'b',
189    'भ' => 'bh',
190    'म' => 'm',
191    'य' => 'z',
192    'र' => 'r',
193    'ल' => 'l',
194    'व' => 'v',
195    'श' => 'sh',
196    'ष' => 'sqh',
197    'स' => 's',
198    'ह' => 'x',
199
200    //Sanskrit diacritics
201    'Ā' => 'A',
202    'Ī' => 'I',
203    'Ū' => 'U',
204    'Ṛ' => 'R',
205    'Ṝ' => 'R',
206    'Ṅ' => 'N',
207    'Ñ' => 'N',
208    'Ṭ' => 'T',
209    'Ḍ' => 'D',
210    'Ṇ' => 'N',
211    'Ś' => 'S',
212    'Ṣ' => 'S',
213    'Ṁ' => 'M',
214    'Ṃ' => 'M',
215    'Ḥ' => 'H',
216    'Ḷ' => 'L',
217    'Ḹ' => 'L',
218    'ā' => 'a',
219    'ī' => 'i',
220    'ū' => 'u',
221    'ṛ' => 'r',
222    'ṝ' => 'r',
223    'ṅ' => 'n',
224    'ñ' => 'n',
225    'ṭ' => 't',
226    'ḍ' => 'd',
227    'ṇ' => 'n',
228    'ś' => 's',
229    'ṣ' => 's',
230    'ṁ' => 'm',
231    'ṃ' => 'm',
232    'ḥ' => 'h',
233    'ḷ' => 'l',
234    'ḹ' => 'l',
235
236    //Hebrew
237    'א' => 'a',
238    'ב' => 'b',
239    'ג' => 'g',
240    'ד' => 'd',
241    'ה' => 'h',
242    'ו' => 'v',
243    'ז' => 'z',
244    'ח' => 'kh',
245    'ט' => 'th',
246    'י' => 'y',
247    'ך' => 'h',
248    'כ' => 'k',
249    'ל' => 'l',
250    'ם' => 'm',
251    'מ' => 'm',
252    'ן' => 'n',
253    'נ' => 'n',
254    'ס' => 's',
255    'ע' => 'ah',
256    'ף' => 'f',
257    'פ' => 'p',
258    'ץ' => 'c',
259    'צ' => 'c',
260    'ק' => 'q',
261    'ר' => 'r',
262    'ש' => 'sh',
263    'ת' => 't',
264
265    //Arabic
266    'ا' => 'a',
267    'ب' => 'b',
268    'ت' => 't',
269    'ث' => 'th',
270    'ج' => 'g',
271    'ح' => 'xh',
272    'خ' => 'x',
273    'د' => 'd',
274    'ذ' => 'dh',
275    'ر' => 'r',
276    'ز' => 'z',
277    'س' => 's',
278    'ش' => 'sh',
279    'ص' => 's\'',
280    'ض' => 'd\'',
281    'ط' => 't\'',
282    'ظ' => 'z\'',
283    'ع' => 'y',
284    'غ' => 'gh',
285    'ف' => 'f',
286    'ق' => 'q',
287    'ك' => 'k',
288    'ل' => 'l',
289    'م' => 'm',
290    'ن' => 'n',
291    'ه' => 'x\'',
292    'و' => 'u',
293    'ي' => 'i',
294
295    // Japanese characters  (last update: 2008-05-09)
296
297    // Japanese hiragana
298
299    // 3 character syllables, っ doubles the consonant after
300    'っちゃ' => 'ccha',
301    'っちぇ' => 'cche',
302    'っちょ' => 'ccho',
303    'っちゅ' => 'cchu',
304    'っびゃ' => 'bbya',
305    'っびぇ' => 'bbye',
306    'っびぃ' => 'bbyi',
307    'っびょ' => 'bbyo',
308    'っびゅ' => 'bbyu',
309    'っぴゃ' => 'ppya',
310    'っぴぇ' => 'ppye',
311    'っぴぃ' => 'ppyi',
312    'っぴょ' => 'ppyo',
313    'っぴゅ' => 'ppyu',
314    'っちゃ' => 'ccha',
315    'っちぇ' => 'cche',
316    'っち' => 'cchi',
317    'っちょ' => 'ccho',
318    'っちゅ' => 'cchu',
319    // 'っひゃ'=>'hya',
320    // 'っひぇ'=>'hye',
321    // 'っひぃ'=>'hyi',
322    // 'っひょ'=>'hyo',
323    // 'っひゅ'=>'hyu',
324    'っきゃ' => 'kkya',
325    'っきぇ' => 'kkye',
326    'っきぃ' => 'kkyi',
327    'っきょ' => 'kkyo',
328    'っきゅ' => 'kkyu',
329    'っぎゃ' => 'ggya',
330    'っぎぇ' => 'ggye',
331    'っぎぃ' => 'ggyi',
332    'っぎょ' => 'ggyo',
333    'っぎゅ' => 'ggyu',
334    'っみゃ' => 'mmya',
335    'っみぇ' => 'mmye',
336    'っみぃ' => 'mmyi',
337    'っみょ' => 'mmyo',
338    'っみゅ' => 'mmyu',
339    'っにゃ' => 'nnya',
340    'っにぇ' => 'nnye',
341    'っにぃ' => 'nnyi',
342    'っにょ' => 'nnyo',
343    'っにゅ' => 'nnyu',
344    'っりゃ' => 'rrya',
345    'っりぇ' => 'rrye',
346    'っりぃ' => 'rryi',
347    'っりょ' => 'rryo',
348    'っりゅ' => 'rryu',
349    'っしゃ' => 'ssha',
350    'っしぇ' => 'sshe',
351    'っし' => 'sshi',
352    'っしょ' => 'ssho',
353    'っしゅ' => 'sshu',
354
355    // separate hiragana 'n' ('n' + 'i' != 'ni'; normally we would write "kon'nichi wa", but the
356    // apostrophe would be converted to _ anyway)
357    'んあ' => 'n_a',
358    'んえ' => 'n_e',
359    'んい' => 'n_i',
360    'んお' => 'n_o',
361    'んう' => 'n_u',
362    'んや' => 'n_ya',
363    'んよ' => 'n_yo',
364    'んゆ' => 'n_yu',
365
366    // 2 character syllables - normal
367    'ふぁ' => 'fa',
368    'ふぇ' => 'fe',
369    'ふぃ' => 'fi',
370    'ふぉ' => 'fo',
371    'ちゃ' => 'cha',
372    'ちぇ' => 'che',
373    'ち' => 'chi',
374    'ちょ' => 'cho',
375    'ちゅ' => 'chu',
376    'ひゃ' => 'hya',
377    'ひぇ' => 'hye',
378    'ひぃ' => 'hyi',
379    'ひょ' => 'hyo',
380    'ひゅ' => 'hyu',
381    'びゃ' => 'bya',
382    'びぇ' => 'bye',
383    'びぃ' => 'byi',
384    'びょ' => 'byo',
385    'びゅ' => 'byu',
386    'ぴゃ' => 'pya',
387    'ぴぇ' => 'pye',
388    'ぴぃ' => 'pyi',
389    'ぴょ' => 'pyo',
390    'ぴゅ' => 'pyu',
391    'きゃ' => 'kya',
392    'きぇ' => 'kye',
393    'きぃ' => 'kyi',
394    'きょ' => 'kyo',
395    'きゅ' => 'kyu',
396    'ぎゃ' => 'gya',
397    'ぎぇ' => 'gye',
398    'ぎぃ' => 'gyi',
399    'ぎょ' => 'gyo',
400    'ぎゅ' => 'gyu',
401    'みゃ' => 'mya',
402    'みぇ' => 'mye',
403    'みぃ' => 'myi',
404    'みょ' => 'myo',
405    'みゅ' => 'myu',
406    'にゃ' => 'nya',
407    'にぇ' => 'nye',
408    'にぃ' => 'nyi',
409    'にょ' => 'nyo',
410    'にゅ' => 'nyu',
411    'りゃ' => 'rya',
412    'りぇ' => 'rye',
413    'りぃ' => 'ryi',
414    'りょ' => 'ryo',
415    'りゅ' => 'ryu',
416    'しゃ' => 'sha',
417    'しぇ' => 'she',
418    'し' => 'shi',
419    'しょ' => 'sho',
420    'しゅ' => 'shu',
421    'じゃ' => 'ja',
422    'じぇ' => 'je',
423    'じょ' => 'jo',
424    'じゅ' => 'ju',
425    'うぇ' => 'we',
426    'うぃ' => 'wi',
427    'いぇ' => 'ye',
428
429    // 2 character syllables, っ doubles the consonant after
430    'っば' => 'bba',
431    'っべ' => 'bbe',
432    'っび' => 'bbi',
433    'っぼ' => 'bbo',
434    'っぶ' => 'bbu',
435    'っぱ' => 'ppa',
436    'っぺ' => 'ppe',
437    'っぴ' => 'ppi',
438    'っぽ' => 'ppo',
439    'っぷ' => 'ppu',
440    'った' => 'tta',
441    'って' => 'tte',
442    'っち' => 'cchi',
443    'っと' => 'tto',
444    'っつ' => 'ttsu',
445    'っだ' => 'dda',
446    'っで' => 'dde',
447    'っぢ' => 'ddi',
448    'っど' => 'ddo',
449    'っづ' => 'ddu',
450    'っが' => 'gga',
451    'っげ' => 'gge',
452    'っぎ' => 'ggi',
453    'っご' => 'ggo',
454    'っぐ' => 'ggu',
455    'っか' => 'kka',
456    'っけ' => 'kke',
457    'っき' => 'kki',
458    'っこ' => 'kko',
459    'っく' => 'kku',
460    'っま' => 'mma',
461    'っめ' => 'mme',
462    'っみ' => 'mmi',
463    'っも' => 'mmo',
464    'っむ' => 'mmu',
465    'っな' => 'nna',
466    'っね' => 'nne',
467    'っに' => 'nni',
468    'っの' => 'nno',
469    'っぬ' => 'nnu',
470    'っら' => 'rra',
471    'っれ' => 'rre',
472    'っり' => 'rri',
473    'っろ' => 'rro',
474    'っる' => 'rru',
475    'っさ' => 'ssa',
476    'っせ' => 'sse',
477    'っし' => 'sshi',
478    'っそ' => 'sso',
479    'っす' => 'ssu',
480    'っざ' => 'zza',
481    'っぜ' => 'zze',
482    'っじ' => 'jji',
483    'っぞ' => 'zzo',
484    'っず' => 'zzu',
485
486    // 1 character syllables
487    'あ' => 'a',
488    'え' => 'e',
489    'い' => 'i',
490    'お' => 'o',
491    'う' => 'u',
492    'ん' => 'n',
493    'は' => 'ha',
494    'へ' => 'he',
495    'ひ' => 'hi',
496    'ほ' => 'ho',
497    'ふ' => 'fu',
498    'ば' => 'ba',
499    'べ' => 'be',
500    'び' => 'bi',
501    'ぼ' => 'bo',
502    'ぶ' => 'bu',
503    'ぱ' => 'pa',
504    'ぺ' => 'pe',
505    'ぴ' => 'pi',
506    'ぽ' => 'po',
507    'ぷ' => 'pu',
508    'た' => 'ta',
509    'て' => 'te',
510    'ち' => 'chi',
511    'と' => 'to',
512    'つ' => 'tsu',
513    'だ' => 'da',
514    'で' => 'de',
515    'ぢ' => 'di',
516    'ど' => 'do',
517    'づ' => 'du',
518    'が' => 'ga',
519    'げ' => 'ge',
520    'ぎ' => 'gi',
521    'ご' => 'go',
522    'ぐ' => 'gu',
523    'か' => 'ka',
524    'け' => 'ke',
525    'き' => 'ki',
526    'こ' => 'ko',
527    'く' => 'ku',
528    'ま' => 'ma',
529    'め' => 'me',
530    'み' => 'mi',
531    'も' => 'mo',
532    'む' => 'mu',
533    'な' => 'na',
534    'ね' => 'ne',
535    'に' => 'ni',
536    'の' => 'no',
537    'ぬ' => 'nu',
538    'ら' => 'ra',
539    'れ' => 're',
540    'り' => 'ri',
541    'ろ' => 'ro',
542    'る' => 'ru',
543    'さ' => 'sa',
544    'せ' => 'se',
545    'し' => 'shi',
546    'そ' => 'so',
547    'す' => 'su',
548    'わ' => 'wa',
549    'を' => 'wo',
550    'ざ' => 'za',
551    'ぜ' => 'ze',
552    'じ' => 'ji',
553    'ぞ' => 'zo',
554    'ず' => 'zu',
555    'や' => 'ya',
556    'よ' => 'yo',
557    'ゆ' => 'yu',
558    // old characters
559    'ゑ' => 'we',
560    'ゐ' => 'wi',
561
562    //  convert what's left (probably only kicks in when something's missing above)
563    // 'ぁ'=>'a','ぇ'=>'e','ぃ'=>'i','ぉ'=>'o','ぅ'=>'u',
564    // 'ゃ'=>'ya','ょ'=>'yo','ゅ'=>'yu',
565
566    // never seen one of those (disabled for the moment)
567    // 'ヴぁ'=>'va','ヴぇ'=>'ve','ヴぃ'=>'vi','ヴぉ'=>'vo','ヴ'=>'vu',
568    // 'でゃ'=>'dha','でぇ'=>'dhe','でぃ'=>'dhi','でょ'=>'dho','でゅ'=>'dhu',
569    // 'どぁ'=>'dwa','どぇ'=>'dwe','どぃ'=>'dwi','どぉ'=>'dwo','どぅ'=>'dwu',
570    // 'ぢゃ'=>'dya','ぢぇ'=>'dye','ぢぃ'=>'dyi','ぢょ'=>'dyo','ぢゅ'=>'dyu',
571    // 'ふぁ'=>'fwa','ふぇ'=>'fwe','ふぃ'=>'fwi','ふぉ'=>'fwo','ふぅ'=>'fwu',
572    // 'ふゃ'=>'fya','ふぇ'=>'fye','ふぃ'=>'fyi','ふょ'=>'fyo','ふゅ'=>'fyu',
573    // 'すぁ'=>'swa','すぇ'=>'swe','すぃ'=>'swi','すぉ'=>'swo','すぅ'=>'swu',
574    // 'てゃ'=>'tha','てぇ'=>'the','てぃ'=>'thi','てょ'=>'tho','てゅ'=>'thu',
575    // 'つゃ'=>'tsa','つぇ'=>'tse','つぃ'=>'tsi','つょ'=>'tso','つ'=>'tsu',
576    // 'とぁ'=>'twa','とぇ'=>'twe','とぃ'=>'twi','とぉ'=>'two','とぅ'=>'twu',
577    // 'ヴゃ'=>'vya','ヴぇ'=>'vye','ヴぃ'=>'vyi','ヴょ'=>'vyo','ヴゅ'=>'vyu',
578    // 'うぁ'=>'wha','うぇ'=>'whe','うぃ'=>'whi','うぉ'=>'who','うぅ'=>'whu',
579    // 'じゃ'=>'zha','じぇ'=>'zhe','じぃ'=>'zhi','じょ'=>'zho','じゅ'=>'zhu',
580    // 'じゃ'=>'zya','じぇ'=>'zye','じぃ'=>'zyi','じょ'=>'zyo','じゅ'=>'zyu',
581
582    // 'spare' characters from other romanization systems
583    // 'だ'=>'da','で'=>'de','ぢ'=>'di','ど'=>'do','づ'=>'du',
584    // 'ら'=>'la','れ'=>'le','り'=>'li','ろ'=>'lo','る'=>'lu',
585    // 'さ'=>'sa','せ'=>'se','し'=>'si','そ'=>'so','す'=>'su',
586    // 'ちゃ'=>'cya','ちぇ'=>'cye','ちぃ'=>'cyi','ちょ'=>'cyo','ちゅ'=>'cyu',
587    //'じゃ'=>'jya','じぇ'=>'jye','じぃ'=>'jyi','じょ'=>'jyo','じゅ'=>'jyu',
588    //'りゃ'=>'lya','りぇ'=>'lye','りぃ'=>'lyi','りょ'=>'lyo','りゅ'=>'lyu',
589    //'しゃ'=>'sya','しぇ'=>'sye','しぃ'=>'syi','しょ'=>'syo','しゅ'=>'syu',
590    //'ちゃ'=>'tya','ちぇ'=>'tye','ちぃ'=>'tyi','ちょ'=>'tyo','ちゅ'=>'tyu',
591    //'し'=>'ci','い'=>'yi','ぢ'=>'dzi',
592    //'っじゃ'=>'jja','っじぇ'=>'jje','っじ'=>'jji','っじょ'=>'jjo','っじゅ'=>'jju',
593
594
595    // Japanese katakana
596
597    // 4 character syllables: ッ doubles the consonant after, ー doubles the vowel before
598    // (usually written with a macron, but we don't want that in our URLs)
599    'ッビャー' => 'bbyaa',
600    'ッビェー' => 'bbyee',
601    'ッビィー' => 'bbyii',
602    'ッビョー' => 'bbyoo',
603    'ッビュー' => 'bbyuu',
604    'ッピャー' => 'ppyaa',
605    'ッピェー' => 'ppyee',
606    'ッピィー' => 'ppyii',
607    'ッピョー' => 'ppyoo',
608    'ッピュー' => 'ppyuu',
609    'ッキャー' => 'kkyaa',
610    'ッキェー' => 'kkyee',
611    'ッキィー' => 'kkyii',
612    'ッキョー' => 'kkyoo',
613    'ッキュー' => 'kkyuu',
614    'ッギャー' => 'ggyaa',
615    'ッギェー' => 'ggyee',
616    'ッギィー' => 'ggyii',
617    'ッギョー' => 'ggyoo',
618    'ッギュー' => 'ggyuu',
619    'ッミャー' => 'mmyaa',
620    'ッミェー' => 'mmyee',
621    'ッミィー' => 'mmyii',
622    'ッミョー' => 'mmyoo',
623    'ッミュー' => 'mmyuu',
624    'ッニャー' => 'nnyaa',
625    'ッニェー' => 'nnyee',
626    'ッニィー' => 'nnyii',
627    'ッニョー' => 'nnyoo',
628    'ッニュー' => 'nnyuu',
629    'ッリャー' => 'rryaa',
630    'ッリェー' => 'rryee',
631    'ッリィー' => 'rryii',
632    'ッリョー' => 'rryoo',
633    'ッリュー' => 'rryuu',
634    'ッシャー' => 'sshaa',
635    'ッシェー' => 'sshee',
636    'ッシー' => 'sshii',
637    'ッショー' => 'sshoo',
638    'ッシュー' => 'sshuu',
639    'ッチャー' => 'cchaa',
640    'ッチェー' => 'cchee',
641    'ッチー' => 'cchii',
642    'ッチョー' => 'cchoo',
643    'ッチュー' => 'cchuu',
644    'ッティー' => 'ttii',
645    'ッヂィー' => 'ddii',
646
647    // 3 character syllables - doubled vowels
648    'ファー' => 'faa', // フ + small vowel + ー: f-row with the vowel doubled
649    'フェー' => 'fee',
650    'フィー' => 'fii',
651    'フォー' => 'foo',
652    'フャー' => 'fyaa',
653    // 'フェー' => 'fyee', // disabled: repeated key; the last value wins in PHP, so it overrode 'fee' above
654    // 'フィー' => 'fyii', // disabled: repeated key; the last value wins in PHP, so it overrode 'fii' above
655    'フョー' => 'fyoo',
656    'フュー' => 'fyuu',
657    'ヒャー' => 'hyaa',
658    'ヒェー' => 'hyee',
659    'ヒィー' => 'hyii',
660    'ヒョー' => 'hyoo',
661    'ヒュー' => 'hyuu',
662    'ビャー' => 'byaa',
663    'ビェー' => 'byee',
664    'ビィー' => 'byii',
665    'ビョー' => 'byoo',
666    'ビュー' => 'byuu',
667    'ピャー' => 'pyaa',
668    'ピェー' => 'pyee',
669    'ピィー' => 'pyii',
670    'ピョー' => 'pyoo',
671    'ピュー' => 'pyuu',
672    'キャー' => 'kyaa',
673    'キェー' => 'kyee',
674    'キィー' => 'kyii',
675    'キョー' => 'kyoo',
676    'キュー' => 'kyuu',
677    'ギャー' => 'gyaa',
678    'ギェー' => 'gyee',
679    'ギィー' => 'gyii',
680    'ギョー' => 'gyoo',
681    'ギュー' => 'gyuu',
682    'ミャー' => 'myaa',
683    'ミェー' => 'myee',
684    'ミィー' => 'myii',
685    'ミョー' => 'myoo',
686    'ミュー' => 'myuu',
687    'ニャー' => 'nyaa',
688    'ニェー' => 'nyee',
689    'ニィー' => 'nyii',
690    'ニョー' => 'nyoo',
691    'ニュー' => 'nyuu',
692    'リャー' => 'ryaa',
693    'リェー' => 'ryee',
694    'リィー' => 'ryii',
695    'リョー' => 'ryoo',
696    'リュー' => 'ryuu',
697    'シャー' => 'shaa',
698    'シェー' => 'shee',
699    'シー' => 'shii',
700    'ショー' => 'shoo',
701    'シュー' => 'shuu',
702    'ジャー' => 'jaa',
703    'ジェー' => 'jee',
704    'ジー' => 'jii',
705    'ジョー' => 'joo',
706    'ジュー' => 'juu',
707    'スァー' => 'swaa',
708    'スェー' => 'swee',
709    'スィー' => 'swii',
710    'スォー' => 'swoo',
711    'スゥー' => 'swuu',
712    'デァー' => 'daa',
713    'デェー' => 'dee',
714    'ディー' => 'dii',
715    'デォー' => 'doo',
716    'デゥー' => 'duu',
717    'チャー' => 'chaa',
718    'チェー' => 'chee',
719    'チー' => 'chii',
720    'チョー' => 'choo',
721    'チュー' => 'chuu',
722    'ヂャー' => 'dyaa',
723    'ヂェー' => 'dyee',
724    'ヂィー' => 'dyii',
725    'ヂョー' => 'dyoo',
726    'ヂュー' => 'dyuu',
727    'ツャー' => 'tsaa',
728    'ツェー' => 'tsee',
729    'ツィー' => 'tsii',
730    'ツョー' => 'tsoo',
731    'ツー' => 'tsuu',
732    'トァー' => 'twaa',
733    'トェー' => 'twee',
734    'トィー' => 'twii',
735    'トォー' => 'twoo',
736    'トゥー' => 'twuu',
737    'ドァー' => 'dwaa',
738    'ドェー' => 'dwee',
739    'ドィー' => 'dwii',
740    'ドォー' => 'dwoo',
741    'ドゥー' => 'dwuu',
742    'ウァー' => 'whaa',
743    'ウェー' => 'whee',
744    'ウィー' => 'whii',
745    'ウォー' => 'whoo',
746    'ウゥー' => 'whuu',
747    'ヴャー' => 'vyaa',
748    'ヴェー' => 'vyee',
749    'ヴィー' => 'vyii',
750    'ヴョー' => 'vyoo',
751    'ヴュー' => 'vyuu',
752    'ヴァー' => 'vaa',
753    'ヴェー' => 'vee',
754    'ヴィー' => 'vii',
755    'ヴォー' => 'voo',
756    'ヴー' => 'vuu',
757    'ウェー' => 'wee',
758    'ウィー' => 'wii',
759    'イェー' => 'yee',
760    'ティー' => 'tii',
761    'ヂィー' => 'dii',
762
763    // 3 character syllables - doubled consonants
764    'ッビャ' => 'bbya',
765    'ッビェ' => 'bbye',
766    'ッビィ' => 'bbyi',
767    'ッビョ' => 'bbyo',
768    'ッビュ' => 'bbyu',
769    'ッピャ' => 'ppya',
770    'ッピェ' => 'ppye',
771    'ッピィ' => 'ppyi',
772    'ッピョ' => 'ppyo',
773    'ッピュ' => 'ppyu',
774    'ッキャ' => 'kkya',
775    'ッキェ' => 'kkye',
776    'ッキィ' => 'kkyi',
777    'ッキョ' => 'kkyo',
778    'ッキュ' => 'kkyu',
779    'ッギャ' => 'ggya',
780    'ッギェ' => 'ggye',
781    'ッギィ' => 'ggyi',
782    'ッギョ' => 'ggyo',
783    'ッギュ' => 'ggyu',
784    'ッミャ' => 'mmya',
785    'ッミェ' => 'mmye',
786    'ッミィ' => 'mmyi',
787    'ッミョ' => 'mmyo',
788    'ッミュ' => 'mmyu',
789    'ッニャ' => 'nnya',
790    'ッニェ' => 'nnye',
791    'ッニィ' => 'nnyi',
792    'ッニョ' => 'nnyo',
793    'ッニュ' => 'nnyu',
794    'ッリャ' => 'rrya',
795    'ッリェ' => 'rrye',
796    'ッリィ' => 'rryi',
797    'ッリョ' => 'rryo',
798    'ッリュ' => 'rryu',
799    'ッシャ' => 'ssha',
800    'ッシェ' => 'sshe',
801    'ッシ' => 'sshi',
802    'ッショ' => 'ssho',
803    'ッシュ' => 'sshu',
804    'ッチャ' => 'ccha',
805    'ッチェ' => 'cche',
806    'ッチ' => 'cchi',
807    'ッチョ' => 'ccho',
808    'ッチュ' => 'cchu',
809    'ッティ' => 'tti',
810    'ッヂィ' => 'ddi',
811
812    // 3 character syllables - doubled vowel and consonants
813    'ッバー' => 'bbaa',
814    'ッベー' => 'bbee',
815    'ッビー' => 'bbii',
816    'ッボー' => 'bboo',
817    'ッブー' => 'bbuu',
818    'ッパー' => 'ppaa',
819    'ッペー' => 'ppee',
820    'ッピー' => 'ppii',
821    'ッポー' => 'ppoo',
822    'ップー' => 'ppuu',
823    'ッケー' => 'kkee',
824    'ッキー' => 'kkii',
825    'ッコー' => 'kkoo',
826    'ックー' => 'kkuu',
827    'ッカー' => 'kkaa',
828    'ッガー' => 'ggaa',
829    'ッゲー' => 'ggee',
830    'ッギー' => 'ggii',
831    'ッゴー' => 'ggoo',
832    'ッグー' => 'gguu',
833    'ッマー' => 'mmaa', // ッ doubles the following consonant; these rows previously emitted a single 'm'
834    'ッメー' => 'mmee',
835    'ッミー' => 'mmii',
836    'ッモー' => 'mmoo',
837    'ッムー' => 'mmuu',
838    'ッナー' => 'nnaa',
839    'ッネー' => 'nnee',
840    'ッニー' => 'nnii',
841    'ッノー' => 'nnoo',
842    'ッヌー' => 'nnuu',
843    'ッラー' => 'rraa',
844    'ッレー' => 'rree',
845    'ッリー' => 'rrii',
846    'ッロー' => 'rroo',
847    'ッルー' => 'rruu',
848    'ッサー' => 'ssaa',
849    'ッセー' => 'ssee',
850    'ッシー' => 'sshii',
851    'ッソー' => 'ssoo',
852    'ッスー' => 'ssuu',
853    'ッザー' => 'zzaa',
854    'ッゼー' => 'zzee',
855    'ッジー' => 'jjii',
856    'ッゾー' => 'zzoo',
857    'ッズー' => 'zzuu',
858    'ッター' => 'ttaa',
859    'ッテー' => 'ttee',
860    'ッチー' => 'cchii', // was 'chii': dropped the doubled consonant and overrode the earlier 'cchii' entry for the same key
861    'ットー' => 'ttoo',
862    'ッツー' => 'ttsuu',
863    'ッダー' => 'ddaa',
864    'ッデー' => 'ddee',
865    'ッヂー' => 'ddii',
866    'ッドー' => 'ddoo',
867    'ッヅー' => 'dduu',
868
869    // 2 character syllables - normal
870    'ファ' => 'fa',
871    'フェ' => 'fe',
872    'フィ' => 'fi',
873    'フォ' => 'fo',
874    'フゥ' => 'fu',
875    // 'フャ'=>'fya',
876    // 'フェ'=>'fye',
877    // 'フィ'=>'fyi',
878    // 'フョ'=>'fyo',
879    // 'フュ'=>'fyu',
880    'フャ' => 'fa',
881    'フェ' => 'fe',
882    'フィ' => 'fi',
883    'フョ' => 'fo',
884    'フュ' => 'fu',
885    'ヒャ' => 'hya',
886    'ヒェ' => 'hye',
887    'ヒィ' => 'hyi',
888    'ヒョ' => 'hyo',
889    'ヒュ' => 'hyu',
890    'ビャ' => 'bya',
891    'ビェ' => 'bye',
892    'ビィ' => 'byi',
893    'ビョ' => 'byo',
894    'ビュ' => 'byu',
895    'ピャ' => 'pya',
896    'ピェ' => 'pye',
897    'ピィ' => 'pyi',
898    'ピョ' => 'pyo',
899    'ピュ' => 'pyu',
900    'キャ' => 'kya',
901    'キェ' => 'kye',
902    'キィ' => 'kyi',
903    'キョ' => 'kyo',
904    'キュ' => 'kyu',
905    'ギャ' => 'gya',
906    'ギェ' => 'gye',
907    'ギィ' => 'gyi',
908    'ギョ' => 'gyo',
909    'ギュ' => 'gyu',
910    'ミャ' => 'mya',
911    'ミェ' => 'mye',
912    'ミィ' => 'myi',
913    'ミョ' => 'myo',
914    'ミュ' => 'myu',
915    'ニャ' => 'nya',
916    'ニェ' => 'nye',
917    'ニィ' => 'nyi',
918    'ニョ' => 'nyo',
919    'ニュ' => 'nyu',
920    'リャ' => 'rya',
921    'リェ' => 'rye',
922    'リィ' => 'ryi',
923    'リョ' => 'ryo',
924    'リュ' => 'ryu',
925    'シャ' => 'sha',
926    'シェ' => 'she',
927    'ショ' => 'sho',
928    'シュ' => 'shu',
929    'ジャ' => 'ja',
930    'ジェ' => 'je',
931    'ジョ' => 'jo',
932    'ジュ' => 'ju',
933    'スァ' => 'swa',
934    'スェ' => 'swe',
935    'スィ' => 'swi',
936    'スォ' => 'swo',
937    'スゥ' => 'swu',
938    'デァ' => 'da',
939    'デェ' => 'de',
940    'ディ' => 'di',
941    'デォ' => 'do',
942    'デゥ' => 'du',
943    'チャ' => 'cha',
944    'チェ' => 'che',
945    'チ' => 'chi',
946    'チョ' => 'cho',
947    'チュ' => 'chu',
948    // 'ヂャ'=>'dya',
949    // 'ヂェ'=>'dye',
950    // 'ヂィ'=>'dyi',
951    // 'ヂョ'=>'dyo',
952    // 'ヂュ'=>'dyu',
953    'ツャ' => 'tsa',
954    'ツェ' => 'tse',
955    'ツィ' => 'tsi',
956    'ツョ' => 'tso',
957    'ツ' => 'tsu',
958    'トァ' => 'twa',
959    'トェ' => 'twe',
960    'トィ' => 'twi',
961    'トォ' => 'two',
962    'トゥ' => 'twu',
963    'ドァ' => 'dwa',
964    'ドェ' => 'dwe',
965    'ドィ' => 'dwi',
966    'ドォ' => 'dwo',
967    'ドゥ' => 'dwu',
968    'ウァ' => 'wha',
969    'ウェ' => 'whe',
970    'ウィ' => 'whi',
971    'ウォ' => 'who',
972    'ウゥ' => 'whu',
973    'ヴャ' => 'vya',
974    'ヴェ' => 'vye',
975    'ヴィ' => 'vyi',
976    'ヴョ' => 'vyo',
977    'ヴュ' => 'vyu',
978    'ヴァ' => 'va',
979    'ヴェ' => 've',
980    'ヴィ' => 'vi',
981    'ヴォ' => 'vo',
982    'ヴ' => 'vu',
983    'ウェ' => 'we',
984    'ウィ' => 'wi',
985    'イェ' => 'ye',
986    'ティ' => 'ti',
987    'ヂィ' => 'di',
988
989    // 2 character syllables - doubled vowel
990    'アー' => 'aa',
991    'エー' => 'ee',
992    'イー' => 'ii',
993    'オー' => 'oo',
994    'ウー' => 'uu',
995    'ダー' => 'daa',
996    'デー' => 'dee',
997    'ヂー' => 'dii',
998    'ドー' => 'doo',
999    'ヅー' => 'duu',
1000    'ハー' => 'haa',
1001    'ヘー' => 'hee',
1002    'ヒー' => 'hii',
1003    'ホー' => 'hoo',
1004    'フー' => 'fuu',
1005    'バー' => 'baa',
1006    'ベー' => 'bee',
1007    'ビー' => 'bii',
1008    'ボー' => 'boo',
1009    'ブー' => 'buu',
1010    'パー' => 'paa',
1011    'ペー' => 'pee',
1012    'ピー' => 'pii',
1013    'ポー' => 'poo',
1014    'プー' => 'puu',
1015    'ケー' => 'kee',
1016    'キー' => 'kii',
1017    'コー' => 'koo',
1018    'クー' => 'kuu',
1019    'カー' => 'kaa',
1020    'ガー' => 'gaa',
1021    'ゲー' => 'gee',
1022    'ギー' => 'gii',
1023    'ゴー' => 'goo',
1024    'グー' => 'guu',
1025    'マー' => 'maa',
1026    'メー' => 'mee',
1027    'ミー' => 'mii',
1028    'モー' => 'moo',
1029    'ムー' => 'muu',
1030    'ナー' => 'naa',
1031    'ネー' => 'nee',
1032    'ニー' => 'nii',
1033    'ノー' => 'noo',
1034    'ヌー' => 'nuu',
1035    'ラー' => 'raa',
1036    'レー' => 'ree',
1037    'リー' => 'rii',
1038    'ロー' => 'roo',
1039    'ルー' => 'ruu',
1040    'サー' => 'saa',
1041    'セー' => 'see',
1042    'シー' => 'shii',
1043    'ソー' => 'soo',
1044    'スー' => 'suu',
1045    'ザー' => 'zaa',
1046    'ゼー' => 'zee',
1047    'ジー' => 'jii',
1048    'ゾー' => 'zoo',
1049    'ズー' => 'zuu',
1050    'ター' => 'taa',
1051    'テー' => 'tee',
1052    'チー' => 'chii',
1053    'トー' => 'too',
1054    'ツー' => 'tsuu',
1055    'ワー' => 'waa',
1056    'ヲー' => 'woo',
1057    'ヤー' => 'yaa',
1058    'ヨー' => 'yoo',
1059    'ユー' => 'yuu',
1060    'ヵー' => 'kaa',
1061    'ヶー' => 'kee',
1062    // old characters
1063    'ヱー' => 'wee',
1064    'ヰー' => 'wii',
1065
1066    // separate katakana 'n'
1067    'ンア' => 'n_a',
1068    'ンエ' => 'n_e',
1069    'ンイ' => 'n_i',
1070    'ンオ' => 'n_o',
1071    'ンウ' => 'n_u',
1072    'ンヤ' => 'n_ya',
1073    'ンヨ' => 'n_yo',
1074    'ンユ' => 'n_yu',
1075
1076    // 2 character syllables - doubled consonants
1077    'ッバ' => 'bba',
1078    'ッベ' => 'bbe',
1079    'ッビ' => 'bbi',
1080    'ッボ' => 'bbo',
1081    'ッブ' => 'bbu',
1082    'ッパ' => 'ppa',
1083    'ッペ' => 'ppe',
1084    'ッピ' => 'ppi',
1085    'ッポ' => 'ppo',
1086    'ップ' => 'ppu',
1087    'ッケ' => 'kke',
1088    'ッキ' => 'kki',
1089    'ッコ' => 'kko',
1090    'ック' => 'kku',
1091    'ッカ' => 'kka',
1092    'ッガ' => 'gga',
1093    'ッゲ' => 'gge',
1094    'ッギ' => 'ggi',
1095    'ッゴ' => 'ggo',
1096    'ッグ' => 'ggu',
1097    'ッマ' => 'mma', // ッ doubles the following consonant; these rows previously emitted a single 'm'
1098    'ッメ' => 'mme',
1099    'ッミ' => 'mmi',
1100    'ッモ' => 'mmo',
1101    'ッム' => 'mmu',
1102    'ッナ' => 'nna',
1103    'ッネ' => 'nne',
1104    'ッニ' => 'nni',
1105    'ッノ' => 'nno',
1106    'ッヌ' => 'nnu',
1107    'ッラ' => 'rra',
1108    'ッレ' => 'rre',
1109    'ッリ' => 'rri',
1110    'ッロ' => 'rro',
1111    'ッル' => 'rru',
1112    'ッサ' => 'ssa',
1113    'ッセ' => 'sse',
1114    'ッシ' => 'sshi',
1115    'ッソ' => 'sso',
1116    'ッス' => 'ssu',
1117    'ッザ' => 'zza',
1118    'ッゼ' => 'zze',
1119    'ッジ' => 'jji',
1120    'ッゾ' => 'zzo',
1121    'ッズ' => 'zzu',
1122    'ッタ' => 'tta',
1123    'ッテ' => 'tte',
1124    'ッチ' => 'cchi',
1125    'ット' => 'tto',
1126    'ッツ' => 'ttsu',
1127    'ッダ' => 'dda',
1128    'ッデ' => 'dde',
1129    'ッヂ' => 'ddi',
1130    'ッド' => 'ddo',
1131    'ッヅ' => 'ddu',
1132
1133    // 1 character syllables
1134    'ア' => 'a',
1135    'エ' => 'e',
1136    'イ' => 'i',
1137    'オ' => 'o',
1138    'ウ' => 'u',
1139    'ン' => 'n',
1140    'ハ' => 'ha',
1141    'ヘ' => 'he',
1142    'ヒ' => 'hi',
1143    'ホ' => 'ho',
1144    'フ' => 'fu',
1145    'バ' => 'ba',
1146    'ベ' => 'be',
1147    'ビ' => 'bi',
1148    'ボ' => 'bo',
1149    'ブ' => 'bu',
1150    'パ' => 'pa',
1151    'ペ' => 'pe',
1152    'ピ' => 'pi',
1153    'ポ' => 'po',
1154    'プ' => 'pu',
1155    'ケ' => 'ke',
1156    'キ' => 'ki',
1157    'コ' => 'ko',
1158    'ク' => 'ku',
1159    'カ' => 'ka',
1160    'ガ' => 'ga',
1161    'ゲ' => 'ge',
1162    'ギ' => 'gi',
1163    'ゴ' => 'go',
1164    'グ' => 'gu',
1165    'マ' => 'ma',
1166    'メ' => 'me',
1167    'ミ' => 'mi',
1168    'モ' => 'mo',
1169    'ム' => 'mu',
1170    'ナ' => 'na',
1171    'ネ' => 'ne',
1172    'ニ' => 'ni',
1173    'ノ' => 'no',
1174    'ヌ' => 'nu',
1175    'ラ' => 'ra',
1176    'レ' => 're',
1177    'リ' => 'ri',
1178    'ロ' => 'ro',
1179    'ル' => 'ru',
1180    'サ' => 'sa',
1181    'セ' => 'se',
1182    'シ' => 'shi',
1183    'ソ' => 'so',
1184    'ス' => 'su',
1185    'ザ' => 'za',
1186    'ゼ' => 'ze',
1187    'ジ' => 'ji',
1188    'ゾ' => 'zo',
1189    'ズ' => 'zu',
1190    'タ' => 'ta',
1191    'テ' => 'te',
1192    'チ' => 'chi',
1193    'ト' => 'to',
1194    'ツ' => 'tsu',
1195    'ダ' => 'da',
1196    'デ' => 'de',
1197    'ヂ' => 'di',
1198    'ド' => 'do',
1199    'ヅ' => 'du',
1200    'ワ' => 'wa',
1201    'ヲ' => 'wo',
1202    'ヤ' => 'ya',
1203    'ヨ' => 'yo',
1204    'ユ' => 'yu',
1205    'ヵ' => 'ka',
1206    'ヶ' => 'ke',
1207    // old characters
1208    'ヱ' => 'we',
1209    'ヰ' => 'wi',
1210
1211    //  convert what's left (probably only kicks in when something's missing above)
1212    'ァ' => 'a',
1213    'ェ' => 'e',
1214    'ィ' => 'i',
1215    'ォ' => 'o',
1216    'ゥ' => 'u',
1217    'ャ' => 'ya',
1218    'ョ' => 'yo',
1219    'ュ' => 'yu',
1220
1221    // special characters
1222    '・' => '_',
1223    '、' => '_',
1224    'ー' => '_',
1225    // when used with hiragana (seldom), this character would not be converted otherwise
1226
1227    // 'ラ'=>'la',
1228    // 'レ'=>'le',
1229    // 'リ'=>'li',
1230    // 'ロ'=>'lo',
1231    // 'ル'=>'lu',
1232    // 'チャ'=>'cya',
1233    // 'チェ'=>'cye',
1234    // 'チィ'=>'cyi',
1235    // 'チョ'=>'cyo',
1236    // 'チュ'=>'cyu',
1237    // 'デャ'=>'dha',
1238    // 'デェ'=>'dhe',
1239    // 'ディ'=>'dhi',
1240    // 'デョ'=>'dho',
1241    // 'デュ'=>'dhu',
1242    // 'リャ'=>'lya',
1243    // 'リェ'=>'lye',
1244    // 'リィ'=>'lyi',
1245    // 'リョ'=>'lyo',
1246    // 'リュ'=>'lyu',
1247    // 'テャ'=>'tha',
1248    // 'テェ'=>'the',
1249    // 'ティ'=>'thi',
1250    // 'テョ'=>'tho',
1251    // 'テュ'=>'thu',
1252    // 'ファ'=>'fwa',
1253    // 'フェ'=>'fwe',
1254    // 'フィ'=>'fwi',
1255    // 'フォ'=>'fwo',
1256    // 'フゥ'=>'fwu',
1257    // 'チャ'=>'tya',
1258    // 'チェ'=>'tye',
1259    // 'チィ'=>'tyi',
1260    // 'チョ'=>'tyo',
1261    // 'チュ'=>'tyu',
1262    // 'ジャ'=>'jya',
1263    // 'ジェ'=>'jye',
1264    // 'ジィ'=>'jyi',
1265    // 'ジョ'=>'jyo',
1266    // 'ジュ'=>'jyu',
1267    // 'ジャ'=>'zha',
1268    // 'ジェ'=>'zhe',
1269    // 'ジィ'=>'zhi',
1270    // 'ジョ'=>'zho',
1271    // 'ジュ'=>'zhu',
1272    // 'ジャ'=>'zya',
1273    // 'ジェ'=>'zye',
1274    // 'ジィ'=>'zyi',
1275    // 'ジョ'=>'zyo',
1276    // 'ジュ'=>'zyu',
1277    // 'シャ'=>'sya',
1278    // 'シェ'=>'sye',
1279    // 'シィ'=>'syi',
1280    // 'ショ'=>'syo',
1281    // 'シュ'=>'syu',
1282    // 'シ'=>'ci',
1283    // 'フ'=>'hu',
1284    // 'シ'=>'si',
1285    // 'チ'=>'ti',
1286    // 'ツ'=>'tu',
1287    // 'イ'=>'yi',
1288    // 'ヂ'=>'dzi',
1289
1290    // "Greeklish"
1291    'Α' => 'a',
1292    'Ά' => 'a',
1293    'Β' => 'b',
1294    'Γ' => 'g',
1295    'Δ' => 'd',
1296    'Ε' => 'e',
1297    'Έ' => 'e',
1298    'Ζ' => 'z',
1299    'Η' => 'i',
1300    'Ή' => 'i',
1301    'Θ' => 'th',
1302    'Ι' => 'i',
1303    'Ί' => 'i',
1304    'Ϊ' => 'i',
1305    'ΐ' => 'i',
1306    'Κ' => 'k',
1307    'Λ' => 'l',
1308    'Μ' => 'm',
1309    'Ν' => 'n',
1310    'Ξ' => 'x',
1311    'Ο' => 'o',
1312    'Ό' => 'o',
1313    'Π' => 'p',
1314    'Ρ' => 'r',
1315    'Σ' => 's',
1316    'Τ' => 't',
1317    'Υ' => 'y',
1318    'Ύ' => 'y',
1319    'Ϋ' => 'y',
1320    'ΰ' => 'y',
1321    'Φ' => 'f',
1322    'Χ' => 'ch',
1323    'Ψ' => 'ps',
1324    'Ω' => 'o',
1325    'Ώ' => 'o',
1326    'α' => 'a',
1327    'ά' => 'a',
1328    'β' => 'b',
1329    'γ' => 'g',
1330    'δ' => 'd',
1331    'ε' => 'e',
1332    'έ' => 'e',
1333    'ζ' => 'z',
1334    'η' => 'i',
1335    'ή' => 'i',
1336    'θ' => 'th',
1337    'ι' => 'i',
1338    'ί' => 'i',
1339    'ϊ' => 'i',
1340    'κ' => 'k',
1341    'λ' => 'l',
1342    'μ' => 'm',
1343    'ν' => 'n',
1344    'ξ' => 'x',
1345    'ο' => 'o',
1346    'ό' => 'o',
1347    'π' => 'p',
1348    'ρ' => 'r',
1349    'σ' => 's',
1350    'ς' => 's',
1351    'τ' => 't',
1352    'υ' => 'y',
1353    'ύ' => 'y',
1354    'ϋ' => 'y',
1355    'φ' => 'f',
1356    'χ' => 'ch',
1357    'ψ' => 'ps',
1358    'ω' => 'o',
1359    'ώ' => 'o',
1360
1361    // Thai
1362    'ก' => 'k',
1363    'ข' => 'kh',
1364    'ฃ' => 'kh',
1365    'ค' => 'kh',
1366    'ฅ' => 'kh',
1367    'ฆ' => 'kh',
1368    'ง' => 'ng',
1369    'จ' => 'ch',
1370    'ฉ' => 'ch',
1371    'ช' => 'ch',
1372    'ซ' => 's',
1373    'ฌ' => 'ch',
1374    'ญ' => 'y',
1375    'ฎ' => 'd',
1376    'ฏ' => 't',
1377    'ฐ' => 'th',
1378    'ฑ' => 'd',
1379    'ฒ' => 'th',
1380    'ณ' => 'n',
1381    'ด' => 'd',
1382    'ต' => 't',
1383    'ถ' => 'th',
1384    'ท' => 'th',
1385    'ธ' => 'th',
1386    'น' => 'n',
1387    'บ' => 'b',
1388    'ป' => 'p',
1389    'ผ' => 'ph',
1390    'ฝ' => 'f',
1391    'พ' => 'ph',
1392    'ฟ' => 'f',
1393    'ภ' => 'ph',
1394    'ม' => 'm',
1395    'ย' => 'y',
1396    'ร' => 'r',
1397    'ฤ' => 'rue',
1398    'ฤๅ' => 'rue',
1399    'ล' => 'l',
1400    'ฦ' => 'lue',
1401    'ฦๅ' => 'lue',
1402    'ว' => 'w',
1403    'ศ' => 's',
1404    'ษ' => 's',
1405    'ส' => 's',
1406    'ห' => 'h',
1407    'ฬ' => 'l',
1408    'ฮ' => 'h',
1409    'ะ' => 'a',
1410    'ั' => 'a',
1411    'รร' => 'a',
1412    'า' => 'a',
1413    'ๅ' => 'a',
1414    'ำ' => 'am',
1415    'ํา' => 'am',
1416    'ิ' => 'i', // short/long pairs of the above- and below-consonant vowel signs share one romanization
1417    'ี' => 'i',
1418    'ึ' => 'ue',
1419    'ื' => 'ue', // sara uee (U+0E37); the key was a second 'ี' (U+0E35), which overrode 'i' above
1420    'ุ' => 'u',
1421    'ู' => 'u',
1422    'เ' => 'e',
1423    'แ' => 'ae',
1424    'โ' => 'o',
1425    'อ' => 'o',
1426    'ียะ' => 'ia',
1427    'ีย' => 'ia',
1428    'ือะ' => 'uea',
1429    'ือ' => 'uea',
1430    'ัวะ' => 'ua',
1431    'ัว' => 'ua',
1432    'ใ' => 'ai',
1433    'ไ' => 'ai',
1434    'ัย' => 'ai',
1435    'าย' => 'ai',
1436    'าว' => 'ao',
1437    'ุย' => 'ui',
1438    'อย' => 'oi',
1439    'ือย' => 'ueai',
1440    'วย' => 'uai',
1441    'ิว' => 'io',
1442    '็ว' => 'eo',
1443    'ียว' => 'iao',
1444    '่' => '',
1445    '้' => '',
1446    '๊' => '',
1447    '๋' => '',
1448    '็' => '',
1449    '์' => '',
1450    '๎' => '',
1451    'ํ' => '',
1452    'ฺ' => '',
1453    'ๆ' => '2',
1454    '๏' => 'o',
1455    'ฯ' => '-',
1456    '๚' => '-',
1457    '๛' => '-',
1458    '๐' => '0',
1459    '๑' => '1',
1460    '๒' => '2',
1461    '๓' => '3',
1462    '๔' => '4',
1463    '๕' => '5',
1464    '๖' => '6',
1465    '๗' => '7',
1466    '๘' => '8',
1467    '๙' => '9',
1468
1469    // Korean
1470    'ㄱ' => 'k', 'ㅋ' => 'kh',
1471    'ㄲ' => 'kk',
1472    'ㄷ' => 't',
1473    'ㅌ' => 'th',
1474    'ㄸ' => 'tt',
1475    'ㅂ' => 'p',
1476    'ㅍ' => 'ph',
1477    'ㅃ' => 'pp',
1478    'ㅈ' => 'c',
1479    'ㅊ' => 'ch',
1480    'ㅉ' => 'cc',
1481    'ㅅ' => 's',
1482    'ㅆ' => 'ss',
1483    'ㅎ' => 'h',
1484    'ㅇ' => 'ng',
1485    'ㄴ' => 'n',
1486    'ㄹ' => 'l',
1487    'ㅁ' => 'm',
1488    'ㅏ' => 'a',
1489    'ㅓ' => 'e',
1490    'ㅗ' => 'o',
1491    'ㅜ' => 'wu',
1492    'ㅡ' => 'u',
1493    'ㅣ' => 'i',
1494    'ㅐ' => 'ay',
1495    'ㅔ' => 'ey',
1496    'ㅚ' => 'oy',
1497    'ㅘ' => 'wa',
1498    'ㅝ' => 'we',
1499    'ㅟ' => 'wi',
1500    'ㅙ' => 'way',
1501    'ㅞ' => 'wey',
1502    'ㅢ' => 'uy',
1503    'ㅑ' => 'ya', // y-initial vowels: 'y' + the romanization of the plain vowel
1504    'ㅕ' => 'ye',
1505    'ㅛ' => 'yo', // was 'oy', the value already used for 'ㅚ'
1506    'ㅠ' => 'yu',
1507    'ㅒ' => 'yay',
1508    'ㅖ' => 'yey',
1509];
1510