xref: /dokuwiki/inc/Utf8/tables/romanization.php (revision 130677782a0ecc9e606d2224faebae95c406f280)
1*13067778SAndreas Gohr<?php
2*13067778SAndreas Gohr/**
3*13067778SAndreas Gohr * Romanization lookup table
4*13067778SAndreas Gohr *
5*13067778SAndreas Gohr * This lookup table provides a way to transform strings written in a language
6*13067778SAndreas Gohr * different from the ones based upon Latin letters into plain ASCII.
7*13067778SAndreas Gohr *
8*13067778SAndreas Gohr * Please note: this is not a scientific transliteration table. It only works
9*13067778SAndreas Gohr * one-way from non-Latin to ASCII and it works by simple character replacement
10*13067778SAndreas Gohr * only. Specialities of each language are not supported.
11*13067778SAndreas Gohr *
12*13067778SAndreas Gohr * @todo some keys are used multiple times
13*13067778SAndreas Gohr * @todo remove or integrate commented pairs
14*13067778SAndreas Gohr *
15*13067778SAndreas Gohr * @author Andreas Gohr <andi@splitbrain.org>
16*13067778SAndreas Gohr * @author Vitaly Blokhin <vitinfo@vitn.com>
17*13067778SAndreas Gohr * @author Bisqwit <bisqwit@iki.fi>
18*13067778SAndreas Gohr * @author Arthit Suriyawongkul <arthit@gmail.com>
19*13067778SAndreas Gohr * @author Denis Scheither <amorphis@uni-bremen.de>
20*13067778SAndreas Gohr * @author Eivind Morland <eivind.morland@gmail.com>
21*13067778SAndreas Gohr * @link   http://www.uconv.com/translit.htm
22*13067778SAndreas Gohr * @link   http://kanjidict.stc.cx/hiragana.php?src=2
23*13067778SAndreas Gohr * @link   http://www.translatum.gr/converter/greek-transliteration.htm
24*13067778SAndreas Gohr * @link   http://en.wikipedia.org/wiki/Royal_Thai_General_System_of_Transcription
25*13067778SAndreas Gohr * @link   http://www.btranslations.com/resources/romanization/korean.asp
26*13067778SAndreas Gohr */
27*13067778SAndreas Gohrreturn [
28*13067778SAndreas Gohr    // scandinavian - differs from what we do in deaccent
29*13067778SAndreas Gohr    'å' => 'a',
30*13067778SAndreas Gohr    'Å' => 'A',
31*13067778SAndreas Gohr    'ä' => 'a',
32*13067778SAndreas Gohr    'Ä' => 'A',
33*13067778SAndreas Gohr    'ö' => 'o',
34*13067778SAndreas Gohr    'Ö' => 'O',
35*13067778SAndreas Gohr
36*13067778SAndreas Gohr    //russian cyrillic
37*13067778SAndreas Gohr    'а' => 'a',
38*13067778SAndreas Gohr    'А' => 'A',
39*13067778SAndreas Gohr    'б' => 'b',
40*13067778SAndreas Gohr    'Б' => 'B',
41*13067778SAndreas Gohr    'в' => 'v',
42*13067778SAndreas Gohr    'В' => 'V',
43*13067778SAndreas Gohr    'г' => 'g',
44*13067778SAndreas Gohr    'Г' => 'G',
45*13067778SAndreas Gohr    'д' => 'd',
46*13067778SAndreas Gohr    'Д' => 'D',
47*13067778SAndreas Gohr    'е' => 'e',
48*13067778SAndreas Gohr    'Е' => 'E',
49*13067778SAndreas Gohr    'ё' => 'jo',
50*13067778SAndreas Gohr    'Ё' => 'Jo',
51*13067778SAndreas Gohr    'ж' => 'zh',
52*13067778SAndreas Gohr    'Ж' => 'Zh',
53*13067778SAndreas Gohr    'з' => 'z',
54*13067778SAndreas Gohr    'З' => 'Z',
55*13067778SAndreas Gohr    'и' => 'i',
56*13067778SAndreas Gohr    'И' => 'I',
57*13067778SAndreas Gohr    'й' => 'j',
58*13067778SAndreas Gohr    'Й' => 'J',
59*13067778SAndreas Gohr    'к' => 'k',
60*13067778SAndreas Gohr    'К' => 'K',
61*13067778SAndreas Gohr    'л' => 'l',
62*13067778SAndreas Gohr    'Л' => 'L',
63*13067778SAndreas Gohr    'м' => 'm',
64*13067778SAndreas Gohr    'М' => 'M',
65*13067778SAndreas Gohr    'н' => 'n',
66*13067778SAndreas Gohr    'Н' => 'N',
67*13067778SAndreas Gohr    'о' => 'o',
68*13067778SAndreas Gohr    'О' => 'O',
69*13067778SAndreas Gohr    'п' => 'p',
70*13067778SAndreas Gohr    'П' => 'P',
71*13067778SAndreas Gohr    'р' => 'r',
72*13067778SAndreas Gohr    'Р' => 'R',
73*13067778SAndreas Gohr    'с' => 's',
74*13067778SAndreas Gohr    'С' => 'S',
75*13067778SAndreas Gohr    'т' => 't',
76*13067778SAndreas Gohr    'Т' => 'T',
77*13067778SAndreas Gohr    'у' => 'u',
78*13067778SAndreas Gohr    'У' => 'U',
79*13067778SAndreas Gohr    'ф' => 'f',
80*13067778SAndreas Gohr    'Ф' => 'F',
81*13067778SAndreas Gohr    'х' => 'x',
82*13067778SAndreas Gohr    'Х' => 'X',
83*13067778SAndreas Gohr    'ц' => 'c',
84*13067778SAndreas Gohr    'Ц' => 'C',
85*13067778SAndreas Gohr    'ч' => 'ch',
86*13067778SAndreas Gohr    'Ч' => 'Ch',
87*13067778SAndreas Gohr    'ш' => 'sh',
88*13067778SAndreas Gohr    'Ш' => 'Sh',
89*13067778SAndreas Gohr    'щ' => 'sch',
90*13067778SAndreas Gohr    'Щ' => 'Sch',
91*13067778SAndreas Gohr    'ъ' => '',
92*13067778SAndreas Gohr    'Ъ' => '',
93*13067778SAndreas Gohr    'ы' => 'y',
94*13067778SAndreas Gohr    'Ы' => 'Y',
95*13067778SAndreas Gohr    'ь' => '',
96*13067778SAndreas Gohr    'Ь' => '',
97*13067778SAndreas Gohr    'э' => 'eh',
98*13067778SAndreas Gohr    'Э' => 'Eh',
99*13067778SAndreas Gohr    'ю' => 'ju',
100*13067778SAndreas Gohr    'Ю' => 'Ju',
101*13067778SAndreas Gohr    'я' => 'ja',
102*13067778SAndreas Gohr    'Я' => 'Ja',
103*13067778SAndreas Gohr
104*13067778SAndreas Gohr    // Ukrainian cyrillic
105*13067778SAndreas Gohr    'Ґ' => 'Gh',
106*13067778SAndreas Gohr    'ґ' => 'gh',
107*13067778SAndreas Gohr    'Є' => 'Je',
108*13067778SAndreas Gohr    'є' => 'je',
109*13067778SAndreas Gohr    'І' => 'I',
110*13067778SAndreas Gohr    'і' => 'i',
111*13067778SAndreas Gohr    'Ї' => 'Ji',
112*13067778SAndreas Gohr    'ї' => 'ji',
113*13067778SAndreas Gohr
114*13067778SAndreas Gohr    // Georgian
115*13067778SAndreas Gohr    'ა' => 'a',
116*13067778SAndreas Gohr    'ბ' => 'b',
117*13067778SAndreas Gohr    'გ' => 'g',
118*13067778SAndreas Gohr    'დ' => 'd',
119*13067778SAndreas Gohr    'ე' => 'e',
120*13067778SAndreas Gohr    'ვ' => 'v',
121*13067778SAndreas Gohr    'ზ' => 'z',
122*13067778SAndreas Gohr    'თ' => 'th',
123*13067778SAndreas Gohr    'ი' => 'i',
124*13067778SAndreas Gohr    'კ' => 'p',
125*13067778SAndreas Gohr    'ლ' => 'l',
126*13067778SAndreas Gohr    'მ' => 'm',
127*13067778SAndreas Gohr    'ნ' => 'n',
128*13067778SAndreas Gohr    'ო' => 'o',
129*13067778SAndreas Gohr    'პ' => 'p',
130*13067778SAndreas Gohr    'ჟ' => 'zh',
131*13067778SAndreas Gohr    'რ' => 'r',
132*13067778SAndreas Gohr    'ს' => 's',
133*13067778SAndreas Gohr    'ტ' => 't',
134*13067778SAndreas Gohr    'უ' => 'u',
135*13067778SAndreas Gohr    'ფ' => 'ph',
136*13067778SAndreas Gohr    'ქ' => 'kh',
137*13067778SAndreas Gohr    'ღ' => 'gh',
138*13067778SAndreas Gohr    'ყ' => 'q',
139*13067778SAndreas Gohr    'შ' => 'sh',
140*13067778SAndreas Gohr    'ჩ' => 'ch',
141*13067778SAndreas Gohr    'ც' => 'c',
142*13067778SAndreas Gohr    'ძ' => 'dh',
143*13067778SAndreas Gohr    'წ' => 'w',
144*13067778SAndreas Gohr    'ჭ' => 'j',
145*13067778SAndreas Gohr    'ხ' => 'x',
146*13067778SAndreas Gohr    'ჯ' => 'jh',
147*13067778SAndreas Gohr    'ჰ' => 'xh',
148*13067778SAndreas Gohr
149*13067778SAndreas Gohr    //Sanskrit
150*13067778SAndreas Gohr    'अ' => 'a',
151*13067778SAndreas Gohr    'आ' => 'ah',
152*13067778SAndreas Gohr    'इ' => 'i',
153*13067778SAndreas Gohr    'ई' => 'ih',
154*13067778SAndreas Gohr    'उ' => 'u',
155*13067778SAndreas Gohr    'ऊ' => 'uh',
156*13067778SAndreas Gohr    'ऋ' => 'ry',
157*13067778SAndreas Gohr    'ॠ' => 'ryh',
158*13067778SAndreas Gohr    'ऌ' => 'ly',
159*13067778SAndreas Gohr    'ॡ' => 'lyh',
160*13067778SAndreas Gohr    'ए' => 'e',
161*13067778SAndreas Gohr    'ऐ' => 'ay',
162*13067778SAndreas Gohr    'ओ' => 'o',
163*13067778SAndreas Gohr    'औ' => 'aw',
164*13067778SAndreas Gohr    'अं' => 'amh',
165*13067778SAndreas Gohr    'अः' => 'aq',
166*13067778SAndreas Gohr    'क' => 'k',
167*13067778SAndreas Gohr    'ख' => 'kh',
168*13067778SAndreas Gohr    'ग' => 'g',
169*13067778SAndreas Gohr    'घ' => 'gh',
170*13067778SAndreas Gohr    'ङ' => 'nh',
171*13067778SAndreas Gohr    'च' => 'c',
172*13067778SAndreas Gohr    'छ' => 'ch',
173*13067778SAndreas Gohr    'ज' => 'j',
174*13067778SAndreas Gohr    'झ' => 'jh',
175*13067778SAndreas Gohr    'ञ' => 'ny',
176*13067778SAndreas Gohr    'ट' => 'tq',
177*13067778SAndreas Gohr    'ठ' => 'tqh',
178*13067778SAndreas Gohr    'ड' => 'dq',
179*13067778SAndreas Gohr    'ढ' => 'dqh',
180*13067778SAndreas Gohr    'ण' => 'nq',
181*13067778SAndreas Gohr    'त' => 't',
182*13067778SAndreas Gohr    'थ' => 'th',
183*13067778SAndreas Gohr    'द' => 'd',
184*13067778SAndreas Gohr    'ध' => 'dh',
185*13067778SAndreas Gohr    'न' => 'n',
186*13067778SAndreas Gohr    'प' => 'p',
187*13067778SAndreas Gohr    'फ' => 'ph',
188*13067778SAndreas Gohr    'ब' => 'b',
189*13067778SAndreas Gohr    'भ' => 'bh',
190*13067778SAndreas Gohr    'म' => 'm',
191*13067778SAndreas Gohr    'य' => 'z',
192*13067778SAndreas Gohr    'र' => 'r',
193*13067778SAndreas Gohr    'ल' => 'l',
194*13067778SAndreas Gohr    'व' => 'v',
195*13067778SAndreas Gohr    'श' => 'sh',
196*13067778SAndreas Gohr    'ष' => 'sqh',
197*13067778SAndreas Gohr    'स' => 's',
198*13067778SAndreas Gohr    'ह' => 'x',
199*13067778SAndreas Gohr
200*13067778SAndreas Gohr    //Sanskrit diacritics
201*13067778SAndreas Gohr    'Ā' => 'A',
202*13067778SAndreas Gohr    'Ī' => 'I',
203*13067778SAndreas Gohr    'Ū' => 'U',
204*13067778SAndreas Gohr    'Ṛ' => 'R',
205*13067778SAndreas Gohr    'Ṝ' => 'R',
206*13067778SAndreas Gohr    'Ṅ' => 'N',
207*13067778SAndreas Gohr    'Ñ' => 'N',
208*13067778SAndreas Gohr    'Ṭ' => 'T',
209*13067778SAndreas Gohr    'Ḍ' => 'D',
210*13067778SAndreas Gohr    'Ṇ' => 'N',
211*13067778SAndreas Gohr    'Ś' => 'S',
212*13067778SAndreas Gohr    'Ṣ' => 'S',
213*13067778SAndreas Gohr    'Ṁ' => 'M',
214*13067778SAndreas Gohr    'Ṃ' => 'M',
215*13067778SAndreas Gohr    'Ḥ' => 'H',
216*13067778SAndreas Gohr    'Ḷ' => 'L',
217*13067778SAndreas Gohr    'Ḹ' => 'L',
218*13067778SAndreas Gohr    'ā' => 'a',
219*13067778SAndreas Gohr    'ī' => 'i',
220*13067778SAndreas Gohr    'ū' => 'u',
221*13067778SAndreas Gohr    'ṛ' => 'r',
222*13067778SAndreas Gohr    'ṝ' => 'r',
223*13067778SAndreas Gohr    'ṅ' => 'n',
224*13067778SAndreas Gohr    'ñ' => 'n',
225*13067778SAndreas Gohr    'ṭ' => 't',
226*13067778SAndreas Gohr    'ḍ' => 'd',
227*13067778SAndreas Gohr    'ṇ' => 'n',
228*13067778SAndreas Gohr    'ś' => 's',
229*13067778SAndreas Gohr    'ṣ' => 's',
230*13067778SAndreas Gohr    'ṁ' => 'm',
231*13067778SAndreas Gohr    'ṃ' => 'm',
232*13067778SAndreas Gohr    'ḥ' => 'h',
233*13067778SAndreas Gohr    'ḷ' => 'l',
234*13067778SAndreas Gohr    'ḹ' => 'l',
235*13067778SAndreas Gohr
236*13067778SAndreas Gohr    //Hebrew
237*13067778SAndreas Gohr    'א' => 'a',
238*13067778SAndreas Gohr    'ב' => 'b',
239*13067778SAndreas Gohr    'ג' => 'g',
240*13067778SAndreas Gohr    'ד' => 'd',
241*13067778SAndreas Gohr    'ה' => 'h',
242*13067778SAndreas Gohr    'ו' => 'v',
243*13067778SAndreas Gohr    'ז' => 'z',
244*13067778SAndreas Gohr    'ח' => 'kh',
245*13067778SAndreas Gohr    'ט' => 'th',
246*13067778SAndreas Gohr    'י' => 'y',
247*13067778SAndreas Gohr    'ך' => 'h',
248*13067778SAndreas Gohr    'כ' => 'k',
249*13067778SAndreas Gohr    'ל' => 'l',
250*13067778SAndreas Gohr    'ם' => 'm',
251*13067778SAndreas Gohr    'מ' => 'm',
252*13067778SAndreas Gohr    'ן' => 'n',
253*13067778SAndreas Gohr    'נ' => 'n',
254*13067778SAndreas Gohr    'ס' => 's',
255*13067778SAndreas Gohr    'ע' => 'ah',
256*13067778SAndreas Gohr    'ף' => 'f',
257*13067778SAndreas Gohr    'פ' => 'p',
258*13067778SAndreas Gohr    'ץ' => 'c',
259*13067778SAndreas Gohr    'צ' => 'c',
260*13067778SAndreas Gohr    'ק' => 'q',
261*13067778SAndreas Gohr    'ר' => 'r',
262*13067778SAndreas Gohr    'ש' => 'sh',
263*13067778SAndreas Gohr    'ת' => 't',
264*13067778SAndreas Gohr
265*13067778SAndreas Gohr    //Arabic
266*13067778SAndreas Gohr    'ا' => 'a',
267*13067778SAndreas Gohr    'ب' => 'b',
268*13067778SAndreas Gohr    'ت' => 't',
269*13067778SAndreas Gohr    'ث' => 'th',
270*13067778SAndreas Gohr    'ج' => 'g',
271*13067778SAndreas Gohr    'ح' => 'xh',
272*13067778SAndreas Gohr    'خ' => 'x',
273*13067778SAndreas Gohr    'د' => 'd',
274*13067778SAndreas Gohr    'ذ' => 'dh',
275*13067778SAndreas Gohr    'ر' => 'r',
276*13067778SAndreas Gohr    'ز' => 'z',
277*13067778SAndreas Gohr    'س' => 's',
278*13067778SAndreas Gohr    'ش' => 'sh',
279*13067778SAndreas Gohr    'ص' => 's\'',
280*13067778SAndreas Gohr    'ض' => 'd\'',
281*13067778SAndreas Gohr    'ط' => 't\'',
282*13067778SAndreas Gohr    'ظ' => 'z\'',
283*13067778SAndreas Gohr    'ع' => 'y',
284*13067778SAndreas Gohr    'غ' => 'gh',
285*13067778SAndreas Gohr    'ف' => 'f',
286*13067778SAndreas Gohr    'ق' => 'q',
287*13067778SAndreas Gohr    'ك' => 'k',
288*13067778SAndreas Gohr    'ل' => 'l',
289*13067778SAndreas Gohr    'م' => 'm',
290*13067778SAndreas Gohr    'ن' => 'n',
291*13067778SAndreas Gohr    'ه' => 'x\'',
292*13067778SAndreas Gohr    'و' => 'u',
293*13067778SAndreas Gohr    'ي' => 'i',
294*13067778SAndreas Gohr
295*13067778SAndreas Gohr    // Japanese characters  (last update: 2008-05-09)
296*13067778SAndreas Gohr
297*13067778SAndreas Gohr    // Japanese hiragana
298*13067778SAndreas Gohr
299*13067778SAndreas Gohr    // 3 character syllables, っ doubles the consonant after
300*13067778SAndreas Gohr    'っちゃ' => 'ccha',
301*13067778SAndreas Gohr    'っちぇ' => 'cche',
302*13067778SAndreas Gohr    'っちょ' => 'ccho',
303*13067778SAndreas Gohr    'っちゅ' => 'cchu',
304*13067778SAndreas Gohr    'っびゃ' => 'bbya',
305*13067778SAndreas Gohr    'っびぇ' => 'bbye',
306*13067778SAndreas Gohr    'っびぃ' => 'bbyi',
307*13067778SAndreas Gohr    'っびょ' => 'bbyo',
308*13067778SAndreas Gohr    'っびゅ' => 'bbyu',
309*13067778SAndreas Gohr    'っぴゃ' => 'ppya',
310*13067778SAndreas Gohr    'っぴぇ' => 'ppye',
311*13067778SAndreas Gohr    'っぴぃ' => 'ppyi',
312*13067778SAndreas Gohr    'っぴょ' => 'ppyo',
313*13067778SAndreas Gohr    'っぴゅ' => 'ppyu',
314*13067778SAndreas Gohr    'っちゃ' => 'ccha',
315*13067778SAndreas Gohr    'っちぇ' => 'cche',
316*13067778SAndreas Gohr    'っち' => 'cchi',
317*13067778SAndreas Gohr    'っちょ' => 'ccho',
318*13067778SAndreas Gohr    'っちゅ' => 'cchu',
319*13067778SAndreas Gohr    // 'っひゃ'=>'hya',
320*13067778SAndreas Gohr    // 'っひぇ'=>'hye',
321*13067778SAndreas Gohr    // 'っひぃ'=>'hyi',
322*13067778SAndreas Gohr    // 'っひょ'=>'hyo',
323*13067778SAndreas Gohr    // 'っひゅ'=>'hyu',
324*13067778SAndreas Gohr    'っきゃ' => 'kkya',
325*13067778SAndreas Gohr    'っきぇ' => 'kkye',
326*13067778SAndreas Gohr    'っきぃ' => 'kkyi',
327*13067778SAndreas Gohr    'っきょ' => 'kkyo',
328*13067778SAndreas Gohr    'っきゅ' => 'kkyu',
329*13067778SAndreas Gohr    'っぎゃ' => 'ggya',
330*13067778SAndreas Gohr    'っぎぇ' => 'ggye',
331*13067778SAndreas Gohr    'っぎぃ' => 'ggyi',
332*13067778SAndreas Gohr    'っぎょ' => 'ggyo',
333*13067778SAndreas Gohr    'っぎゅ' => 'ggyu',
334*13067778SAndreas Gohr    'っみゃ' => 'mmya',
335*13067778SAndreas Gohr    'っみぇ' => 'mmye',
336*13067778SAndreas Gohr    'っみぃ' => 'mmyi',
337*13067778SAndreas Gohr    'っみょ' => 'mmyo',
338*13067778SAndreas Gohr    'っみゅ' => 'mmyu',
339*13067778SAndreas Gohr    'っにゃ' => 'nnya',
340*13067778SAndreas Gohr    'っにぇ' => 'nnye',
341*13067778SAndreas Gohr    'っにぃ' => 'nnyi',
342*13067778SAndreas Gohr    'っにょ' => 'nnyo',
343*13067778SAndreas Gohr    'っにゅ' => 'nnyu',
344*13067778SAndreas Gohr    'っりゃ' => 'rrya',
345*13067778SAndreas Gohr    'っりぇ' => 'rrye',
346*13067778SAndreas Gohr    'っりぃ' => 'rryi',
347*13067778SAndreas Gohr    'っりょ' => 'rryo',
348*13067778SAndreas Gohr    'っりゅ' => 'rryu',
349*13067778SAndreas Gohr    'っしゃ' => 'ssha',
350*13067778SAndreas Gohr    'っしぇ' => 'sshe',
351*13067778SAndreas Gohr    'っし' => 'sshi',
352*13067778SAndreas Gohr    'っしょ' => 'ssho',
353*13067778SAndreas Gohr    'っしゅ' => 'sshu',
354*13067778SAndreas Gohr
355*13067778SAndreas Gohr    // separate hiragana 'n' ('n' + 'i' != 'ni', normally we would write "kon'nichi wa" but the
356*13067778SAndreas Gohr    // apostrophe would be converted to _ anyway)
357*13067778SAndreas Gohr    'んあ' => 'n_a',
358*13067778SAndreas Gohr    'んえ' => 'n_e',
359*13067778SAndreas Gohr    'んい' => 'n_i',
360*13067778SAndreas Gohr    'んお' => 'n_o',
361*13067778SAndreas Gohr    'んう' => 'n_u',
362*13067778SAndreas Gohr    'んや' => 'n_ya',
363*13067778SAndreas Gohr    'んよ' => 'n_yo',
364*13067778SAndreas Gohr    'んゆ' => 'n_yu',
365*13067778SAndreas Gohr
366*13067778SAndreas Gohr    // 2 character syllables - normal
367*13067778SAndreas Gohr    'ふぁ' => 'fa',
368*13067778SAndreas Gohr    'ふぇ' => 'fe',
369*13067778SAndreas Gohr    'ふぃ' => 'fi',
370*13067778SAndreas Gohr    'ふぉ' => 'fo',
371*13067778SAndreas Gohr    'ちゃ' => 'cha',
372*13067778SAndreas Gohr    'ちぇ' => 'che',
373*13067778SAndreas Gohr    'ち' => 'chi',
374*13067778SAndreas Gohr    'ちょ' => 'cho',
375*13067778SAndreas Gohr    'ちゅ' => 'chu',
376*13067778SAndreas Gohr    'ひゃ' => 'hya',
377*13067778SAndreas Gohr    'ひぇ' => 'hye',
378*13067778SAndreas Gohr    'ひぃ' => 'hyi',
379*13067778SAndreas Gohr    'ひょ' => 'hyo',
380*13067778SAndreas Gohr    'ひゅ' => 'hyu',
381*13067778SAndreas Gohr    'びゃ' => 'bya',
382*13067778SAndreas Gohr    'びぇ' => 'bye',
383*13067778SAndreas Gohr    'びぃ' => 'byi',
384*13067778SAndreas Gohr    'びょ' => 'byo',
385*13067778SAndreas Gohr    'びゅ' => 'byu',
386*13067778SAndreas Gohr    'ぴゃ' => 'pya',
387*13067778SAndreas Gohr    'ぴぇ' => 'pye',
388*13067778SAndreas Gohr    'ぴぃ' => 'pyi',
389*13067778SAndreas Gohr    'ぴょ' => 'pyo',
390*13067778SAndreas Gohr    'ぴゅ' => 'pyu',
391*13067778SAndreas Gohr    'きゃ' => 'kya',
392*13067778SAndreas Gohr    'きぇ' => 'kye',
393*13067778SAndreas Gohr    'きぃ' => 'kyi',
394*13067778SAndreas Gohr    'きょ' => 'kyo',
395*13067778SAndreas Gohr    'きゅ' => 'kyu',
396*13067778SAndreas Gohr    'ぎゃ' => 'gya',
397*13067778SAndreas Gohr    'ぎぇ' => 'gye',
398*13067778SAndreas Gohr    'ぎぃ' => 'gyi',
399*13067778SAndreas Gohr    'ぎょ' => 'gyo',
400*13067778SAndreas Gohr    'ぎゅ' => 'gyu',
401*13067778SAndreas Gohr    'みゃ' => 'mya',
402*13067778SAndreas Gohr    'みぇ' => 'mye',
403*13067778SAndreas Gohr    'みぃ' => 'myi',
404*13067778SAndreas Gohr    'みょ' => 'myo',
405*13067778SAndreas Gohr    'みゅ' => 'myu',
406*13067778SAndreas Gohr    'にゃ' => 'nya',
407*13067778SAndreas Gohr    'にぇ' => 'nye',
408*13067778SAndreas Gohr    'にぃ' => 'nyi',
409*13067778SAndreas Gohr    'にょ' => 'nyo',
410*13067778SAndreas Gohr    'にゅ' => 'nyu',
411*13067778SAndreas Gohr    'りゃ' => 'rya',
412*13067778SAndreas Gohr    'りぇ' => 'rye',
413*13067778SAndreas Gohr    'りぃ' => 'ryi',
414*13067778SAndreas Gohr    'りょ' => 'ryo',
415*13067778SAndreas Gohr    'りゅ' => 'ryu',
416*13067778SAndreas Gohr    'しゃ' => 'sha',
417*13067778SAndreas Gohr    'しぇ' => 'she',
418*13067778SAndreas Gohr    'し' => 'shi',
419*13067778SAndreas Gohr    'しょ' => 'sho',
420*13067778SAndreas Gohr    'しゅ' => 'shu',
421*13067778SAndreas Gohr    'じゃ' => 'ja',
422*13067778SAndreas Gohr    'じぇ' => 'je',
423*13067778SAndreas Gohr    'じょ' => 'jo',
424*13067778SAndreas Gohr    'じゅ' => 'ju',
425*13067778SAndreas Gohr    'うぇ' => 'we',
426*13067778SAndreas Gohr    'うぃ' => 'wi',
427*13067778SAndreas Gohr    'いぇ' => 'ye',
428*13067778SAndreas Gohr
429*13067778SAndreas Gohr    // 2 character syllables, っ doubles the consonant after
430*13067778SAndreas Gohr    'っば' => 'bba',
431*13067778SAndreas Gohr    'っべ' => 'bbe',
432*13067778SAndreas Gohr    'っび' => 'bbi',
433*13067778SAndreas Gohr    'っぼ' => 'bbo',
434*13067778SAndreas Gohr    'っぶ' => 'bbu',
435*13067778SAndreas Gohr    'っぱ' => 'ppa',
436*13067778SAndreas Gohr    'っぺ' => 'ppe',
437*13067778SAndreas Gohr    'っぴ' => 'ppi',
438*13067778SAndreas Gohr    'っぽ' => 'ppo',
439*13067778SAndreas Gohr    'っぷ' => 'ppu',
440*13067778SAndreas Gohr    'った' => 'tta',
441*13067778SAndreas Gohr    'って' => 'tte',
442*13067778SAndreas Gohr    'っち' => 'cchi',
443*13067778SAndreas Gohr    'っと' => 'tto',
444*13067778SAndreas Gohr    'っつ' => 'ttsu',
445*13067778SAndreas Gohr    'っだ' => 'dda',
446*13067778SAndreas Gohr    'っで' => 'dde',
447*13067778SAndreas Gohr    'っぢ' => 'ddi',
448*13067778SAndreas Gohr    'っど' => 'ddo',
449*13067778SAndreas Gohr    'っづ' => 'ddu',
450*13067778SAndreas Gohr    'っが' => 'gga',
451*13067778SAndreas Gohr    'っげ' => 'gge',
452*13067778SAndreas Gohr    'っぎ' => 'ggi',
453*13067778SAndreas Gohr    'っご' => 'ggo',
454*13067778SAndreas Gohr    'っぐ' => 'ggu',
455*13067778SAndreas Gohr    'っか' => 'kka',
456*13067778SAndreas Gohr    'っけ' => 'kke',
457*13067778SAndreas Gohr    'っき' => 'kki',
458*13067778SAndreas Gohr    'っこ' => 'kko',
459*13067778SAndreas Gohr    'っく' => 'kku',
460*13067778SAndreas Gohr    'っま' => 'mma',
461*13067778SAndreas Gohr    'っめ' => 'mme',
462*13067778SAndreas Gohr    'っみ' => 'mmi',
463*13067778SAndreas Gohr    'っも' => 'mmo',
464*13067778SAndreas Gohr    'っむ' => 'mmu',
465*13067778SAndreas Gohr    'っな' => 'nna',
466*13067778SAndreas Gohr    'っね' => 'nne',
467*13067778SAndreas Gohr    'っに' => 'nni',
468*13067778SAndreas Gohr    'っの' => 'nno',
469*13067778SAndreas Gohr    'っぬ' => 'nnu',
470*13067778SAndreas Gohr    'っら' => 'rra',
471*13067778SAndreas Gohr    'っれ' => 'rre',
472*13067778SAndreas Gohr    'っり' => 'rri',
473*13067778SAndreas Gohr    'っろ' => 'rro',
474*13067778SAndreas Gohr    'っる' => 'rru',
475*13067778SAndreas Gohr    'っさ' => 'ssa',
476*13067778SAndreas Gohr    'っせ' => 'sse',
477*13067778SAndreas Gohr    'っし' => 'sshi',
478*13067778SAndreas Gohr    'っそ' => 'sso',
479*13067778SAndreas Gohr    'っす' => 'ssu',
480*13067778SAndreas Gohr    'っざ' => 'zza',
481*13067778SAndreas Gohr    'っぜ' => 'zze',
482*13067778SAndreas Gohr    'っじ' => 'jji',
483*13067778SAndreas Gohr    'っぞ' => 'zzo',
484*13067778SAndreas Gohr    'っず' => 'zzu',
485*13067778SAndreas Gohr
486*13067778SAndreas Gohr    // 1 character syllables
487*13067778SAndreas Gohr    'あ' => 'a',
488*13067778SAndreas Gohr    'え' => 'e',
489*13067778SAndreas Gohr    'い' => 'i',
490*13067778SAndreas Gohr    'お' => 'o',
491*13067778SAndreas Gohr    'う' => 'u',
492*13067778SAndreas Gohr    'ん' => 'n',
493*13067778SAndreas Gohr    'は' => 'ha',
494*13067778SAndreas Gohr    'へ' => 'he',
495*13067778SAndreas Gohr    'ひ' => 'hi',
496*13067778SAndreas Gohr    'ほ' => 'ho',
497*13067778SAndreas Gohr    'ふ' => 'fu',
498*13067778SAndreas Gohr    'ば' => 'ba',
499*13067778SAndreas Gohr    'べ' => 'be',
500*13067778SAndreas Gohr    'び' => 'bi',
501*13067778SAndreas Gohr    'ぼ' => 'bo',
502*13067778SAndreas Gohr    'ぶ' => 'bu',
503*13067778SAndreas Gohr    'ぱ' => 'pa',
504*13067778SAndreas Gohr    'ぺ' => 'pe',
505*13067778SAndreas Gohr    'ぴ' => 'pi',
506*13067778SAndreas Gohr    'ぽ' => 'po',
507*13067778SAndreas Gohr    'ぷ' => 'pu',
508*13067778SAndreas Gohr    'た' => 'ta',
509*13067778SAndreas Gohr    'て' => 'te',
510*13067778SAndreas Gohr    'ち' => 'chi',
511*13067778SAndreas Gohr    'と' => 'to',
512*13067778SAndreas Gohr    'つ' => 'tsu',
513*13067778SAndreas Gohr    'だ' => 'da',
514*13067778SAndreas Gohr    'で' => 'de',
515*13067778SAndreas Gohr    'ぢ' => 'di',
516*13067778SAndreas Gohr    'ど' => 'do',
517*13067778SAndreas Gohr    'づ' => 'du',
518*13067778SAndreas Gohr    'が' => 'ga',
519*13067778SAndreas Gohr    'げ' => 'ge',
520*13067778SAndreas Gohr    'ぎ' => 'gi',
521*13067778SAndreas Gohr    'ご' => 'go',
522*13067778SAndreas Gohr    'ぐ' => 'gu',
523*13067778SAndreas Gohr    'か' => 'ka',
524*13067778SAndreas Gohr    'け' => 'ke',
525*13067778SAndreas Gohr    'き' => 'ki',
526*13067778SAndreas Gohr    'こ' => 'ko',
527*13067778SAndreas Gohr    'く' => 'ku',
528*13067778SAndreas Gohr    'ま' => 'ma',
529*13067778SAndreas Gohr    'め' => 'me',
530*13067778SAndreas Gohr    'み' => 'mi',
531*13067778SAndreas Gohr    'も' => 'mo',
532*13067778SAndreas Gohr    'む' => 'mu',
533*13067778SAndreas Gohr    'な' => 'na',
534*13067778SAndreas Gohr    'ね' => 'ne',
535*13067778SAndreas Gohr    'に' => 'ni',
536*13067778SAndreas Gohr    'の' => 'no',
537*13067778SAndreas Gohr    'ぬ' => 'nu',
538*13067778SAndreas Gohr    'ら' => 'ra',
539*13067778SAndreas Gohr    'れ' => 're',
540*13067778SAndreas Gohr    'り' => 'ri',
541*13067778SAndreas Gohr    'ろ' => 'ro',
542*13067778SAndreas Gohr    'る' => 'ru',
543*13067778SAndreas Gohr    'さ' => 'sa',
544*13067778SAndreas Gohr    'せ' => 'se',
545*13067778SAndreas Gohr    'し' => 'shi',
546*13067778SAndreas Gohr    'そ' => 'so',
547*13067778SAndreas Gohr    'す' => 'su',
548*13067778SAndreas Gohr    'わ' => 'wa',
549*13067778SAndreas Gohr    'を' => 'wo',
550*13067778SAndreas Gohr    'ざ' => 'za',
551*13067778SAndreas Gohr    'ぜ' => 'ze',
552*13067778SAndreas Gohr    'じ' => 'ji',
553*13067778SAndreas Gohr    'ぞ' => 'zo',
554*13067778SAndreas Gohr    'ず' => 'zu',
555*13067778SAndreas Gohr    'や' => 'ya',
556*13067778SAndreas Gohr    'よ' => 'yo',
557*13067778SAndreas Gohr    'ゆ' => 'yu',
558*13067778SAndreas Gohr    // old characters
559*13067778SAndreas Gohr    'ゑ' => 'we',
560*13067778SAndreas Gohr    'ゐ' => 'wi',
561*13067778SAndreas Gohr
562*13067778SAndreas Gohr    //  convert what's left (probably only kicks in when something's missing above)
563*13067778SAndreas Gohr    // 'ぁ'=>'a','ぇ'=>'e','ぃ'=>'i','ぉ'=>'o','ぅ'=>'u',
564*13067778SAndreas Gohr    // 'ゃ'=>'ya','ょ'=>'yo','ゅ'=>'yu',
565*13067778SAndreas Gohr
566*13067778SAndreas Gohr    // never seen one of those (disabled for the moment)
567*13067778SAndreas Gohr    // 'ヴぁ'=>'va','ヴぇ'=>'ve','ヴぃ'=>'vi','ヴぉ'=>'vo','ヴ'=>'vu',
568*13067778SAndreas Gohr    // 'でゃ'=>'dha','でぇ'=>'dhe','でぃ'=>'dhi','でょ'=>'dho','でゅ'=>'dhu',
569*13067778SAndreas Gohr    // 'どぁ'=>'dwa','どぇ'=>'dwe','どぃ'=>'dwi','どぉ'=>'dwo','どぅ'=>'dwu',
570*13067778SAndreas Gohr    // 'ぢゃ'=>'dya','ぢぇ'=>'dye','ぢぃ'=>'dyi','ぢょ'=>'dyo','ぢゅ'=>'dyu',
571*13067778SAndreas Gohr    // 'ふぁ'=>'fwa','ふぇ'=>'fwe','ふぃ'=>'fwi','ふぉ'=>'fwo','ふぅ'=>'fwu',
572*13067778SAndreas Gohr    // 'ふゃ'=>'fya','ふぇ'=>'fye','ふぃ'=>'fyi','ふょ'=>'fyo','ふゅ'=>'fyu',
573*13067778SAndreas Gohr    // 'すぁ'=>'swa','すぇ'=>'swe','すぃ'=>'swi','すぉ'=>'swo','すぅ'=>'swu',
574*13067778SAndreas Gohr    // 'てゃ'=>'tha','てぇ'=>'the','てぃ'=>'thi','てょ'=>'tho','てゅ'=>'thu',
575*13067778SAndreas Gohr    // 'つゃ'=>'tsa','つぇ'=>'tse','つぃ'=>'tsi','つょ'=>'tso','つ'=>'tsu',
576*13067778SAndreas Gohr    // 'とぁ'=>'twa','とぇ'=>'twe','とぃ'=>'twi','とぉ'=>'two','とぅ'=>'twu',
577*13067778SAndreas Gohr    // 'ヴゃ'=>'vya','ヴぇ'=>'vye','ヴぃ'=>'vyi','ヴょ'=>'vyo','ヴゅ'=>'vyu',
578*13067778SAndreas Gohr    // 'うぁ'=>'wha','うぇ'=>'whe','うぃ'=>'whi','うぉ'=>'who','うぅ'=>'whu',
579*13067778SAndreas Gohr    // 'じゃ'=>'zha','じぇ'=>'zhe','じぃ'=>'zhi','じょ'=>'zho','じゅ'=>'zhu',
580*13067778SAndreas Gohr    // 'じゃ'=>'zya','じぇ'=>'zye','じぃ'=>'zyi','じょ'=>'zyo','じゅ'=>'zyu',
581*13067778SAndreas Gohr
582*13067778SAndreas Gohr    // 'spare' characters from other romanization systems
583*13067778SAndreas Gohr    // 'だ'=>'da','で'=>'de','ぢ'=>'di','ど'=>'do','づ'=>'du',
584*13067778SAndreas Gohr    // 'ら'=>'la','れ'=>'le','り'=>'li','ろ'=>'lo','る'=>'lu',
585*13067778SAndreas Gohr    // 'さ'=>'sa','せ'=>'se','し'=>'si','そ'=>'so','す'=>'su',
586*13067778SAndreas Gohr    // 'ちゃ'=>'cya','ちぇ'=>'cye','ちぃ'=>'cyi','ちょ'=>'cyo','ちゅ'=>'cyu',
587*13067778SAndreas Gohr    //'じゃ'=>'jya','じぇ'=>'jye','じぃ'=>'jyi','じょ'=>'jyo','じゅ'=>'jyu',
588*13067778SAndreas Gohr    //'りゃ'=>'lya','りぇ'=>'lye','りぃ'=>'lyi','りょ'=>'lyo','りゅ'=>'lyu',
589*13067778SAndreas Gohr    //'しゃ'=>'sya','しぇ'=>'sye','しぃ'=>'syi','しょ'=>'syo','しゅ'=>'syu',
590*13067778SAndreas Gohr    //'ちゃ'=>'tya','ちぇ'=>'tye','ちぃ'=>'tyi','ちょ'=>'tyo','ちゅ'=>'tyu',
591*13067778SAndreas Gohr    //'し'=>'ci','い'=>'yi','ぢ'=>'dzi',
592*13067778SAndreas Gohr    //'っじゃ'=>'jja','っじぇ'=>'jje','っじ'=>'jji','っじょ'=>'jjo','っじゅ'=>'jju',
593*13067778SAndreas Gohr
594*13067778SAndreas Gohr
595*13067778SAndreas Gohr    // Japanese katakana
596*13067778SAndreas Gohr
597*13067778SAndreas Gohr    // 4 character syllables: ッ doubles the consonant after, ー doubles the vowel before
598*13067778SAndreas Gohr    // (usually written with macron, but we don't want that in our URLs)
599*13067778SAndreas Gohr    'ッビャー' => 'bbyaa',
600*13067778SAndreas Gohr    'ッビェー' => 'bbyee',
601*13067778SAndreas Gohr    'ッビィー' => 'bbyii',
602*13067778SAndreas Gohr    'ッビョー' => 'bbyoo',
603*13067778SAndreas Gohr    'ッビュー' => 'bbyuu',
604*13067778SAndreas Gohr    'ッピャー' => 'ppyaa',
605*13067778SAndreas Gohr    'ッピェー' => 'ppyee',
606*13067778SAndreas Gohr    'ッピィー' => 'ppyii',
607*13067778SAndreas Gohr    'ッピョー' => 'ppyoo',
608*13067778SAndreas Gohr    'ッピュー' => 'ppyuu',
609*13067778SAndreas Gohr    'ッキャー' => 'kkyaa',
610*13067778SAndreas Gohr    'ッキェー' => 'kkyee',
611*13067778SAndreas Gohr    'ッキィー' => 'kkyii',
612*13067778SAndreas Gohr    'ッキョー' => 'kkyoo',
613*13067778SAndreas Gohr    'ッキュー' => 'kkyuu',
614*13067778SAndreas Gohr    'ッギャー' => 'ggyaa',
615*13067778SAndreas Gohr    'ッギェー' => 'ggyee',
616*13067778SAndreas Gohr    'ッギィー' => 'ggyii',
617*13067778SAndreas Gohr    'ッギョー' => 'ggyoo',
618*13067778SAndreas Gohr    'ッギュー' => 'ggyuu',
619*13067778SAndreas Gohr    'ッミャー' => 'mmyaa',
620*13067778SAndreas Gohr    'ッミェー' => 'mmyee',
621*13067778SAndreas Gohr    'ッミィー' => 'mmyii',
622*13067778SAndreas Gohr    'ッミョー' => 'mmyoo',
623*13067778SAndreas Gohr    'ッミュー' => 'mmyuu',
624*13067778SAndreas Gohr    'ッニャー' => 'nnyaa',
625*13067778SAndreas Gohr    'ッニェー' => 'nnyee',
626*13067778SAndreas Gohr    'ッニィー' => 'nnyii',
627*13067778SAndreas Gohr    'ッニョー' => 'nnyoo',
628*13067778SAndreas Gohr    'ッニュー' => 'nnyuu',
629*13067778SAndreas Gohr    'ッリャー' => 'rryaa',
630*13067778SAndreas Gohr    'ッリェー' => 'rryee',
631*13067778SAndreas Gohr    'ッリィー' => 'rryii',
632*13067778SAndreas Gohr    'ッリョー' => 'rryoo',
633*13067778SAndreas Gohr    'ッリュー' => 'rryuu',
634*13067778SAndreas Gohr    'ッシャー' => 'sshaa',
635*13067778SAndreas Gohr    'ッシェー' => 'sshee',
636*13067778SAndreas Gohr    'ッシー' => 'sshii',
637*13067778SAndreas Gohr    'ッショー' => 'sshoo',
638*13067778SAndreas Gohr    'ッシュー' => 'sshuu',
639*13067778SAndreas Gohr    'ッチャー' => 'cchaa',
640*13067778SAndreas Gohr    'ッチェー' => 'cchee',
641*13067778SAndreas Gohr    'ッチー' => 'cchii',
642*13067778SAndreas Gohr    'ッチョー' => 'cchoo',
643*13067778SAndreas Gohr    'ッチュー' => 'cchuu',
644*13067778SAndreas Gohr    'ッティー' => 'ttii',
645*13067778SAndreas Gohr    'ッヂィー' => 'ddii',
646*13067778SAndreas Gohr
647*13067778SAndreas Gohr    // 3 character syllables - doubled vowels
648*13067778SAndreas Gohr    'ファー' => 'faa',
649*13067778SAndreas Gohr    'フェー' => 'fee',
650*13067778SAndreas Gohr    'フィー' => 'fii',
651*13067778SAndreas Gohr    'フォー' => 'foo',
652*13067778SAndreas Gohr    'フャー' => 'fyaa',
653*13067778SAndreas Gohr    'フェー' => 'fyee',
654*13067778SAndreas Gohr    'フィー' => 'fyii',
655*13067778SAndreas Gohr    'フョー' => 'fyoo',
656*13067778SAndreas Gohr    'フュー' => 'fyuu',
657*13067778SAndreas Gohr    'ヒャー' => 'hyaa',
658*13067778SAndreas Gohr    'ヒェー' => 'hyee',
659*13067778SAndreas Gohr    'ヒィー' => 'hyii',
660*13067778SAndreas Gohr    'ヒョー' => 'hyoo',
661*13067778SAndreas Gohr    'ヒュー' => 'hyuu',
662*13067778SAndreas Gohr    'ビャー' => 'byaa',
663*13067778SAndreas Gohr    'ビェー' => 'byee',
664*13067778SAndreas Gohr    'ビィー' => 'byii',
665*13067778SAndreas Gohr    'ビョー' => 'byoo',
666*13067778SAndreas Gohr    'ビュー' => 'byuu',
667*13067778SAndreas Gohr    'ピャー' => 'pyaa',
668*13067778SAndreas Gohr    'ピェー' => 'pyee',
669*13067778SAndreas Gohr    'ピィー' => 'pyii',
670*13067778SAndreas Gohr    'ピョー' => 'pyoo',
671*13067778SAndreas Gohr    'ピュー' => 'pyuu',
672*13067778SAndreas Gohr    'キャー' => 'kyaa',
673*13067778SAndreas Gohr    'キェー' => 'kyee',
674*13067778SAndreas Gohr    'キィー' => 'kyii',
675*13067778SAndreas Gohr    'キョー' => 'kyoo',
676*13067778SAndreas Gohr    'キュー' => 'kyuu',
677*13067778SAndreas Gohr    'ギャー' => 'gyaa',
678*13067778SAndreas Gohr    'ギェー' => 'gyee',
679*13067778SAndreas Gohr    'ギィー' => 'gyii',
680*13067778SAndreas Gohr    'ギョー' => 'gyoo',
681*13067778SAndreas Gohr    'ギュー' => 'gyuu',
682*13067778SAndreas Gohr    'ミャー' => 'myaa',
683*13067778SAndreas Gohr    'ミェー' => 'myee',
684*13067778SAndreas Gohr    'ミィー' => 'myii',
685*13067778SAndreas Gohr    'ミョー' => 'myoo',
686*13067778SAndreas Gohr    'ミュー' => 'myuu',
687*13067778SAndreas Gohr    'ニャー' => 'nyaa',
688*13067778SAndreas Gohr    'ニェー' => 'nyee',
689*13067778SAndreas Gohr    'ニィー' => 'nyii',
690*13067778SAndreas Gohr    'ニョー' => 'nyoo',
691*13067778SAndreas Gohr    'ニュー' => 'nyuu',
692*13067778SAndreas Gohr    'リャー' => 'ryaa',
693*13067778SAndreas Gohr    'リェー' => 'ryee',
694*13067778SAndreas Gohr    'リィー' => 'ryii',
695*13067778SAndreas Gohr    'リョー' => 'ryoo',
696*13067778SAndreas Gohr    'リュー' => 'ryuu',
697*13067778SAndreas Gohr    'シャー' => 'shaa',
698*13067778SAndreas Gohr    'シェー' => 'shee',
699*13067778SAndreas Gohr    'シー' => 'shii',
700*13067778SAndreas Gohr    'ショー' => 'shoo',
701*13067778SAndreas Gohr    'シュー' => 'shuu',
702*13067778SAndreas Gohr    'ジャー' => 'jaa',
703*13067778SAndreas Gohr    'ジェー' => 'jee',
704*13067778SAndreas Gohr    'ジー' => 'jii',
705*13067778SAndreas Gohr    'ジョー' => 'joo',
706*13067778SAndreas Gohr    'ジュー' => 'juu',
707*13067778SAndreas Gohr    'スァー' => 'swaa',
708*13067778SAndreas Gohr    'スェー' => 'swee',
709*13067778SAndreas Gohr    'スィー' => 'swii',
710*13067778SAndreas Gohr    'スォー' => 'swoo',
711*13067778SAndreas Gohr    'スゥー' => 'swuu',
712*13067778SAndreas Gohr    'デァー' => 'daa',
713*13067778SAndreas Gohr    'デェー' => 'dee',
714*13067778SAndreas Gohr    'ディー' => 'dii',
715*13067778SAndreas Gohr    'デォー' => 'doo',
716*13067778SAndreas Gohr    'デゥー' => 'duu',
717*13067778SAndreas Gohr    'チャー' => 'chaa',
718*13067778SAndreas Gohr    'チェー' => 'chee',
719*13067778SAndreas Gohr    'チー' => 'chii',
720*13067778SAndreas Gohr    'チョー' => 'choo',
721*13067778SAndreas Gohr    'チュー' => 'chuu',
722*13067778SAndreas Gohr    'ヂャー' => 'dyaa',
723*13067778SAndreas Gohr    'ヂェー' => 'dyee',
724*13067778SAndreas Gohr    'ヂィー' => 'dyii',
725*13067778SAndreas Gohr    'ヂョー' => 'dyoo',
726*13067778SAndreas Gohr    'ヂュー' => 'dyuu',
727*13067778SAndreas Gohr    'ツャー' => 'tsaa',
728*13067778SAndreas Gohr    'ツェー' => 'tsee',
729*13067778SAndreas Gohr    'ツィー' => 'tsii',
730*13067778SAndreas Gohr    'ツョー' => 'tsoo',
731*13067778SAndreas Gohr    'ツー' => 'tsuu',
732*13067778SAndreas Gohr    'トァー' => 'twaa',
733*13067778SAndreas Gohr    'トェー' => 'twee',
734*13067778SAndreas Gohr    'トィー' => 'twii',
735*13067778SAndreas Gohr    'トォー' => 'twoo',
736*13067778SAndreas Gohr    'トゥー' => 'twuu',
737*13067778SAndreas Gohr    'ドァー' => 'dwaa',
738*13067778SAndreas Gohr    'ドェー' => 'dwee',
739*13067778SAndreas Gohr    'ドィー' => 'dwii',
740*13067778SAndreas Gohr    'ドォー' => 'dwoo',
741*13067778SAndreas Gohr    'ドゥー' => 'dwuu',
742*13067778SAndreas Gohr    'ウァー' => 'whaa',
743*13067778SAndreas Gohr    'ウェー' => 'whee',
744*13067778SAndreas Gohr    'ウィー' => 'whii',
745*13067778SAndreas Gohr    'ウォー' => 'whoo',
746*13067778SAndreas Gohr    'ウゥー' => 'whuu',
747*13067778SAndreas Gohr    'ヴャー' => 'vyaa',
748*13067778SAndreas Gohr    'ヴェー' => 'vyee',
749*13067778SAndreas Gohr    'ヴィー' => 'vyii',
750*13067778SAndreas Gohr    'ヴョー' => 'vyoo',
751*13067778SAndreas Gohr    'ヴュー' => 'vyuu',
752*13067778SAndreas Gohr    'ヴァー' => 'vaa',
753*13067778SAndreas Gohr    'ヴェー' => 'vee',
754*13067778SAndreas Gohr    'ヴィー' => 'vii',
755*13067778SAndreas Gohr    'ヴォー' => 'voo',
756*13067778SAndreas Gohr    'ヴー' => 'vuu',
757*13067778SAndreas Gohr    'ウェー' => 'wee',
758*13067778SAndreas Gohr    'ウィー' => 'wii',
759*13067778SAndreas Gohr    'イェー' => 'yee',
760*13067778SAndreas Gohr    'ティー' => 'tii',
761*13067778SAndreas Gohr    'ヂィー' => 'dii',
762*13067778SAndreas Gohr
763*13067778SAndreas Gohr    // 3 character syllables - doubled consonants
764*13067778SAndreas Gohr    'ッビャ' => 'bbya',
765*13067778SAndreas Gohr    'ッビェ' => 'bbye',
766*13067778SAndreas Gohr    'ッビィ' => 'bbyi',
767*13067778SAndreas Gohr    'ッビョ' => 'bbyo',
768*13067778SAndreas Gohr    'ッビュ' => 'bbyu',
769*13067778SAndreas Gohr    'ッピャ' => 'ppya',
770*13067778SAndreas Gohr    'ッピェ' => 'ppye',
771*13067778SAndreas Gohr    'ッピィ' => 'ppyi',
772*13067778SAndreas Gohr    'ッピョ' => 'ppyo',
773*13067778SAndreas Gohr    'ッピュ' => 'ppyu',
774*13067778SAndreas Gohr    'ッキャ' => 'kkya',
775*13067778SAndreas Gohr    'ッキェ' => 'kkye',
776*13067778SAndreas Gohr    'ッキィ' => 'kkyi',
777*13067778SAndreas Gohr    'ッキョ' => 'kkyo',
778*13067778SAndreas Gohr    'ッキュ' => 'kkyu',
779*13067778SAndreas Gohr    'ッギャ' => 'ggya',
780*13067778SAndreas Gohr    'ッギェ' => 'ggye',
781*13067778SAndreas Gohr    'ッギィ' => 'ggyi',
782*13067778SAndreas Gohr    'ッギョ' => 'ggyo',
783*13067778SAndreas Gohr    'ッギュ' => 'ggyu',
784*13067778SAndreas Gohr    'ッミャ' => 'mmya',
785*13067778SAndreas Gohr    'ッミェ' => 'mmye',
786*13067778SAndreas Gohr    'ッミィ' => 'mmyi',
787*13067778SAndreas Gohr    'ッミョ' => 'mmyo',
788*13067778SAndreas Gohr    'ッミュ' => 'mmyu',
789*13067778SAndreas Gohr    'ッニャ' => 'nnya',
790*13067778SAndreas Gohr    'ッニェ' => 'nnye',
791*13067778SAndreas Gohr    'ッニィ' => 'nnyi',
792*13067778SAndreas Gohr    'ッニョ' => 'nnyo',
793*13067778SAndreas Gohr    'ッニュ' => 'nnyu',
794*13067778SAndreas Gohr    'ッリャ' => 'rrya',
795*13067778SAndreas Gohr    'ッリェ' => 'rrye',
796*13067778SAndreas Gohr    'ッリィ' => 'rryi',
797*13067778SAndreas Gohr    'ッリョ' => 'rryo',
798*13067778SAndreas Gohr    'ッリュ' => 'rryu',
799*13067778SAndreas Gohr    'ッシャ' => 'ssha',
800*13067778SAndreas Gohr    'ッシェ' => 'sshe',
801*13067778SAndreas Gohr    'ッシ' => 'sshi',
802*13067778SAndreas Gohr    'ッショ' => 'ssho',
803*13067778SAndreas Gohr    'ッシュ' => 'sshu',
804*13067778SAndreas Gohr    'ッチャ' => 'ccha',
805*13067778SAndreas Gohr    'ッチェ' => 'cche',
806*13067778SAndreas Gohr    'ッチ' => 'cchi',
807*13067778SAndreas Gohr    'ッチョ' => 'ccho',
808*13067778SAndreas Gohr    'ッチュ' => 'cchu',
809*13067778SAndreas Gohr    'ッティ' => 'tti',
810*13067778SAndreas Gohr    'ッヂィ' => 'ddi',
811*13067778SAndreas Gohr
812*13067778SAndreas Gohr    // 3 character syllables - doubled vowel and consonants
813*13067778SAndreas Gohr    'ッバー' => 'bbaa',
814*13067778SAndreas Gohr    'ッベー' => 'bbee',
815*13067778SAndreas Gohr    'ッビー' => 'bbii',
816*13067778SAndreas Gohr    'ッボー' => 'bboo',
817*13067778SAndreas Gohr    'ッブー' => 'bbuu',
818*13067778SAndreas Gohr    'ッパー' => 'ppaa',
819*13067778SAndreas Gohr    'ッペー' => 'ppee',
820*13067778SAndreas Gohr    'ッピー' => 'ppii',
821*13067778SAndreas Gohr    'ッポー' => 'ppoo',
822*13067778SAndreas Gohr    'ップー' => 'ppuu',
823*13067778SAndreas Gohr    'ッケー' => 'kkee',
824*13067778SAndreas Gohr    'ッキー' => 'kkii',
825*13067778SAndreas Gohr    'ッコー' => 'kkoo',
826*13067778SAndreas Gohr    'ックー' => 'kkuu',
827*13067778SAndreas Gohr    'ッカー' => 'kkaa',
828*13067778SAndreas Gohr    'ッガー' => 'ggaa',
829*13067778SAndreas Gohr    'ッゲー' => 'ggee',
830*13067778SAndreas Gohr    'ッギー' => 'ggii',
831*13067778SAndreas Gohr    'ッゴー' => 'ggoo',
832*13067778SAndreas Gohr    'ッグー' => 'gguu',
833*13067778SAndreas Gohr    'ッマー' => 'maa',
834*13067778SAndreas Gohr    'ッメー' => 'mee',
835*13067778SAndreas Gohr    'ッミー' => 'mii',
836*13067778SAndreas Gohr    'ッモー' => 'moo',
837*13067778SAndreas Gohr    'ッムー' => 'muu',
838*13067778SAndreas Gohr    'ッナー' => 'nnaa',
839*13067778SAndreas Gohr    'ッネー' => 'nnee',
840*13067778SAndreas Gohr    'ッニー' => 'nnii',
841*13067778SAndreas Gohr    'ッノー' => 'nnoo',
842*13067778SAndreas Gohr    'ッヌー' => 'nnuu',
843*13067778SAndreas Gohr    'ッラー' => 'rraa',
844*13067778SAndreas Gohr    'ッレー' => 'rree',
845*13067778SAndreas Gohr    'ッリー' => 'rrii',
846*13067778SAndreas Gohr    'ッロー' => 'rroo',
847*13067778SAndreas Gohr    'ッルー' => 'rruu',
848*13067778SAndreas Gohr    'ッサー' => 'ssaa',
849*13067778SAndreas Gohr    'ッセー' => 'ssee',
850*13067778SAndreas Gohr    'ッシー' => 'sshii',
851*13067778SAndreas Gohr    'ッソー' => 'ssoo',
852*13067778SAndreas Gohr    'ッスー' => 'ssuu',
853*13067778SAndreas Gohr    'ッザー' => 'zzaa',
854*13067778SAndreas Gohr    'ッゼー' => 'zzee',
855*13067778SAndreas Gohr    'ッジー' => 'jjii',
856*13067778SAndreas Gohr    'ッゾー' => 'zzoo',
857*13067778SAndreas Gohr    'ッズー' => 'zzuu',
858*13067778SAndreas Gohr    'ッター' => 'ttaa',
859*13067778SAndreas Gohr    'ッテー' => 'ttee',
860*13067778SAndreas Gohr    'ッチー' => 'chii',
861*13067778SAndreas Gohr    'ットー' => 'ttoo',
862*13067778SAndreas Gohr    'ッツー' => 'ttsuu',
863*13067778SAndreas Gohr    'ッダー' => 'ddaa',
864*13067778SAndreas Gohr    'ッデー' => 'ddee',
865*13067778SAndreas Gohr    'ッヂー' => 'ddii',
866*13067778SAndreas Gohr    'ッドー' => 'ddoo',
867*13067778SAndreas Gohr    'ッヅー' => 'dduu',
868*13067778SAndreas Gohr
869*13067778SAndreas Gohr    // 2 character syllables - normal
870*13067778SAndreas Gohr    'ファ' => 'fa',
871*13067778SAndreas Gohr    'フェ' => 'fe',
872*13067778SAndreas Gohr    'フィ' => 'fi',
873*13067778SAndreas Gohr    'フォ' => 'fo',
874*13067778SAndreas Gohr    'フゥ' => 'fu',
875*13067778SAndreas Gohr    // 'フャ'=>'fya',
876*13067778SAndreas Gohr    // 'フェ'=>'fye',
877*13067778SAndreas Gohr    // 'フィ'=>'fyi',
878*13067778SAndreas Gohr    // 'フョ'=>'fyo',
879*13067778SAndreas Gohr    // 'フュ'=>'fyu',
880*13067778SAndreas Gohr    'フャ' => 'fa',
881*13067778SAndreas Gohr    'フェ' => 'fe',
882*13067778SAndreas Gohr    'フィ' => 'fi',
883*13067778SAndreas Gohr    'フョ' => 'fo',
884*13067778SAndreas Gohr    'フュ' => 'fu',
885*13067778SAndreas Gohr    'ヒャ' => 'hya',
886*13067778SAndreas Gohr    'ヒェ' => 'hye',
887*13067778SAndreas Gohr    'ヒィ' => 'hyi',
888*13067778SAndreas Gohr    'ヒョ' => 'hyo',
889*13067778SAndreas Gohr    'ヒュ' => 'hyu',
890*13067778SAndreas Gohr    'ビャ' => 'bya',
891*13067778SAndreas Gohr    'ビェ' => 'bye',
892*13067778SAndreas Gohr    'ビィ' => 'byi',
893*13067778SAndreas Gohr    'ビョ' => 'byo',
894*13067778SAndreas Gohr    'ビュ' => 'byu',
895*13067778SAndreas Gohr    'ピャ' => 'pya',
896*13067778SAndreas Gohr    'ピェ' => 'pye',
897*13067778SAndreas Gohr    'ピィ' => 'pyi',
898*13067778SAndreas Gohr    'ピョ' => 'pyo',
899*13067778SAndreas Gohr    'ピュ' => 'pyu',
900*13067778SAndreas Gohr    'キャ' => 'kya',
901*13067778SAndreas Gohr    'キェ' => 'kye',
902*13067778SAndreas Gohr    'キィ' => 'kyi',
903*13067778SAndreas Gohr    'キョ' => 'kyo',
904*13067778SAndreas Gohr    'キュ' => 'kyu',
905*13067778SAndreas Gohr    'ギャ' => 'gya',
906*13067778SAndreas Gohr    'ギェ' => 'gye',
907*13067778SAndreas Gohr    'ギィ' => 'gyi',
908*13067778SAndreas Gohr    'ギョ' => 'gyo',
909*13067778SAndreas Gohr    'ギュ' => 'gyu',
910*13067778SAndreas Gohr    'ミャ' => 'mya',
911*13067778SAndreas Gohr    'ミェ' => 'mye',
912*13067778SAndreas Gohr    'ミィ' => 'myi',
913*13067778SAndreas Gohr    'ミョ' => 'myo',
914*13067778SAndreas Gohr    'ミュ' => 'myu',
915*13067778SAndreas Gohr    'ニャ' => 'nya',
916*13067778SAndreas Gohr    'ニェ' => 'nye',
917*13067778SAndreas Gohr    'ニィ' => 'nyi',
918*13067778SAndreas Gohr    'ニョ' => 'nyo',
919*13067778SAndreas Gohr    'ニュ' => 'nyu',
920*13067778SAndreas Gohr    'リャ' => 'rya',
921*13067778SAndreas Gohr    'リェ' => 'rye',
922*13067778SAndreas Gohr    'リィ' => 'ryi',
923*13067778SAndreas Gohr    'リョ' => 'ryo',
924*13067778SAndreas Gohr    'リュ' => 'ryu',
925*13067778SAndreas Gohr    'シャ' => 'sha',
926*13067778SAndreas Gohr    'シェ' => 'she',
927*13067778SAndreas Gohr    'ショ' => 'sho',
928*13067778SAndreas Gohr    'シュ' => 'shu',
929*13067778SAndreas Gohr    'ジャ' => 'ja',
930*13067778SAndreas Gohr    'ジェ' => 'je',
931*13067778SAndreas Gohr    'ジョ' => 'jo',
932*13067778SAndreas Gohr    'ジュ' => 'ju',
933*13067778SAndreas Gohr    'スァ' => 'swa',
934*13067778SAndreas Gohr    'スェ' => 'swe',
935*13067778SAndreas Gohr    'スィ' => 'swi',
936*13067778SAndreas Gohr    'スォ' => 'swo',
937*13067778SAndreas Gohr    'スゥ' => 'swu',
938*13067778SAndreas Gohr    'デァ' => 'da',
939*13067778SAndreas Gohr    'デェ' => 'de',
940*13067778SAndreas Gohr    'ディ' => 'di',
941*13067778SAndreas Gohr    'デォ' => 'do',
942*13067778SAndreas Gohr    'デゥ' => 'du',
943*13067778SAndreas Gohr    'チャ' => 'cha',
944*13067778SAndreas Gohr    'チェ' => 'che',
945*13067778SAndreas Gohr    'チ' => 'chi',
946*13067778SAndreas Gohr    'チョ' => 'cho',
947*13067778SAndreas Gohr    'チュ' => 'chu',
948*13067778SAndreas Gohr    // 'ヂャ'=>'dya',
949*13067778SAndreas Gohr    // 'ヂェ'=>'dye',
950*13067778SAndreas Gohr    // 'ヂィ'=>'dyi',
951*13067778SAndreas Gohr    // 'ヂョ'=>'dyo',
952*13067778SAndreas Gohr    // 'ヂュ'=>'dyu',
953*13067778SAndreas Gohr    'ツャ' => 'tsa',
954*13067778SAndreas Gohr    'ツェ' => 'tse',
955*13067778SAndreas Gohr    'ツィ' => 'tsi',
956*13067778SAndreas Gohr    'ツョ' => 'tso',
957*13067778SAndreas Gohr    'ツ' => 'tsu',
958*13067778SAndreas Gohr    'トァ' => 'twa',
959*13067778SAndreas Gohr    'トェ' => 'twe',
960*13067778SAndreas Gohr    'トィ' => 'twi',
961*13067778SAndreas Gohr    'トォ' => 'two',
962*13067778SAndreas Gohr    'トゥ' => 'twu',
963*13067778SAndreas Gohr    'ドァ' => 'dwa',
964*13067778SAndreas Gohr    'ドェ' => 'dwe',
965*13067778SAndreas Gohr    'ドィ' => 'dwi',
966*13067778SAndreas Gohr    'ドォ' => 'dwo',
967*13067778SAndreas Gohr    'ドゥ' => 'dwu',
968*13067778SAndreas Gohr    'ウァ' => 'wha',
969*13067778SAndreas Gohr    'ウェ' => 'whe',
970*13067778SAndreas Gohr    'ウィ' => 'whi',
971*13067778SAndreas Gohr    'ウォ' => 'who',
972*13067778SAndreas Gohr    'ウゥ' => 'whu',
973*13067778SAndreas Gohr    'ヴャ' => 'vya',
974*13067778SAndreas Gohr    'ヴェ' => 'vye',
975*13067778SAndreas Gohr    'ヴィ' => 'vyi',
976*13067778SAndreas Gohr    'ヴョ' => 'vyo',
977*13067778SAndreas Gohr    'ヴュ' => 'vyu',
978*13067778SAndreas Gohr    'ヴァ' => 'va',
979*13067778SAndreas Gohr    'ヴェ' => 've',
980*13067778SAndreas Gohr    'ヴィ' => 'vi',
981*13067778SAndreas Gohr    'ヴォ' => 'vo',
982*13067778SAndreas Gohr    'ヴ' => 'vu',
983*13067778SAndreas Gohr    'ウェ' => 'we',
984*13067778SAndreas Gohr    'ウィ' => 'wi',
985*13067778SAndreas Gohr    'イェ' => 'ye',
986*13067778SAndreas Gohr    'ティ' => 'ti',
987*13067778SAndreas Gohr    'ヂィ' => 'di',
988*13067778SAndreas Gohr
989*13067778SAndreas Gohr    // 2 character syllables - doubled vowel
990*13067778SAndreas Gohr    'アー' => 'aa',
991*13067778SAndreas Gohr    'エー' => 'ee',
992*13067778SAndreas Gohr    'イー' => 'ii',
993*13067778SAndreas Gohr    'オー' => 'oo',
994*13067778SAndreas Gohr    'ウー' => 'uu',
995*13067778SAndreas Gohr    'ダー' => 'daa',
996*13067778SAndreas Gohr    'デー' => 'dee',
997*13067778SAndreas Gohr    'ヂー' => 'dii',
998*13067778SAndreas Gohr    'ドー' => 'doo',
999*13067778SAndreas Gohr    'ヅー' => 'duu',
1000*13067778SAndreas Gohr    'ハー' => 'haa',
1001*13067778SAndreas Gohr    'ヘー' => 'hee',
1002*13067778SAndreas Gohr    'ヒー' => 'hii',
1003*13067778SAndreas Gohr    'ホー' => 'hoo',
1004*13067778SAndreas Gohr    'フー' => 'fuu',
1005*13067778SAndreas Gohr    'バー' => 'baa',
1006*13067778SAndreas Gohr    'ベー' => 'bee',
1007*13067778SAndreas Gohr    'ビー' => 'bii',
1008*13067778SAndreas Gohr    'ボー' => 'boo',
1009*13067778SAndreas Gohr    'ブー' => 'buu',
1010*13067778SAndreas Gohr    'パー' => 'paa',
1011*13067778SAndreas Gohr    'ペー' => 'pee',
1012*13067778SAndreas Gohr    'ピー' => 'pii',
1013*13067778SAndreas Gohr    'ポー' => 'poo',
1014*13067778SAndreas Gohr    'プー' => 'puu',
1015*13067778SAndreas Gohr    'ケー' => 'kee',
1016*13067778SAndreas Gohr    'キー' => 'kii',
1017*13067778SAndreas Gohr    'コー' => 'koo',
1018*13067778SAndreas Gohr    'クー' => 'kuu',
1019*13067778SAndreas Gohr    'カー' => 'kaa',
1020*13067778SAndreas Gohr    'ガー' => 'gaa',
1021*13067778SAndreas Gohr    'ゲー' => 'gee',
1022*13067778SAndreas Gohr    'ギー' => 'gii',
1023*13067778SAndreas Gohr    'ゴー' => 'goo',
1024*13067778SAndreas Gohr    'グー' => 'guu',
1025*13067778SAndreas Gohr    'マー' => 'maa',
1026*13067778SAndreas Gohr    'メー' => 'mee',
1027*13067778SAndreas Gohr    'ミー' => 'mii',
1028*13067778SAndreas Gohr    'モー' => 'moo',
1029*13067778SAndreas Gohr    'ムー' => 'muu',
1030*13067778SAndreas Gohr    'ナー' => 'naa',
1031*13067778SAndreas Gohr    'ネー' => 'nee',
1032*13067778SAndreas Gohr    'ニー' => 'nii',
1033*13067778SAndreas Gohr    'ノー' => 'noo',
1034*13067778SAndreas Gohr    'ヌー' => 'nuu',
1035*13067778SAndreas Gohr    'ラー' => 'raa',
1036*13067778SAndreas Gohr    'レー' => 'ree',
1037*13067778SAndreas Gohr    'リー' => 'rii',
1038*13067778SAndreas Gohr    'ロー' => 'roo',
1039*13067778SAndreas Gohr    'ルー' => 'ruu',
1040*13067778SAndreas Gohr    'サー' => 'saa',
1041*13067778SAndreas Gohr    'セー' => 'see',
1042*13067778SAndreas Gohr    'シー' => 'shii',
1043*13067778SAndreas Gohr    'ソー' => 'soo',
1044*13067778SAndreas Gohr    'スー' => 'suu',
1045*13067778SAndreas Gohr    'ザー' => 'zaa',
1046*13067778SAndreas Gohr    'ゼー' => 'zee',
1047*13067778SAndreas Gohr    'ジー' => 'jii',
1048*13067778SAndreas Gohr    'ゾー' => 'zoo',
1049*13067778SAndreas Gohr    'ズー' => 'zuu',
1050*13067778SAndreas Gohr    'ター' => 'taa',
1051*13067778SAndreas Gohr    'テー' => 'tee',
1052*13067778SAndreas Gohr    'チー' => 'chii',
1053*13067778SAndreas Gohr    'トー' => 'too',
1054*13067778SAndreas Gohr    'ツー' => 'tsuu',
1055*13067778SAndreas Gohr    'ワー' => 'waa',
1056*13067778SAndreas Gohr    'ヲー' => 'woo',
1057*13067778SAndreas Gohr    'ヤー' => 'yaa',
1058*13067778SAndreas Gohr    'ヨー' => 'yoo',
1059*13067778SAndreas Gohr    'ユー' => 'yuu',
1060*13067778SAndreas Gohr    'ヵー' => 'kaa',
1061*13067778SAndreas Gohr    'ヶー' => 'kee',
1062*13067778SAndreas Gohr    // old characters
1063*13067778SAndreas Gohr    'ヱー' => 'wee',
1064*13067778SAndreas Gohr    'ヰー' => 'wii',
1065*13067778SAndreas Gohr
1066*13067778SAndreas Gohr    // separate katakana 'n'
1067*13067778SAndreas Gohr    'ンア' => 'n_a',
1068*13067778SAndreas Gohr    'ンエ' => 'n_e',
1069*13067778SAndreas Gohr    'ンイ' => 'n_i',
1070*13067778SAndreas Gohr    'ンオ' => 'n_o',
1071*13067778SAndreas Gohr    'ンウ' => 'n_u',
1072*13067778SAndreas Gohr    'ンヤ' => 'n_ya',
1073*13067778SAndreas Gohr    'ンヨ' => 'n_yo',
1074*13067778SAndreas Gohr    'ンユ' => 'n_yu',
1075*13067778SAndreas Gohr
1076*13067778SAndreas Gohr    // 2 character syllables - doubled consonants
1077*13067778SAndreas Gohr    'ッバ' => 'bba',
1078*13067778SAndreas Gohr    'ッベ' => 'bbe',
1079*13067778SAndreas Gohr    'ッビ' => 'bbi',
1080*13067778SAndreas Gohr    'ッボ' => 'bbo',
1081*13067778SAndreas Gohr    'ッブ' => 'bbu',
1082*13067778SAndreas Gohr    'ッパ' => 'ppa',
1083*13067778SAndreas Gohr    'ッペ' => 'ppe',
1084*13067778SAndreas Gohr    'ッピ' => 'ppi',
1085*13067778SAndreas Gohr    'ッポ' => 'ppo',
1086*13067778SAndreas Gohr    'ップ' => 'ppu',
1087*13067778SAndreas Gohr    'ッケ' => 'kke',
1088*13067778SAndreas Gohr    'ッキ' => 'kki',
1089*13067778SAndreas Gohr    'ッコ' => 'kko',
1090*13067778SAndreas Gohr    'ック' => 'kku',
1091*13067778SAndreas Gohr    'ッカ' => 'kka',
1092*13067778SAndreas Gohr    'ッガ' => 'gga',
1093*13067778SAndreas Gohr    'ッゲ' => 'gge',
1094*13067778SAndreas Gohr    'ッギ' => 'ggi',
1095*13067778SAndreas Gohr    'ッゴ' => 'ggo',
1096*13067778SAndreas Gohr    'ッグ' => 'ggu',
1097*13067778SAndreas Gohr    'ッマ' => 'ma',
1098*13067778SAndreas Gohr    'ッメ' => 'me',
1099*13067778SAndreas Gohr    'ッミ' => 'mi',
1100*13067778SAndreas Gohr    'ッモ' => 'mo',
1101*13067778SAndreas Gohr    'ッム' => 'mu',
1102*13067778SAndreas Gohr    'ッナ' => 'nna',
1103*13067778SAndreas Gohr    'ッネ' => 'nne',
1104*13067778SAndreas Gohr    'ッニ' => 'nni',
1105*13067778SAndreas Gohr    'ッノ' => 'nno',
1106*13067778SAndreas Gohr    'ッヌ' => 'nnu',
1107*13067778SAndreas Gohr    'ッラ' => 'rra',
1108*13067778SAndreas Gohr    'ッレ' => 'rre',
1109*13067778SAndreas Gohr    'ッリ' => 'rri',
1110*13067778SAndreas Gohr    'ッロ' => 'rro',
1111*13067778SAndreas Gohr    'ッル' => 'rru',
1112*13067778SAndreas Gohr    'ッサ' => 'ssa',
1113*13067778SAndreas Gohr    'ッセ' => 'sse',
1114*13067778SAndreas Gohr    'ッシ' => 'sshi',
1115*13067778SAndreas Gohr    'ッソ' => 'sso',
1116*13067778SAndreas Gohr    'ッス' => 'ssu',
1117*13067778SAndreas Gohr    'ッザ' => 'zza',
1118*13067778SAndreas Gohr    'ッゼ' => 'zze',
1119*13067778SAndreas Gohr    'ッジ' => 'jji',
1120*13067778SAndreas Gohr    'ッゾ' => 'zzo',
1121*13067778SAndreas Gohr    'ッズ' => 'zzu',
1122*13067778SAndreas Gohr    'ッタ' => 'tta',
1123*13067778SAndreas Gohr    'ッテ' => 'tte',
1124*13067778SAndreas Gohr    'ッチ' => 'cchi',
1125*13067778SAndreas Gohr    'ット' => 'tto',
1126*13067778SAndreas Gohr    'ッツ' => 'ttsu',
1127*13067778SAndreas Gohr    'ッダ' => 'dda',
1128*13067778SAndreas Gohr    'ッデ' => 'dde',
1129*13067778SAndreas Gohr    'ッヂ' => 'ddi',
1130*13067778SAndreas Gohr    'ッド' => 'ddo',
1131*13067778SAndreas Gohr    'ッヅ' => 'ddu',
1132*13067778SAndreas Gohr
1133*13067778SAndreas Gohr    // 1 character syllables
1134*13067778SAndreas Gohr    'ア' => 'a',
1135*13067778SAndreas Gohr    'エ' => 'e',
1136*13067778SAndreas Gohr    'イ' => 'i',
1137*13067778SAndreas Gohr    'オ' => 'o',
1138*13067778SAndreas Gohr    'ウ' => 'u',
1139*13067778SAndreas Gohr    'ン' => 'n',
1140*13067778SAndreas Gohr    'ハ' => 'ha',
1141*13067778SAndreas Gohr    'ヘ' => 'he',
1142*13067778SAndreas Gohr    'ヒ' => 'hi',
1143*13067778SAndreas Gohr    'ホ' => 'ho',
1144*13067778SAndreas Gohr    'フ' => 'fu',
1145*13067778SAndreas Gohr    'バ' => 'ba',
1146*13067778SAndreas Gohr    'ベ' => 'be',
1147*13067778SAndreas Gohr    'ビ' => 'bi',
1148*13067778SAndreas Gohr    'ボ' => 'bo',
1149*13067778SAndreas Gohr    'ブ' => 'bu',
1150*13067778SAndreas Gohr    'パ' => 'pa',
1151*13067778SAndreas Gohr    'ペ' => 'pe',
1152*13067778SAndreas Gohr    'ピ' => 'pi',
1153*13067778SAndreas Gohr    'ポ' => 'po',
1154*13067778SAndreas Gohr    'プ' => 'pu',
1155*13067778SAndreas Gohr    'ケ' => 'ke',
1156*13067778SAndreas Gohr    'キ' => 'ki',
1157*13067778SAndreas Gohr    'コ' => 'ko',
1158*13067778SAndreas Gohr    'ク' => 'ku',
1159*13067778SAndreas Gohr    'カ' => 'ka',
1160*13067778SAndreas Gohr    'ガ' => 'ga',
1161*13067778SAndreas Gohr    'ゲ' => 'ge',
1162*13067778SAndreas Gohr    'ギ' => 'gi',
1163*13067778SAndreas Gohr    'ゴ' => 'go',
1164*13067778SAndreas Gohr    'グ' => 'gu',
1165*13067778SAndreas Gohr    'マ' => 'ma',
1166*13067778SAndreas Gohr    'メ' => 'me',
1167*13067778SAndreas Gohr    'ミ' => 'mi',
1168*13067778SAndreas Gohr    'モ' => 'mo',
1169*13067778SAndreas Gohr    'ム' => 'mu',
1170*13067778SAndreas Gohr    'ナ' => 'na',
1171*13067778SAndreas Gohr    'ネ' => 'ne',
1172*13067778SAndreas Gohr    'ニ' => 'ni',
1173*13067778SAndreas Gohr    'ノ' => 'no',
1174*13067778SAndreas Gohr    'ヌ' => 'nu',
1175*13067778SAndreas Gohr    'ラ' => 'ra',
1176*13067778SAndreas Gohr    'レ' => 're',
1177*13067778SAndreas Gohr    'リ' => 'ri',
1178*13067778SAndreas Gohr    'ロ' => 'ro',
1179*13067778SAndreas Gohr    'ル' => 'ru',
1180*13067778SAndreas Gohr    'サ' => 'sa',
1181*13067778SAndreas Gohr    'セ' => 'se',
1182*13067778SAndreas Gohr    'シ' => 'shi',
1183*13067778SAndreas Gohr    'ソ' => 'so',
1184*13067778SAndreas Gohr    'ス' => 'su',
1185*13067778SAndreas Gohr    'ザ' => 'za',
1186*13067778SAndreas Gohr    'ゼ' => 'ze',
1187*13067778SAndreas Gohr    'ジ' => 'ji',
1188*13067778SAndreas Gohr    'ゾ' => 'zo',
1189*13067778SAndreas Gohr    'ズ' => 'zu',
1190*13067778SAndreas Gohr    'タ' => 'ta',
1191*13067778SAndreas Gohr    'テ' => 'te',
1192*13067778SAndreas Gohr    'チ' => 'chi',
1193*13067778SAndreas Gohr    'ト' => 'to',
1194*13067778SAndreas Gohr    'ツ' => 'tsu',
1195*13067778SAndreas Gohr    'ダ' => 'da',
1196*13067778SAndreas Gohr    'デ' => 'de',
1197*13067778SAndreas Gohr    'ヂ' => 'di',
1198*13067778SAndreas Gohr    'ド' => 'do',
1199*13067778SAndreas Gohr    'ヅ' => 'du',
1200*13067778SAndreas Gohr    'ワ' => 'wa',
1201*13067778SAndreas Gohr    'ヲ' => 'wo',
1202*13067778SAndreas Gohr    'ヤ' => 'ya',
1203*13067778SAndreas Gohr    'ヨ' => 'yo',
1204*13067778SAndreas Gohr    'ユ' => 'yu',
1205*13067778SAndreas Gohr    'ヵ' => 'ka',
1206*13067778SAndreas Gohr    'ヶ' => 'ke',
1207*13067778SAndreas Gohr    // old characters
1208*13067778SAndreas Gohr    'ヱ' => 'we',
1209*13067778SAndreas Gohr    'ヰ' => 'wi',
1210*13067778SAndreas Gohr
1211*13067778SAndreas Gohr    //  convert what's left (probably only kicks in when something's missing above)
1212*13067778SAndreas Gohr    'ァ' => 'a',
1213*13067778SAndreas Gohr    'ェ' => 'e',
1214*13067778SAndreas Gohr    'ィ' => 'i',
1215*13067778SAndreas Gohr    'ォ' => 'o',
1216*13067778SAndreas Gohr    'ゥ' => 'u',
1217*13067778SAndreas Gohr    'ャ' => 'ya',
1218*13067778SAndreas Gohr    'ョ' => 'yo',
1219*13067778SAndreas Gohr    'ュ' => 'yu',
1220*13067778SAndreas Gohr
1221*13067778SAndreas Gohr    // special characters
1222*13067778SAndreas Gohr    '・' => '_',
1223*13067778SAndreas Gohr    '、' => '_',
1224*13067778SAndreas Gohr    'ー' => '_',
1225*13067778SAndreas Gohr    // the 'ー' entry above: when used with hiragana (seldom), this character would not be converted otherwise
1226*13067778SAndreas Gohr
1227*13067778SAndreas Gohr    // 'ラ'=>'la',
1228*13067778SAndreas Gohr    // 'レ'=>'le',
1229*13067778SAndreas Gohr    // 'リ'=>'li',
1230*13067778SAndreas Gohr    // 'ロ'=>'lo',
1231*13067778SAndreas Gohr    // 'ル'=>'lu',
1232*13067778SAndreas Gohr    // 'チャ'=>'cya',
1233*13067778SAndreas Gohr    // 'チェ'=>'cye',
1234*13067778SAndreas Gohr    // 'チィ'=>'cyi',
1235*13067778SAndreas Gohr    // 'チョ'=>'cyo',
1236*13067778SAndreas Gohr    // 'チュ'=>'cyu',
1237*13067778SAndreas Gohr    // 'デャ'=>'dha',
1238*13067778SAndreas Gohr    // 'デェ'=>'dhe',
1239*13067778SAndreas Gohr    // 'ディ'=>'dhi',
1240*13067778SAndreas Gohr    // 'デョ'=>'dho',
1241*13067778SAndreas Gohr    // 'デュ'=>'dhu',
1242*13067778SAndreas Gohr    // 'リャ'=>'lya',
1243*13067778SAndreas Gohr    // 'リェ'=>'lye',
1244*13067778SAndreas Gohr    // 'リィ'=>'lyi',
1245*13067778SAndreas Gohr    // 'リョ'=>'lyo',
1246*13067778SAndreas Gohr    // 'リュ'=>'lyu',
1247*13067778SAndreas Gohr    // 'テャ'=>'tha',
1248*13067778SAndreas Gohr    // 'テェ'=>'the',
1249*13067778SAndreas Gohr    // 'ティ'=>'thi',
1250*13067778SAndreas Gohr    // 'テョ'=>'tho',
1251*13067778SAndreas Gohr    // 'テュ'=>'thu',
1252*13067778SAndreas Gohr    // 'ファ'=>'fwa',
1253*13067778SAndreas Gohr    // 'フェ'=>'fwe',
1254*13067778SAndreas Gohr    // 'フィ'=>'fwi',
1255*13067778SAndreas Gohr    // 'フォ'=>'fwo',
1256*13067778SAndreas Gohr    // 'フゥ'=>'fwu',
1257*13067778SAndreas Gohr    // 'チャ'=>'tya',
1258*13067778SAndreas Gohr    // 'チェ'=>'tye',
1259*13067778SAndreas Gohr    // 'チィ'=>'tyi',
1260*13067778SAndreas Gohr    // 'チョ'=>'tyo',
1261*13067778SAndreas Gohr    // 'チュ'=>'tyu',
1262*13067778SAndreas Gohr    // 'ジャ'=>'jya',
1263*13067778SAndreas Gohr    // 'ジェ'=>'jye',
1264*13067778SAndreas Gohr    // 'ジィ'=>'jyi',
1265*13067778SAndreas Gohr    // 'ジョ'=>'jyo',
1266*13067778SAndreas Gohr    // 'ジュ'=>'jyu',
1267*13067778SAndreas Gohr    // 'ジャ'=>'zha',
1268*13067778SAndreas Gohr    // 'ジェ'=>'zhe',
1269*13067778SAndreas Gohr    // 'ジィ'=>'zhi',
1270*13067778SAndreas Gohr    // 'ジョ'=>'zho',
1271*13067778SAndreas Gohr    // 'ジュ'=>'zhu',
1272*13067778SAndreas Gohr    // 'ジャ'=>'zya',
1273*13067778SAndreas Gohr    // 'ジェ'=>'zye',
1274*13067778SAndreas Gohr    // 'ジィ'=>'zyi',
1275*13067778SAndreas Gohr    // 'ジョ'=>'zyo',
1276*13067778SAndreas Gohr    // 'ジュ'=>'zyu',
1277*13067778SAndreas Gohr    // 'シャ'=>'sya',
1278*13067778SAndreas Gohr    // 'シェ'=>'sye',
1279*13067778SAndreas Gohr    // 'シィ'=>'syi',
1280*13067778SAndreas Gohr    // 'ショ'=>'syo',
1281*13067778SAndreas Gohr    // 'シュ'=>'syu',
1282*13067778SAndreas Gohr    // 'シ'=>'ci',
1283*13067778SAndreas Gohr    // 'フ'=>'hu',
1284*13067778SAndreas Gohr    // 'シ'=>'si',
1285*13067778SAndreas Gohr    // 'チ'=>'ti',
1286*13067778SAndreas Gohr    // 'ツ'=>'tu',
1287*13067778SAndreas Gohr    // 'イ'=>'yi',
1288*13067778SAndreas Gohr    // 'ヂ'=>'dzi',
1289*13067778SAndreas Gohr
1290*13067778SAndreas Gohr    // "Greeklish"
1291*13067778SAndreas Gohr    'Γ' => 'G',
1292*13067778SAndreas Gohr    'Δ' => 'E',
1293*13067778SAndreas Gohr    'Θ' => 'Th',
1294*13067778SAndreas Gohr    'Λ' => 'L',
1295*13067778SAndreas Gohr    'Ξ' => 'X',
1296*13067778SAndreas Gohr    'Π' => 'P',
1297*13067778SAndreas Gohr    'Σ' => 'S',
1298*13067778SAndreas Gohr    'Φ' => 'F',
1299*13067778SAndreas Gohr    'Ψ' => 'Ps',
1300*13067778SAndreas Gohr    'γ' => 'g',
1301*13067778SAndreas Gohr    'δ' => 'e',
1302*13067778SAndreas Gohr    'θ' => 'th',
1303*13067778SAndreas Gohr    'λ' => 'l',
1304*13067778SAndreas Gohr    'ξ' => 'x',
1305*13067778SAndreas Gohr    'π' => 'p',
1306*13067778SAndreas Gohr    'σ' => 's',
1307*13067778SAndreas Gohr    'φ' => 'f',
1308*13067778SAndreas Gohr    'ψ' => 'ps',
1309*13067778SAndreas Gohr
1310*13067778SAndreas Gohr    // Thai
1311*13067778SAndreas Gohr    'ก' => 'k',
1312*13067778SAndreas Gohr    'ข' => 'kh',
1313*13067778SAndreas Gohr    'ฃ' => 'kh',
1314*13067778SAndreas Gohr    'ค' => 'kh',
1315*13067778SAndreas Gohr    'ฅ' => 'kh',
1316*13067778SAndreas Gohr    'ฆ' => 'kh',
1317*13067778SAndreas Gohr    'ง' => 'ng',
1318*13067778SAndreas Gohr    'จ' => 'ch',
1319*13067778SAndreas Gohr    'ฉ' => 'ch',
1320*13067778SAndreas Gohr    'ช' => 'ch',
1321*13067778SAndreas Gohr    'ซ' => 's',
1322*13067778SAndreas Gohr    'ฌ' => 'ch',
1323*13067778SAndreas Gohr    'ญ' => 'y',
1324*13067778SAndreas Gohr    'ฎ' => 'd',
1325*13067778SAndreas Gohr    'ฏ' => 't',
1326*13067778SAndreas Gohr    'ฐ' => 'th',
1327*13067778SAndreas Gohr    'ฑ' => 'd',
1328*13067778SAndreas Gohr    'ฒ' => 'th',
1329*13067778SAndreas Gohr    'ณ' => 'n',
1330*13067778SAndreas Gohr    'ด' => 'd',
1331*13067778SAndreas Gohr    'ต' => 't',
1332*13067778SAndreas Gohr    'ถ' => 'th',
1333*13067778SAndreas Gohr    'ท' => 'th',
1334*13067778SAndreas Gohr    'ธ' => 'th',
1335*13067778SAndreas Gohr    'น' => 'n',
1336*13067778SAndreas Gohr    'บ' => 'b',
1337*13067778SAndreas Gohr    'ป' => 'p',
1338*13067778SAndreas Gohr    'ผ' => 'ph',
1339*13067778SAndreas Gohr    'ฝ' => 'f',
1340*13067778SAndreas Gohr    'พ' => 'ph',
1341*13067778SAndreas Gohr    'ฟ' => 'f',
1342*13067778SAndreas Gohr    'ภ' => 'ph',
1343*13067778SAndreas Gohr    'ม' => 'm',
1344*13067778SAndreas Gohr    'ย' => 'y',
1345*13067778SAndreas Gohr    'ร' => 'r',
1346*13067778SAndreas Gohr    'ฤ' => 'rue',
1347*13067778SAndreas Gohr    'ฤๅ' => 'rue',
1348*13067778SAndreas Gohr    'ล' => 'l',
1349*13067778SAndreas Gohr    'ฦ' => 'lue',
1350*13067778SAndreas Gohr    'ฦๅ' => 'lue',
1351*13067778SAndreas Gohr    'ว' => 'w',
1352*13067778SAndreas Gohr    'ศ' => 's',
1353*13067778SAndreas Gohr    'ษ' => 's',
1354*13067778SAndreas Gohr    'ส' => 's',
1355*13067778SAndreas Gohr    'ห' => 'h',
1356*13067778SAndreas Gohr    'ฬ' => 'l',
1357*13067778SAndreas Gohr    'ฮ' => 'h',
1358*13067778SAndreas Gohr    'ะ' => 'a',
1359*13067778SAndreas Gohr    'ั' => 'a',
1360*13067778SAndreas Gohr    'รร' => 'a',
1361*13067778SAndreas Gohr    'า' => 'a',
1362*13067778SAndreas Gohr    'ๅ' => 'a',
1363*13067778SAndreas Gohr    'ำ' => 'am',
1364*13067778SAndreas Gohr    'ํา' => 'am',
1365*13067778SAndreas Gohr    'ิ' => 'i',
1366*13067778SAndreas Gohr    'ี' => 'i',
1367*13067778SAndreas Gohr    'ึ' => 'ue',
1368*13067778SAndreas Gohr    'ี' => 'ue',
1369*13067778SAndreas Gohr    'ุ' => 'u',
1370*13067778SAndreas Gohr    'ู' => 'u',
1371*13067778SAndreas Gohr    'เ' => 'e',
1372*13067778SAndreas Gohr    'แ' => 'ae',
1373*13067778SAndreas Gohr    'โ' => 'o',
1374*13067778SAndreas Gohr    'อ' => 'o',
1375*13067778SAndreas Gohr    'ียะ' => 'ia',
1376*13067778SAndreas Gohr    'ีย' => 'ia',
1377*13067778SAndreas Gohr    'ือะ' => 'uea',
1378*13067778SAndreas Gohr    'ือ' => 'uea',
1379*13067778SAndreas Gohr    'ัวะ' => 'ua',
1380*13067778SAndreas Gohr    'ัว' => 'ua',
1381*13067778SAndreas Gohr    'ใ' => 'ai',
1382*13067778SAndreas Gohr    'ไ' => 'ai',
1383*13067778SAndreas Gohr    'ัย' => 'ai',
1384*13067778SAndreas Gohr    'าย' => 'ai',
1385*13067778SAndreas Gohr    'าว' => 'ao',
1386*13067778SAndreas Gohr    'ุย' => 'ui',
1387*13067778SAndreas Gohr    'อย' => 'oi',
1388*13067778SAndreas Gohr    'ือย' => 'ueai',
1389*13067778SAndreas Gohr    'วย' => 'uai',
1390*13067778SAndreas Gohr    'ิว' => 'io',
1391*13067778SAndreas Gohr    '็ว' => 'eo',
1392*13067778SAndreas Gohr    'ียว' => 'iao',
1393*13067778SAndreas Gohr    '่' => '',
1394*13067778SAndreas Gohr    '้' => '',
1395*13067778SAndreas Gohr    '๊' => '',
1396*13067778SAndreas Gohr    '๋' => '',
1397*13067778SAndreas Gohr    '็' => '',
1398*13067778SAndreas Gohr    '์' => '',
1399*13067778SAndreas Gohr    '๎' => '',
1400*13067778SAndreas Gohr    'ํ' => '',
1401*13067778SAndreas Gohr    'ฺ' => '',
1402*13067778SAndreas Gohr    'ๆ' => '2',
1403*13067778SAndreas Gohr    '๏' => 'o',
1404*13067778SAndreas Gohr    'ฯ' => '-',
1405*13067778SAndreas Gohr    '๚' => '-',
1406*13067778SAndreas Gohr    '๛' => '-',
1407*13067778SAndreas Gohr    '๐' => '0',
1408*13067778SAndreas Gohr    '๑' => '1',
1409*13067778SAndreas Gohr    '๒' => '2',
1410*13067778SAndreas Gohr    '๓' => '3',
1411*13067778SAndreas Gohr    '๔' => '4',
1412*13067778SAndreas Gohr    '๕' => '5',
1413*13067778SAndreas Gohr    '๖' => '6',
1414*13067778SAndreas Gohr    '๗' => '7',
1415*13067778SAndreas Gohr    '๘' => '8',
1416*13067778SAndreas Gohr    '๙' => '9',
1417*13067778SAndreas Gohr
1418*13067778SAndreas Gohr    // Korean
1419*13067778SAndreas Gohr    'ㄱ' => 'k', 'ㅋ' => 'kh',
1420*13067778SAndreas Gohr    'ㄲ' => 'kk',
1421*13067778SAndreas Gohr    'ㄷ' => 't',
1422*13067778SAndreas Gohr    'ㅌ' => 'th',
1423*13067778SAndreas Gohr    'ㄸ' => 'tt',
1424*13067778SAndreas Gohr    'ㅂ' => 'p',
1425*13067778SAndreas Gohr    'ㅍ' => 'ph',
1426*13067778SAndreas Gohr    'ㅃ' => 'pp',
1427*13067778SAndreas Gohr    'ㅈ' => 'c',
1428*13067778SAndreas Gohr    'ㅊ' => 'ch',
1429*13067778SAndreas Gohr    'ㅉ' => 'cc',
1430*13067778SAndreas Gohr    'ㅅ' => 's',
1431*13067778SAndreas Gohr    'ㅆ' => 'ss',
1432*13067778SAndreas Gohr    'ㅎ' => 'h',
1433*13067778SAndreas Gohr    'ㅇ' => 'ng',
1434*13067778SAndreas Gohr    'ㄴ' => 'n',
1435*13067778SAndreas Gohr    'ㄹ' => 'l',
1436*13067778SAndreas Gohr    'ㅁ' => 'm',
1437*13067778SAndreas Gohr    'ㅏ' => 'a',
1438*13067778SAndreas Gohr    'ㅓ' => 'e',
1439*13067778SAndreas Gohr    'ㅗ' => 'o',
1440*13067778SAndreas Gohr    'ㅜ' => 'wu',
1441*13067778SAndreas Gohr    'ㅡ' => 'u',
1442*13067778SAndreas Gohr    'ㅣ' => 'i',
1443*13067778SAndreas Gohr    'ㅐ' => 'ay',
1444*13067778SAndreas Gohr    'ㅔ' => 'ey',
1445*13067778SAndreas Gohr    'ㅚ' => 'oy',
1446*13067778SAndreas Gohr    'ㅘ' => 'wa',
1447*13067778SAndreas Gohr    'ㅝ' => 'we',
1448*13067778SAndreas Gohr    'ㅟ' => 'wi',
1449*13067778SAndreas Gohr    'ㅙ' => 'way',
1450*13067778SAndreas Gohr    'ㅞ' => 'wey',
1451*13067778SAndreas Gohr    'ㅢ' => 'uy',
1452*13067778SAndreas Gohr    'ㅑ' => 'ya',
1453*13067778SAndreas Gohr    'ㅕ' => 'ye',
1454*13067778SAndreas Gohr    'ㅛ' => 'oy',
1455*13067778SAndreas Gohr    'ㅠ' => 'yu',
1456*13067778SAndreas Gohr    'ㅒ' => 'yay',
1457*13067778SAndreas Gohr    'ㅖ' => 'yey',
1458*13067778SAndreas Gohr];
1459