xref: /aosp_15_r20/external/cldr/common/transforms/Myanmar-Latin.xml (revision 912701f9769bb47905792267661f0baf2b85bed5)
1<?xml version="1.0" encoding="UTF-8" ?>
2<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
3<!-- Copyright © 2020 Unicode, Inc.
4CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
5For terms of use, see http://www.unicode.org/copyright.html -->
6<supplementalData>
7	<version number="$Revision$" />
8	<transforms>
9		<transform source="my" target="my_Latn" direction="forward" draft="contributed" alias="Burmese-Latin Myanmar-Latin my-Latn-t-my">
10			<tRule><![CDATA[
11# Author: Arne Mauser, Moe Aung Naing
12# Description: Myanmar Romanization
13
14$consonants = [\u1000-\u1021];  # Myanmar letters U+1000 (KA) through U+1021 (A); captured as $1/$2 by the context rules below
15
16# Character combinations: "1 consonant 5 vowels"
17# ($consonants) ြောင့် > | $1 yount;
18($consonants) \u103C\u1031\u102C\u1004\u103A\u1037 > | $1 yount;
19
20# ($consonants) ျောင့် > | $1 yount;
21($consonants)  \u103B\u1031\u102C\u1004\u103A\u1037 > | $1 yount;
22
23# ($consonants) ြောင်း > | $1 yaungg;
24($consonants) \u103C\u1031\u102C\u1004\u103A\u1038 > | $1 yaungg;
25
26# ($consonants) ျောင်း > | $1 yaungg;
27($consonants) \u103B\u1031\u102C\u1004\u103A\u1038  > | $1 yaungg;
28
29
30
31#  Character combinations: "1 consonant 4 vowels"
32# ိုင်း > ine;
33 \u102D\u102F\u1004\u103A\u1038 > ine;
34
35# ($consonants) ြောင် > | $1 yaung;
36($consonants) \u103C\u1031\u102C\u1004\u103A  > | $1 yaung;
37
38# ($consonants) ျောင် > | $1 yaung;
39($consonants) \u103B\u1031\u102C\u1004\u103A  > | $1 yaung;
40
41
42
43#  Character combinations: "1 consonant 3 vowels"
44# ောက် > out; # 1c3v
45\u1031\u102C\u1000\u103A > out;
46
47# ေါက် > out; # 1c3v
48\u1031\u102B\u1000\u103A > out;
49
50# ိုက် > ite; # 1c3v
51\u102D\u102F\u1000\u103A > ite;
52
53# ိုင် > ine; # 1c3v
54\u102D\u102F\u1004\u103A > ine;
55
56# ိုယ် > o; # 1c3v
57\u102D\u102F\u101A\u103A > o;
58
59# ျင်း > yinn;
60\u103B\u1004\u103A\u1038 > yinn;
61
62# ျိန် > yane;
63\u103B\u102D\u1014\u103A > yane;
64
65# ($consonants) ောင်း > | $1 aungg;
66($consonants) \u1031\u102C\u1004\u103A\u1038 > | $1 aungg;
67
68# ($consonants) ေါင်း > | $1 aungg;
69($consonants) \u1031\u102B\u1004\u103A\u1038 > | $1 aungg;
70
71# ($consonants) ောင် > | $1 aung;
72($consonants) \u1031\u102C\u1004\u103A > | $1 aung;
73
74# ($consonants) ေါင် >  | $1 aung;
75($consonants) \u1031\u102B\u1004\u103A > | $1 aung;
76
77# ($consonants) ြင့် > | $1 yint;
78($consonants) \u103C\u1004\u103A\u1037 > | $1 yint;
79
80# ($consonants) ြင်း > | $1 yinn;
81($consonants) \u103C\u1004\u103A\u1038 > | $1 yinn;
82
83# ($consonants) ြင် > | $1 yin;
84($consonants) \u103C\u1004\u103A > | $1 yin;
85
86# ($consonants) ျင့် > | $1 yint;
87($consonants) \u103B\u1004\u103A\u1037 > | $1 yint;
88
89# ($consonants) ျင်း > | $1 yinn;
90($consonants) \u103B\u1004\u103A\u1038 > | $1 yinn;
91
92# ($consonants) ျင် > | $1 yin;
93($consonants) \u103B\u1004\u103A > | $1 yin;
94
95# ($consonants) ြစ် > | $1 yit;
96($consonants) \u103C\u1005\u103A > | $1 yit;
97
98# ($consonants) ျစ် > | $1 yit;
99($consonants)  \u103B\u1005\u103A > | $1 yit;
100
101# ($consonants) ြည် > | $1 yi;
102($consonants) \u103C\u100A\u103A > | $1 yi;
103
104# ($consonants) ြန် > | $1 yan;
105($consonants) \u103C\u1014\u103A > | $1 yan;
106
107# ($consonants) ြန်း > | $1 yann;
108($consonants) \u103C\u1014\u103A\u1038 > | $1 yann;
109
110# ($consonants) ျန်း > | $1 yann;
111($consonants) \u103B\u1014\u103A\u1038 > | $1 yann;
112
113# ိမ်း > aim;
114\u102D\u1019\u103A\u1038 > aim;
115
116# ိန်း > ein;
117\u102D\u1014\u103A\u1038 > ein;
118
119
120
121#  Character combinations: "4 vowels"
122# ျိုး > yoe;
123\u103B\u102D\u102F\u1038 > yoe;
124
125# ($consonants) ြော် > | $1 yaw;
126($consonants) \u103C\u1031\u102C\u103A > | $1 yaw;
127
128# ($consonants) ျော် > | $1 yaw;
129($consonants) \u103B\u1031\u102C\u103A > | $1 yaw;
130
131
132
133# Character combinations: "1 consonant 2 vowels"
134# ဦး > u;
135\u1025\u102E\u1038 > u;  # this is a misspelling of \u1026
136
137# ွက် > wat;
138\u103D\u1000\u103A > wat;
139
140# ွင် > win;
141\u103D\u1004\u103A > win;
142
143# န်း > ann;
144\u1014\u103A\u1038 > ann;
145
146# န့် > ant;
147\u1014\u103A\u1037 > ant;
148
149# င်း > inn;
150\u1004\u103A\u1038 > inn;
151
152# င့် > int;
153\u1004\u103A\u1037 > int;
154
155# ည်း > ee;
156\u100A\u103A\u1038 > ee;
157
158# ည့် > eet; # 1c2v
159\u100A\u103A\u1037 > eet;
160
161# ိတ် > ate; # 1c2v
162\u102D\u1010\u103A > ate;
163
164# ုတ် > ote; # 1c2v
165\u102F\u1010\u103A > ote;
166
167# ုန် > one; # 1c2v
168\u102F\u1014\u103A > one;
169
170# ုပ် > ote; # 1c2v
171\u102F\u1015\u103A > ote;
172
173# ိမ် > aim; # 1c2v
174\u102D\u1019\u103A > aim;  # MA-final rime: "aim", consistent with the \u102D\u1019\u103A\u1038 rule
175
176# ိန် > ein;
177\u102D\u1014\u103A > ein;
178
179# ယ့် > ae; # 1c2v
180\u101A\u103A\u1037 > ae;
181
182# သျှ > sh; # 1c2v
183\u101E\u103B\u103E > sh;
184
185# လျှ > sh; # 1c2v
186\u101C\u103B\u103E > sh;
187
188# ရွှ > shw; # 1c2v
189\u101B\u103D\u103E > shw;
190
191# ြတ် > yat;
192\u103C\u1010\u103A > yat;
193
194# ျတ် > yat;
195\u103B\u1010\u103A > yat;
196
197# ြက်  > yet;
198\u103C\u1000\u103A > yet;  # MEDIAL RA + KA + ASAT
199
200# ျက် > yet;
201\u103B\u1000\u103A > yet;
202
203# ျင် > yin;
204\u103B\u1004\u103A > yin;
205
206# ြင် > yin;
207\u103C\u1004\u103A > yin;
208
209
210
211
212#  Character combinations: "3 vowels"
213# ော့ > ot;
214\u1031\u102C\u1037 > ot;
215
216# ေါ့ > ot;
217\u1031\u102B\u1037 > ot;
218
219# ော် > aw;
220\u1031\u102C\u103A > aw;
221
222# ေါ် > aw;
223\u1031\u102B\u103A > aw;
224
225# ို့ > hoet; # 3v
226\u102D\u102F\u1037 > hoet;
227
228# ိုး > oe;
229\u102D\u102F\u1038 > oe;
230
231# ုံး > one; # 3v
232\u102F\u1036\u1038 > one;
233
234# ျား > yarr;
235\u103B\u102C\u1038 > yarr;
236
237# ြား > yarr;
238\u103C\u102C\u1038 > yarr;
239
240# ြီး > yee;
241\u103C\u102E\u1038 > yee;
242
243# ($consonants) ြော  > | $1 yaww;
244($consonants) \u103C\u1031\u102C > | $1 yaww;
245
246# ($consonants) ျော  > | $1 yaww;
247($consonants) \u103B\u1031\u102C > | $1 yaww;
248
249# ွား > warr;
250\u103D\u102C\u1038 > warr;
251
252# ွေ့ > wae;
253\u103D\u1031\u1037 > wae;
254
255
256
257
258#  Character combinations: "1 consonant 1 vowel"
259#က် > at;
260\u1000\u103A > at;
261
262# င် > in;
263\u1004\u103A > in;
264
265# စ် > it;
266\u1005\u103A > it;
267
268# ဥ် > in;
269\u1009\u103A > in;
270\u1025\u103A > in;  # \u1025 is a misspelling of \u1009
271
272# ည် > i;
273\u100A\u103A > i;
274
275# ပ် > ut;
276\u1015\u103A > ut;
277
278# ယ် > al;
279\u101A\u103A > al;
280
281# တ် > at;
282\u1010\u103A > at;
283
284# န် > an;
285\u1014\u103A > an;
286
287# ရှ > sh; # 1c1v
288\u101B\u103E > sh;
289
290#  Character combinations: "2 vowels"
291# ြီ > ye;
292\u103C\u102E > ye;
293
294# ြု > yu;
295\u103C\u102F > yu;
296
297# ြေ > yay;
298\u103C\u1031 > yay;
299
300# ွေ > way;
301\u103D\u1031 > way;
302
303# ွဲ > wal;
304\u103D\u1032 > wal;
305
306# ှု > hu;
307\u103E\u102F > hu;
308
309# ူ့ > hu;
310\u1030\u1037 > hu;
311
312# ူး > uu;
313\u1030\u1038 > uu;
314
315# ါး > arr;
316\u102B\u1038 > arr;
317
318# ား > arr;
319\u102C\u1038 > arr;
320
321# ီး > ee;
322\u102E\u1038 > ee;
323
324# ေး > ayy;
325\u1031\u1038 > ayy;
326
327# ေ့ > ae;
328\u1031\u1037 > ae;
329
330# ဲ့ > ae;
331\u1032\u1037 > ae;
332
333# ော > aw;
334\u1031\u102C > aw;
335
336# ေါ > aw;
337\u1031\u102B > aw;
338
339# ို > o;
340\u102D\u102F > o;
341
342# ုံ > one;
343\u102F\u1036 > one;
344
345# ှာ > har;
346\u103E\u102C > har;
347
348
349
350
351
352# Character combinations: "1 vowel"
353
354# ါ > ar;
355\u102B > ar;
356
357# ာ  > ar;
358\u102C > ar;
359
360# ိ > i;
361\u102D > i;
362
363# ီ  > e;
364\u102E > e;
365
366# ု  > u;
367\u102F > u;
368
369# ူ > uu;
370\u1030 > uu;
371
372# ေ  > ay;
373\u1031 > ay;
374
375# ဲ  > ell;
376\u1032 > ell;
377
378# ံ  > an;
379\u1036 > an;
380
381# ျ > ya;
382\u103B > ya;
383
384# ြ  > ya;
385\u103C > ya;
386
387#  ှ  > ha;
388\u103E > ha;
389
390
391# Modern Myanmar digits
392\u1040 > 0 ;
393\u1041 > 1 ;
394\u1042 > 2 ;
395\u1043 > 3 ;
396\u1044 > 4 ;
397\u1045 > 5 ;
398\u1046 > 6 ;
399\u1047 > 7 ;
400\u1048 > 8 ;
401\u1049 > 9 ;
402
403# Myanmar Punctuation
404
405\u104A > \, ; # MYANMAR SIGN LITTLE SECTION
406\u104B > \. ; # MYANMAR SIGN SECTION
407\u104C > ; # MYANMAR SYMBOL LOCATIVE
408\u104D > ; # MYANMAR SYMBOL COMPLETED
409
410# Insert 'a' between two adjacent consonants.
411
412($consonants) ($consonants) > | $1 a $2 ;  # '|' puts the cursor back before $1, so both consonants are then romanized by the single-letter rules below
413
414# Consonant clusters
415# က္က > kk ;
416# က္ခ > khk ;
417# ဂ္ဂ > gg ;
418# ဂ္ဃ > ggh ;
419# င်္ဂ > ngg ;
420
421# Fundamental Burmese Consonants:
422# က > k;
423\u1000 > k;
424
425# ခ > hk;
426\u1001 > hk;
427
428# ဂ > g;
429\u1002 > g;
430
431# ဃ > gh;
432\u1003 > gh;
433
434# င > ng;
435\u1004 > ng;
436
437# စ > hc;
438\u1005 > hc;
439
440# ဆ > s;
441\u1006 > s;
442
443# ဇ > j;
444\u1007 > j;
445
446# ဈ > jh;
447\u1008 > jh;
448
449# ဉ > ny;
450\u1009 > ny;
451
452# ည > ny;
453\u100A > ny;
454
455# ဋ > t;
456\u100B > t;
457
458# ဌ > ht;
459\u100C > ht;
460
461# ဍ > d;
462\u100D > d;
463
464# ဎ > dh;
465\u100E > dh;
466
467# ဏ > n;
468\u100F > n;
469
470# တ > t;
471\u1010 > t;
472
473# ထ > ht;
474\u1011 > ht;
475
476# ဒ > d;
477\u1012 > d;
478
479# ဓ > dh;
480\u1013 > dh;
481
482# န > n;
483\u1014 > n;
484
485# ပ > p;
486\u1015 > p;
487
488# ဖ > hp;
489\u1016 > hp;
490
491# ဗ > b;
492\u1017 > b;
493
494# ဘ > bh;
495\u1018 > bh;
496
497# မ > m;
498\u1019 > m;
499
500# ယ > y;
501\u101A > y;
502
503# ရ > r;
504\u101B > r;
505
506# လ > l;
507\u101C > l;
508
509# ဝ > w;
510\u101D > w;
511
512# သ > s;
513\u101E > s;
514\u103F > s;  # ဿ (GREAT SA) - see https://www.eki.ee/wgrs/rom2_my.htm
515
516# ဟ > h;
517\u101F > h;
518
519# ဠ > l;
520\u1020 > l;
521
522# အ > a;
523\u1021 > a;
524
525# ဣ > i;
526\u1023 > i;
527
528# ဤ > i;
529\u1024 > i;
530
531# ဥ > u;
532\u1025 > u;
533
534# ဦ > u;
535\u1026 > u;
536
537# ဧ > e;
538\u1027 > e;
539
540# ဩ > au;
541\u1029 > au;
542
543# ဪ > au;
544\u102A > au;
545
546# TODO: this character repeats the previous romanized letter
547# း > ;
548\u1038 > ;
549
550# ့  > ;
551\u1037 > ;
552
553#  ်  > ;
554\u103A > ;
555
556# ၏ > eat ;
557\u104F > eat;
558
559# ္  > ;
560\u1039 > ;
561
562# Leftovers
563
564\u103D > w;
565
566::NFC(NFD);  # final pass: normalize to NFC in the forward direction (NFD is the inverse-direction counterpart)
567			]]></tRule>
568		</transform>
569	</transforms>
570</supplementalData>
571