blob: 7a9c0eeef38b2c3883da90ce62c256699dc287f0 [file] [log] [blame]
J. Duke319a3b92007-12-01 00:00:00 +00001/*
2 * Portions Copyright 2005 Sun Microsystems, Inc. All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation. Sun designates this
8 * particular file as subject to the "Classpath" exception as provided
9 * by Sun in the LICENSE file that accompanied this code.
10 *
11 * This code is distributed in the hope that it will be useful, but WITHOUT
12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 * version 2 for more details (a copy is included in the LICENSE file that
15 * accompanied this code).
16 *
17 * You should have received a copy of the GNU General Public License version
18 * 2 along with this work; if not, write to the Free Software Foundation,
19 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
20 *
21 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
22 * CA 95054 USA or visit www.sun.com if you need additional information or
23 * have any questions.
24 */
25
26/*
27 */
28
29/*
30 * (C) Copyright Taligent, Inc. 1996, 1997 - All Rights Reserved
31 * (C) Copyright IBM Corp. 1996 - 1998 - All Rights Reserved
32 *
33 * The original version of this source code and documentation
34 * is copyrighted and owned by Taligent, Inc., a wholly-owned
35 * subsidiary of IBM. These materials are provided under terms
36 * of a License Agreement between Taligent and Sun. This technology
37 * is protected by multiple US and International patents.
38 *
39 * This notice and attribution to Taligent may not be removed.
40 * Taligent is a registered trademark of Taligent, Inc.
41 *
42 */
43
44package sun.text.resources;
45
46import java.util.ListResourceBundle;
47
48public class CollationData_th extends ListResourceBundle {
49
50 protected final Object[][] getContents() {
51 return new Object[][] {
52 { "Rule",
53 "! " // First turn on the SE Asian Vowel/Consonant
54 // swapping rule
55 + "& Z " // Put in all of the consonants, after Z
56 + "< \u0E01 " // KO KAI
57 + "< \u0E02 " // KHO KHAI
58 + "< \u0E03 " // KHO KHUAT
59 + "< \u0E04 " // KHO KHWAI
60 + "< \u0E05 " // KHO KHON
61 + "< \u0E06 " // KHO RAKHANG
62 + "< \u0E07 " // NGO NGU
63 + "< \u0E08 " // CHO CHAN
64 + "< \u0E09 " // CHO CHING
65 + "< \u0E0A " // CHO CHANG
66 + "< \u0E0B " // SO SO
67 + "< \u0E0C " // CHO CHOE
68 + "< \u0E0D " // YO YING
69 + "< \u0E0E " // DO CHADA
70 + "< \u0E0F " // TO PATAK
71 + "< \u0E10 " // THO THAN
72 + "< \u0E11 " // THO NANGMONTHO
73 + "< \u0E12 " // THO PHUTHAO
74 + "< \u0E13 " // NO NEN
75 + "< \u0E14 " // DO DEK
76 + "< \u0E15 " // TO TAO
77 + "< \u0E16 " // THO THUNG
78 + "< \u0E17 " // THO THAHAN
79 + "< \u0E18 " // THO THONG
80 + "< \u0E19 " // NO NU
81 + "< \u0E1A " // BO BAIMAI
82 + "< \u0E1B " // PO PLA
83 + "< \u0E1C " // PHO PHUNG
84 + "< \u0E1D " // FO FA
85 + "< \u0E1E " // PHO PHAN
86 + "< \u0E1F " // FO FAN
87 + "< \u0E20 " // PHO SAMPHAO
88 + "< \u0E21 " // MO MA
89 + "< \u0E22 " // YO YAK
90 + "< \u0E23 " // RO RUA
91 + "< \u0E24 " // RU
92 + "< \u0E25 " // LO LING
93 + "< \u0E26 " // LU
94 + "< \u0E27 " // WO WAEN
95 + "< \u0E28 " // SO SALA
96 + "< \u0E29 " // SO RUSI
97 + "< \u0E2A " // SO SUA
98 + "< \u0E2B " // HO HIP
99 + "< \u0E2C " // LO CHULA
100 + "< \u0E2D " // O ANG
101 + "< \u0E2E " // HO NOKHUK
102
103 //
104 // Normal vowels
105 //
106 + "< \u0E30 " // SARA A
107 + "< \u0E31 " // MAI HAN-AKAT
108 + "< \u0E32 " // SARA AA
109
110 // Normalizer will decompose this character to \u0e4d\u0e32. This is
111 // a Bad Thing, because we want the separate characters to sort
112 // differently than this individual one. Since there's no public way to
113 // set the decomposition to be used when creating a collator, there's
114 // no way around this right now.
115 // It's best to go ahead and leave the character in, because it occurs
116 // this way a lot more often than it occurs as separate characters.
117 + "< \u0E33 " // SARA AM
118
119 + "< \u0E34 " // SARA I
120
121 + "< \u0E35 " // SARA II
122 + "< \u0E36 " // SARA UE
123 + "< \u0E37 " // SARA UEE
124 + "< \u0E38 " // SARA U
125 + "< \u0E39 " // SARA UU
126
127 //
128 // Preceding vowels
129 //
130 + "< \u0E40 " // SARA E
131 + "< \u0E41 " // SARA AE
132 + "< \u0E42 " // SARA O
133 + "< \u0E43 " // SARA AI MAIMUAN
134 + "< \u0E44 " // SARA AI MAIMALAI
135
136 //
137 // Digits
138 //
139 + "< \u0E50 " // DIGIT ZERO
140 + "< \u0E51 " // DIGIT ONE
141 + "< \u0E52 " // DIGIT TWO
142 + "< \u0E53 " // DIGIT THREE
143 + "< \u0E54 " // DIGIT FOUR
144 + "< \u0E55 " // DIGIT FIVE
145 + "< \u0E56 " // DIGIT SIX
146 + "< \u0E57 " // DIGIT SEVEN
147 + "< \u0E58 " // DIGIT EIGHT
148 + "< \u0E59 " // DIGIT NINE
149
150 // Sorta tonal marks, but maybe not really
151 + "< \u0E4D " // NIKHAHIT
152
153 //
154 // Thai symbols are supposed to sort "after white space".
155 // I'm treating this as making them sort just after the normal Latin-1
156 // symbols, which are in turn after the white space.
157 //
158 + "&'\u007d'" // right-brace
159 + "< \u0E2F " // PAIYANNOI (ellipsis, abbreviation)
160 + "< \u0E46 " // MAIYAMOK
161 + "< \u0E4F " // FONGMAN
162 + "< \u0E5A " // ANGKHANKHU
163 + "< \u0E5B " // KHOMUT
164 + "< \u0E3F " // CURRENCY SYMBOL BAHT
165
166 // These symbols are supposed to be "after all characters"
167 + "< \u0E4E " // YAMAKKAN
168
169 // This rare symbol also comes after all characters. But when it is
170 // used in combination with RU and LU, the combination is treated as
171 // a separate letter, ala "CH" sorting after "C" in traditional Spanish.
172 + "< \u0E45 " // LAKKHANGYAO
173 + "& \u0E24 < \u0E24\u0E45 "
174 + "& \u0E26 < \u0E26\u0E45 "
175
176 // Tonal marks are primary ignorables but are treated as secondary
177 // differences
178 + "& \u0301 " // acute accent
179 + "; \u0E47 " // MAITAIKHU
180 + "; \u0E48 " // MAI EK
181 + "; \u0E49 " // MAI THO
182 + "; \u0E4A " // MAI TRI
183 + "; \u0E4B " // MAI CHATTAWA
184 + "; \u0E4C " // THANTHAKHAT
185
186
187 // These are supposed to be ignored, so I'm treating them as controls
188 + "& \u0001 "
189 + "= \u0E3A " // PHINTHU
190 + "= '.' " // period
191 }
192 };
193 }
194}