1*0e209d39SAndroid Build Coastguard Worker // © 2016 and later: Unicode, Inc. and others.
2*0e209d39SAndroid Build Coastguard Worker // License & terms of use: http://www.unicode.org/copyright.html
3*0e209d39SAndroid Build Coastguard Worker /*
4*0e209d39SAndroid Build Coastguard Worker **********************************************************************
5*0e209d39SAndroid Build Coastguard Worker * Copyright (c) 2002-2014, International Business Machines Corporation
6*0e209d39SAndroid Build Coastguard Worker * and others. All Rights Reserved.
7*0e209d39SAndroid Build Coastguard Worker **********************************************************************
8*0e209d39SAndroid Build Coastguard Worker * Date Name Description
9*0e209d39SAndroid Build Coastguard Worker * 01/14/2002 aliu Creation.
10*0e209d39SAndroid Build Coastguard Worker **********************************************************************
11*0e209d39SAndroid Build Coastguard Worker */
12*0e209d39SAndroid Build Coastguard Worker
13*0e209d39SAndroid Build Coastguard Worker #include "unicode/utypes.h"
14*0e209d39SAndroid Build Coastguard Worker
15*0e209d39SAndroid Build Coastguard Worker #if !UCONFIG_NO_TRANSLITERATION
16*0e209d39SAndroid Build Coastguard Worker
17*0e209d39SAndroid Build Coastguard Worker #include "tridpars.h"
18*0e209d39SAndroid Build Coastguard Worker #include "hash.h"
19*0e209d39SAndroid Build Coastguard Worker #include "mutex.h"
20*0e209d39SAndroid Build Coastguard Worker #include "transreg.h"
21*0e209d39SAndroid Build Coastguard Worker #include "uassert.h"
22*0e209d39SAndroid Build Coastguard Worker #include "ucln_in.h"
23*0e209d39SAndroid Build Coastguard Worker #include "unicode/parsepos.h"
24*0e209d39SAndroid Build Coastguard Worker #include "unicode/translit.h"
25*0e209d39SAndroid Build Coastguard Worker #include "unicode/uchar.h"
26*0e209d39SAndroid Build Coastguard Worker #include "unicode/uniset.h"
27*0e209d39SAndroid Build Coastguard Worker #include "unicode/unistr.h"
28*0e209d39SAndroid Build Coastguard Worker #include "unicode/utrans.h"
29*0e209d39SAndroid Build Coastguard Worker #include "util.h"
30*0e209d39SAndroid Build Coastguard Worker #include "uvector.h"
31*0e209d39SAndroid Build Coastguard Worker
32*0e209d39SAndroid Build Coastguard Worker U_NAMESPACE_BEGIN
33*0e209d39SAndroid Build Coastguard Worker
// Syntax characters used in transliterator IDs.
static const char16_t ID_DELIM    = u';'; // U+003B, separates the elements of a compound ID
static const char16_t TARGET_SEP  = u'-'; // U+002D, separates source from target
static const char16_t VARIANT_SEP = u'/'; // U+002F, introduces the variant
static const char16_t OPEN_REV    = u'('; // U+0028, opens the reverse part of an ID
static const char16_t CLOSE_REV   = u')'; // U+0029, closes the reverse part of an ID

//static const char16_t EMPTY[] = {0}; // ""
// NUL-terminated names of well-known IDs.
static const char16_t ANY[]      = u"Any";      // 3 code units + terminator
static const char16_t ANY_NULL[] = u"Any-Null"; // 8 code units + terminator
43*0e209d39SAndroid Build Coastguard Worker
44*0e209d39SAndroid Build Coastguard Worker static const int32_t FORWARD = UTRANS_FORWARD;
45*0e209d39SAndroid Build Coastguard Worker static const int32_t REVERSE = UTRANS_REVERSE;
46*0e209d39SAndroid Build Coastguard Worker
47*0e209d39SAndroid Build Coastguard Worker static Hashtable* SPECIAL_INVERSES = nullptr;
48*0e209d39SAndroid Build Coastguard Worker static UInitOnce gSpecialInversesInitOnce {};
49*0e209d39SAndroid Build Coastguard Worker
50*0e209d39SAndroid Build Coastguard Worker /**
51*0e209d39SAndroid Build Coastguard Worker * The mutex controlling access to SPECIAL_INVERSES
52*0e209d39SAndroid Build Coastguard Worker */
53*0e209d39SAndroid Build Coastguard Worker static UMutex LOCK;
54*0e209d39SAndroid Build Coastguard Worker
Specs(const UnicodeString & s,const UnicodeString & t,const UnicodeString & v,UBool sawS,const UnicodeString & f)55*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::Specs::Specs(const UnicodeString& s, const UnicodeString& t,
56*0e209d39SAndroid Build Coastguard Worker const UnicodeString& v, UBool sawS,
57*0e209d39SAndroid Build Coastguard Worker const UnicodeString& f) {
58*0e209d39SAndroid Build Coastguard Worker source = s;
59*0e209d39SAndroid Build Coastguard Worker target = t;
60*0e209d39SAndroid Build Coastguard Worker variant = v;
61*0e209d39SAndroid Build Coastguard Worker sawSource = sawS;
62*0e209d39SAndroid Build Coastguard Worker filter = f;
63*0e209d39SAndroid Build Coastguard Worker }
64*0e209d39SAndroid Build Coastguard Worker
SingleID(const UnicodeString & c,const UnicodeString & b,const UnicodeString & f)65*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID::SingleID(const UnicodeString& c, const UnicodeString& b,
66*0e209d39SAndroid Build Coastguard Worker const UnicodeString& f) {
67*0e209d39SAndroid Build Coastguard Worker canonID = c;
68*0e209d39SAndroid Build Coastguard Worker basicID = b;
69*0e209d39SAndroid Build Coastguard Worker filter = f;
70*0e209d39SAndroid Build Coastguard Worker }
71*0e209d39SAndroid Build Coastguard Worker
SingleID(const UnicodeString & c,const UnicodeString & b)72*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID::SingleID(const UnicodeString& c, const UnicodeString& b) {
73*0e209d39SAndroid Build Coastguard Worker canonID = c;
74*0e209d39SAndroid Build Coastguard Worker basicID = b;
75*0e209d39SAndroid Build Coastguard Worker }
76*0e209d39SAndroid Build Coastguard Worker
createInstance()77*0e209d39SAndroid Build Coastguard Worker Transliterator* TransliteratorIDParser::SingleID::createInstance() {
78*0e209d39SAndroid Build Coastguard Worker Transliterator* t;
79*0e209d39SAndroid Build Coastguard Worker if (basicID.length() == 0) {
80*0e209d39SAndroid Build Coastguard Worker t = createBasicInstance(UnicodeString(true, ANY_NULL, 8), &canonID);
81*0e209d39SAndroid Build Coastguard Worker } else {
82*0e209d39SAndroid Build Coastguard Worker t = createBasicInstance(basicID, &canonID);
83*0e209d39SAndroid Build Coastguard Worker }
84*0e209d39SAndroid Build Coastguard Worker if (t != nullptr) {
85*0e209d39SAndroid Build Coastguard Worker if (filter.length() != 0) {
86*0e209d39SAndroid Build Coastguard Worker UErrorCode ec = U_ZERO_ERROR;
87*0e209d39SAndroid Build Coastguard Worker UnicodeSet *set = new UnicodeSet(filter, ec);
88*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
89*0e209d39SAndroid Build Coastguard Worker delete set;
90*0e209d39SAndroid Build Coastguard Worker } else {
91*0e209d39SAndroid Build Coastguard Worker t->adoptFilter(set);
92*0e209d39SAndroid Build Coastguard Worker }
93*0e209d39SAndroid Build Coastguard Worker }
94*0e209d39SAndroid Build Coastguard Worker }
95*0e209d39SAndroid Build Coastguard Worker return t;
96*0e209d39SAndroid Build Coastguard Worker }
97*0e209d39SAndroid Build Coastguard Worker
98*0e209d39SAndroid Build Coastguard Worker
99*0e209d39SAndroid Build Coastguard Worker /**
100*0e209d39SAndroid Build Coastguard Worker * Parse a single ID, that is, an ID of the general form
101*0e209d39SAndroid Build Coastguard Worker * "[f1] s1-t1/v1 ([f2] s2-t3/v2)", with the parenthesized element
102*0e209d39SAndroid Build Coastguard Worker * optional, the filters optional, and the variants optional.
103*0e209d39SAndroid Build Coastguard Worker * @param id the id to be parsed
104*0e209d39SAndroid Build Coastguard Worker * @param pos INPUT-OUTPUT parameter. On input, the position of
105*0e209d39SAndroid Build Coastguard Worker * the first character to parse. On output, the position after
106*0e209d39SAndroid Build Coastguard Worker * the last character parsed.
107*0e209d39SAndroid Build Coastguard Worker * @param dir the direction. If the direction is REVERSE then the
108*0e209d39SAndroid Build Coastguard Worker * SingleID is constructed for the reverse direction.
109*0e209d39SAndroid Build Coastguard Worker * @return a SingleID object or nullptr
110*0e209d39SAndroid Build Coastguard Worker */
111*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID*
parseSingleID(const UnicodeString & id,int32_t & pos,int32_t dir,UErrorCode & status)112*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::parseSingleID(const UnicodeString& id, int32_t& pos,
113*0e209d39SAndroid Build Coastguard Worker int32_t dir, UErrorCode& status) {
114*0e209d39SAndroid Build Coastguard Worker
115*0e209d39SAndroid Build Coastguard Worker int32_t start = pos;
116*0e209d39SAndroid Build Coastguard Worker
117*0e209d39SAndroid Build Coastguard Worker // The ID will be of the form A, A(), A(B), or (B), where
118*0e209d39SAndroid Build Coastguard Worker // A and B are filter IDs.
119*0e209d39SAndroid Build Coastguard Worker Specs* specsA = nullptr;
120*0e209d39SAndroid Build Coastguard Worker Specs* specsB = nullptr;
121*0e209d39SAndroid Build Coastguard Worker UBool sawParen = false;
122*0e209d39SAndroid Build Coastguard Worker
123*0e209d39SAndroid Build Coastguard Worker // On the first pass, look for (B) or (). If this fails, then
124*0e209d39SAndroid Build Coastguard Worker // on the second pass, look for A, A(B), or A().
125*0e209d39SAndroid Build Coastguard Worker for (int32_t pass=1; pass<=2; ++pass) {
126*0e209d39SAndroid Build Coastguard Worker if (pass == 2) {
127*0e209d39SAndroid Build Coastguard Worker specsA = parseFilterID(id, pos, true);
128*0e209d39SAndroid Build Coastguard Worker if (specsA == nullptr) {
129*0e209d39SAndroid Build Coastguard Worker pos = start;
130*0e209d39SAndroid Build Coastguard Worker return nullptr;
131*0e209d39SAndroid Build Coastguard Worker }
132*0e209d39SAndroid Build Coastguard Worker }
133*0e209d39SAndroid Build Coastguard Worker if (ICU_Utility::parseChar(id, pos, OPEN_REV)) {
134*0e209d39SAndroid Build Coastguard Worker sawParen = true;
135*0e209d39SAndroid Build Coastguard Worker if (!ICU_Utility::parseChar(id, pos, CLOSE_REV)) {
136*0e209d39SAndroid Build Coastguard Worker specsB = parseFilterID(id, pos, true);
137*0e209d39SAndroid Build Coastguard Worker // Must close with a ')'
138*0e209d39SAndroid Build Coastguard Worker if (specsB == nullptr || !ICU_Utility::parseChar(id, pos, CLOSE_REV)) {
139*0e209d39SAndroid Build Coastguard Worker delete specsA;
140*0e209d39SAndroid Build Coastguard Worker pos = start;
141*0e209d39SAndroid Build Coastguard Worker return nullptr;
142*0e209d39SAndroid Build Coastguard Worker }
143*0e209d39SAndroid Build Coastguard Worker }
144*0e209d39SAndroid Build Coastguard Worker break;
145*0e209d39SAndroid Build Coastguard Worker }
146*0e209d39SAndroid Build Coastguard Worker }
147*0e209d39SAndroid Build Coastguard Worker
148*0e209d39SAndroid Build Coastguard Worker // Assemble return results
149*0e209d39SAndroid Build Coastguard Worker SingleID* single;
150*0e209d39SAndroid Build Coastguard Worker if (sawParen) {
151*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
152*0e209d39SAndroid Build Coastguard Worker SingleID* b = specsToID(specsB, FORWARD);
153*0e209d39SAndroid Build Coastguard Worker single = specsToID(specsA, FORWARD);
154*0e209d39SAndroid Build Coastguard Worker // Null pointers check
155*0e209d39SAndroid Build Coastguard Worker if (b == nullptr || single == nullptr) {
156*0e209d39SAndroid Build Coastguard Worker delete b;
157*0e209d39SAndroid Build Coastguard Worker delete single;
158*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
159*0e209d39SAndroid Build Coastguard Worker return nullptr;
160*0e209d39SAndroid Build Coastguard Worker }
161*0e209d39SAndroid Build Coastguard Worker single->canonID.append(OPEN_REV)
162*0e209d39SAndroid Build Coastguard Worker .append(b->canonID).append(CLOSE_REV);
163*0e209d39SAndroid Build Coastguard Worker if (specsA != nullptr) {
164*0e209d39SAndroid Build Coastguard Worker single->filter = specsA->filter;
165*0e209d39SAndroid Build Coastguard Worker }
166*0e209d39SAndroid Build Coastguard Worker delete b;
167*0e209d39SAndroid Build Coastguard Worker } else {
168*0e209d39SAndroid Build Coastguard Worker SingleID* a = specsToID(specsA, FORWARD);
169*0e209d39SAndroid Build Coastguard Worker single = specsToID(specsB, FORWARD);
170*0e209d39SAndroid Build Coastguard Worker // Check for null pointer.
171*0e209d39SAndroid Build Coastguard Worker if (a == nullptr || single == nullptr) {
172*0e209d39SAndroid Build Coastguard Worker delete a;
173*0e209d39SAndroid Build Coastguard Worker delete single;
174*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
175*0e209d39SAndroid Build Coastguard Worker return nullptr;
176*0e209d39SAndroid Build Coastguard Worker }
177*0e209d39SAndroid Build Coastguard Worker single->canonID.append(OPEN_REV)
178*0e209d39SAndroid Build Coastguard Worker .append(a->canonID).append(CLOSE_REV);
179*0e209d39SAndroid Build Coastguard Worker if (specsB != nullptr) {
180*0e209d39SAndroid Build Coastguard Worker single->filter = specsB->filter;
181*0e209d39SAndroid Build Coastguard Worker }
182*0e209d39SAndroid Build Coastguard Worker delete a;
183*0e209d39SAndroid Build Coastguard Worker }
184*0e209d39SAndroid Build Coastguard Worker } else {
185*0e209d39SAndroid Build Coastguard Worker // assert(specsA != nullptr);
186*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
187*0e209d39SAndroid Build Coastguard Worker single = specsToID(specsA, FORWARD);
188*0e209d39SAndroid Build Coastguard Worker } else {
189*0e209d39SAndroid Build Coastguard Worker single = specsToSpecialInverse(*specsA, status);
190*0e209d39SAndroid Build Coastguard Worker if (single == nullptr) {
191*0e209d39SAndroid Build Coastguard Worker single = specsToID(specsA, REVERSE);
192*0e209d39SAndroid Build Coastguard Worker }
193*0e209d39SAndroid Build Coastguard Worker }
194*0e209d39SAndroid Build Coastguard Worker // Check for nullptr pointer
195*0e209d39SAndroid Build Coastguard Worker if (single == nullptr) {
196*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
197*0e209d39SAndroid Build Coastguard Worker return nullptr;
198*0e209d39SAndroid Build Coastguard Worker }
199*0e209d39SAndroid Build Coastguard Worker single->filter = specsA->filter;
200*0e209d39SAndroid Build Coastguard Worker }
201*0e209d39SAndroid Build Coastguard Worker
202*0e209d39SAndroid Build Coastguard Worker delete specsA;
203*0e209d39SAndroid Build Coastguard Worker delete specsB;
204*0e209d39SAndroid Build Coastguard Worker
205*0e209d39SAndroid Build Coastguard Worker return single;
206*0e209d39SAndroid Build Coastguard Worker }
207*0e209d39SAndroid Build Coastguard Worker
208*0e209d39SAndroid Build Coastguard Worker /**
209*0e209d39SAndroid Build Coastguard Worker * Parse a filter ID, that is, an ID of the general form
210*0e209d39SAndroid Build Coastguard Worker * "[f1] s1-t1/v1", with the filters optional, and the variants optional.
211*0e209d39SAndroid Build Coastguard Worker * @param id the id to be parsed
212*0e209d39SAndroid Build Coastguard Worker * @param pos INPUT-OUTPUT parameter. On input, the position of
213*0e209d39SAndroid Build Coastguard Worker * the first character to parse. On output, the position after
214*0e209d39SAndroid Build Coastguard Worker * the last character parsed.
215*0e209d39SAndroid Build Coastguard Worker * @return a SingleID object or null if the parse fails
216*0e209d39SAndroid Build Coastguard Worker */
217*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID*
parseFilterID(const UnicodeString & id,int32_t & pos)218*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::parseFilterID(const UnicodeString& id, int32_t& pos) {
219*0e209d39SAndroid Build Coastguard Worker
220*0e209d39SAndroid Build Coastguard Worker int32_t start = pos;
221*0e209d39SAndroid Build Coastguard Worker
222*0e209d39SAndroid Build Coastguard Worker Specs* specs = parseFilterID(id, pos, true);
223*0e209d39SAndroid Build Coastguard Worker if (specs == nullptr) {
224*0e209d39SAndroid Build Coastguard Worker pos = start;
225*0e209d39SAndroid Build Coastguard Worker return nullptr;
226*0e209d39SAndroid Build Coastguard Worker }
227*0e209d39SAndroid Build Coastguard Worker
228*0e209d39SAndroid Build Coastguard Worker // Assemble return results
229*0e209d39SAndroid Build Coastguard Worker SingleID* single = specsToID(specs, FORWARD);
230*0e209d39SAndroid Build Coastguard Worker if (single != nullptr) {
231*0e209d39SAndroid Build Coastguard Worker single->filter = specs->filter;
232*0e209d39SAndroid Build Coastguard Worker }
233*0e209d39SAndroid Build Coastguard Worker delete specs;
234*0e209d39SAndroid Build Coastguard Worker return single;
235*0e209d39SAndroid Build Coastguard Worker }
236*0e209d39SAndroid Build Coastguard Worker
237*0e209d39SAndroid Build Coastguard Worker /**
238*0e209d39SAndroid Build Coastguard Worker * Parse a global filter of the form "[f]" or "([f])", depending
239*0e209d39SAndroid Build Coastguard Worker * on 'withParens'.
240*0e209d39SAndroid Build Coastguard Worker * @param id the pattern the parse
241*0e209d39SAndroid Build Coastguard Worker * @param pos INPUT-OUTPUT parameter. On input, the position of
242*0e209d39SAndroid Build Coastguard Worker * the first character to parse. On output, the position after
243*0e209d39SAndroid Build Coastguard Worker * the last character parsed.
244*0e209d39SAndroid Build Coastguard Worker * @param dir the direction.
245*0e209d39SAndroid Build Coastguard Worker * @param withParens INPUT-OUTPUT parameter. On entry, if
246*0e209d39SAndroid Build Coastguard Worker * withParens is 0, then parens are disallowed. If it is 1,
247*0e209d39SAndroid Build Coastguard Worker * then parens are requires. If it is -1, then parens are
248*0e209d39SAndroid Build Coastguard Worker * optional, and the return result will be set to 0 or 1.
249*0e209d39SAndroid Build Coastguard Worker * @param canonID OUTPUT parameter. The pattern for the filter
250*0e209d39SAndroid Build Coastguard Worker * added to the canonID, either at the end, if dir is FORWARD, or
251*0e209d39SAndroid Build Coastguard Worker * at the start, if dir is REVERSE. The pattern will be enclosed
252*0e209d39SAndroid Build Coastguard Worker * in parentheses if appropriate, and will be suffixed with an
253*0e209d39SAndroid Build Coastguard Worker * ID_DELIM character. May be nullptr.
254*0e209d39SAndroid Build Coastguard Worker * @return a UnicodeSet object or nullptr. A non-nullptr results
255*0e209d39SAndroid Build Coastguard Worker * indicates a successful parse, regardless of whether the filter
256*0e209d39SAndroid Build Coastguard Worker * applies to the given direction. The caller should discard it
257*0e209d39SAndroid Build Coastguard Worker * if withParens != (dir == REVERSE).
258*0e209d39SAndroid Build Coastguard Worker */
parseGlobalFilter(const UnicodeString & id,int32_t & pos,int32_t dir,int32_t & withParens,UnicodeString * canonID)259*0e209d39SAndroid Build Coastguard Worker UnicodeSet* TransliteratorIDParser::parseGlobalFilter(const UnicodeString& id, int32_t& pos,
260*0e209d39SAndroid Build Coastguard Worker int32_t dir,
261*0e209d39SAndroid Build Coastguard Worker int32_t& withParens,
262*0e209d39SAndroid Build Coastguard Worker UnicodeString* canonID) {
263*0e209d39SAndroid Build Coastguard Worker UnicodeSet* filter = nullptr;
264*0e209d39SAndroid Build Coastguard Worker int32_t start = pos;
265*0e209d39SAndroid Build Coastguard Worker
266*0e209d39SAndroid Build Coastguard Worker if (withParens == -1) {
267*0e209d39SAndroid Build Coastguard Worker withParens = ICU_Utility::parseChar(id, pos, OPEN_REV) ? 1 : 0;
268*0e209d39SAndroid Build Coastguard Worker } else if (withParens == 1) {
269*0e209d39SAndroid Build Coastguard Worker if (!ICU_Utility::parseChar(id, pos, OPEN_REV)) {
270*0e209d39SAndroid Build Coastguard Worker pos = start;
271*0e209d39SAndroid Build Coastguard Worker return nullptr;
272*0e209d39SAndroid Build Coastguard Worker }
273*0e209d39SAndroid Build Coastguard Worker }
274*0e209d39SAndroid Build Coastguard Worker
275*0e209d39SAndroid Build Coastguard Worker ICU_Utility::skipWhitespace(id, pos, true);
276*0e209d39SAndroid Build Coastguard Worker
277*0e209d39SAndroid Build Coastguard Worker if (UnicodeSet::resemblesPattern(id, pos)) {
278*0e209d39SAndroid Build Coastguard Worker ParsePosition ppos(pos);
279*0e209d39SAndroid Build Coastguard Worker UErrorCode ec = U_ZERO_ERROR;
280*0e209d39SAndroid Build Coastguard Worker filter = new UnicodeSet(id, ppos, USET_IGNORE_SPACE, nullptr, ec);
281*0e209d39SAndroid Build Coastguard Worker /* test for nullptr */
282*0e209d39SAndroid Build Coastguard Worker if (filter == nullptr) {
283*0e209d39SAndroid Build Coastguard Worker pos = start;
284*0e209d39SAndroid Build Coastguard Worker return nullptr;
285*0e209d39SAndroid Build Coastguard Worker }
286*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
287*0e209d39SAndroid Build Coastguard Worker delete filter;
288*0e209d39SAndroid Build Coastguard Worker pos = start;
289*0e209d39SAndroid Build Coastguard Worker return nullptr;
290*0e209d39SAndroid Build Coastguard Worker }
291*0e209d39SAndroid Build Coastguard Worker
292*0e209d39SAndroid Build Coastguard Worker UnicodeString pattern;
293*0e209d39SAndroid Build Coastguard Worker id.extractBetween(pos, ppos.getIndex(), pattern);
294*0e209d39SAndroid Build Coastguard Worker pos = ppos.getIndex();
295*0e209d39SAndroid Build Coastguard Worker
296*0e209d39SAndroid Build Coastguard Worker if (withParens == 1 && !ICU_Utility::parseChar(id, pos, CLOSE_REV)) {
297*0e209d39SAndroid Build Coastguard Worker delete filter;
298*0e209d39SAndroid Build Coastguard Worker pos = start;
299*0e209d39SAndroid Build Coastguard Worker return nullptr;
300*0e209d39SAndroid Build Coastguard Worker }
301*0e209d39SAndroid Build Coastguard Worker
302*0e209d39SAndroid Build Coastguard Worker // In the forward direction, append the pattern to the
303*0e209d39SAndroid Build Coastguard Worker // canonID. In the reverse, insert it at zero, and invert
304*0e209d39SAndroid Build Coastguard Worker // the presence of parens ("A" <-> "(A)").
305*0e209d39SAndroid Build Coastguard Worker if (canonID != nullptr) {
306*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
307*0e209d39SAndroid Build Coastguard Worker if (withParens == 1) {
308*0e209d39SAndroid Build Coastguard Worker pattern.insert(0, OPEN_REV);
309*0e209d39SAndroid Build Coastguard Worker pattern.append(CLOSE_REV);
310*0e209d39SAndroid Build Coastguard Worker }
311*0e209d39SAndroid Build Coastguard Worker canonID->append(pattern).append(ID_DELIM);
312*0e209d39SAndroid Build Coastguard Worker } else {
313*0e209d39SAndroid Build Coastguard Worker if (withParens == 0) {
314*0e209d39SAndroid Build Coastguard Worker pattern.insert(0, OPEN_REV);
315*0e209d39SAndroid Build Coastguard Worker pattern.append(CLOSE_REV);
316*0e209d39SAndroid Build Coastguard Worker }
317*0e209d39SAndroid Build Coastguard Worker canonID->insert(0, pattern);
318*0e209d39SAndroid Build Coastguard Worker canonID->insert(pattern.length(), ID_DELIM);
319*0e209d39SAndroid Build Coastguard Worker }
320*0e209d39SAndroid Build Coastguard Worker }
321*0e209d39SAndroid Build Coastguard Worker }
322*0e209d39SAndroid Build Coastguard Worker
323*0e209d39SAndroid Build Coastguard Worker return filter;
324*0e209d39SAndroid Build Coastguard Worker }
325*0e209d39SAndroid Build Coastguard Worker
326*0e209d39SAndroid Build Coastguard Worker U_CDECL_BEGIN
_deleteSingleID(void * obj)327*0e209d39SAndroid Build Coastguard Worker static void U_CALLCONV _deleteSingleID(void* obj) {
328*0e209d39SAndroid Build Coastguard Worker delete (TransliteratorIDParser::SingleID*) obj;
329*0e209d39SAndroid Build Coastguard Worker }
330*0e209d39SAndroid Build Coastguard Worker
_deleteTransliteratorTrIDPars(void * obj)331*0e209d39SAndroid Build Coastguard Worker static void U_CALLCONV _deleteTransliteratorTrIDPars(void* obj) {
332*0e209d39SAndroid Build Coastguard Worker delete (Transliterator*) obj;
333*0e209d39SAndroid Build Coastguard Worker }
334*0e209d39SAndroid Build Coastguard Worker U_CDECL_END
335*0e209d39SAndroid Build Coastguard Worker
336*0e209d39SAndroid Build Coastguard Worker /**
337*0e209d39SAndroid Build Coastguard Worker * Parse a compound ID, consisting of an optional forward global
338*0e209d39SAndroid Build Coastguard Worker * filter, a separator, one or more single IDs delimited by
339*0e209d39SAndroid Build Coastguard Worker * separators, an an optional reverse global filter. The
340*0e209d39SAndroid Build Coastguard Worker * separator is a semicolon. The global filters are UnicodeSet
341*0e209d39SAndroid Build Coastguard Worker * patterns. The reverse global filter must be enclosed in
342*0e209d39SAndroid Build Coastguard Worker * parentheses.
343*0e209d39SAndroid Build Coastguard Worker * @param id the pattern the parse
344*0e209d39SAndroid Build Coastguard Worker * @param dir the direction.
345*0e209d39SAndroid Build Coastguard Worker * @param canonID OUTPUT parameter that receives the canonical ID,
346*0e209d39SAndroid Build Coastguard Worker * consisting of canonical IDs for all elements, as returned by
347*0e209d39SAndroid Build Coastguard Worker * parseSingleID(), separated by semicolons. Previous contents
348*0e209d39SAndroid Build Coastguard Worker * are discarded.
349*0e209d39SAndroid Build Coastguard Worker * @param list OUTPUT parameter that receives a list of SingleID
350*0e209d39SAndroid Build Coastguard Worker * objects representing the parsed IDs. Previous contents are
351*0e209d39SAndroid Build Coastguard Worker * discarded.
352*0e209d39SAndroid Build Coastguard Worker * @param globalFilter OUTPUT parameter that receives a pointer to
353*0e209d39SAndroid Build Coastguard Worker * a newly created global filter for this ID in this direction, or
354*0e209d39SAndroid Build Coastguard Worker * nullptr if there is none.
355*0e209d39SAndroid Build Coastguard Worker * @return true if the parse succeeds, that is, if the entire
356*0e209d39SAndroid Build Coastguard Worker * id is consumed without syntax error.
357*0e209d39SAndroid Build Coastguard Worker */
parseCompoundID(const UnicodeString & id,int32_t dir,UnicodeString & canonID,UVector & list,UnicodeSet * & globalFilter)358*0e209d39SAndroid Build Coastguard Worker UBool TransliteratorIDParser::parseCompoundID(const UnicodeString& id, int32_t dir,
359*0e209d39SAndroid Build Coastguard Worker UnicodeString& canonID,
360*0e209d39SAndroid Build Coastguard Worker UVector& list,
361*0e209d39SAndroid Build Coastguard Worker UnicodeSet*& globalFilter) {
362*0e209d39SAndroid Build Coastguard Worker UErrorCode ec = U_ZERO_ERROR;
363*0e209d39SAndroid Build Coastguard Worker int32_t i;
364*0e209d39SAndroid Build Coastguard Worker int32_t pos = 0;
365*0e209d39SAndroid Build Coastguard Worker int32_t withParens = 1;
366*0e209d39SAndroid Build Coastguard Worker list.removeAllElements();
367*0e209d39SAndroid Build Coastguard Worker UObjectDeleter *save = list.setDeleter(_deleteSingleID);
368*0e209d39SAndroid Build Coastguard Worker
369*0e209d39SAndroid Build Coastguard Worker UnicodeSet* filter;
370*0e209d39SAndroid Build Coastguard Worker globalFilter = nullptr;
371*0e209d39SAndroid Build Coastguard Worker canonID.truncate(0);
372*0e209d39SAndroid Build Coastguard Worker
373*0e209d39SAndroid Build Coastguard Worker // Parse leading global filter, if any
374*0e209d39SAndroid Build Coastguard Worker withParens = 0; // parens disallowed
375*0e209d39SAndroid Build Coastguard Worker filter = parseGlobalFilter(id, pos, dir, withParens, &canonID);
376*0e209d39SAndroid Build Coastguard Worker if (filter != nullptr) {
377*0e209d39SAndroid Build Coastguard Worker if (!ICU_Utility::parseChar(id, pos, ID_DELIM)) {
378*0e209d39SAndroid Build Coastguard Worker // Not a global filter; backup and resume
379*0e209d39SAndroid Build Coastguard Worker canonID.truncate(0);
380*0e209d39SAndroid Build Coastguard Worker pos = 0;
381*0e209d39SAndroid Build Coastguard Worker }
382*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
383*0e209d39SAndroid Build Coastguard Worker globalFilter = filter;
384*0e209d39SAndroid Build Coastguard Worker } else {
385*0e209d39SAndroid Build Coastguard Worker delete filter;
386*0e209d39SAndroid Build Coastguard Worker }
387*0e209d39SAndroid Build Coastguard Worker filter = nullptr;
388*0e209d39SAndroid Build Coastguard Worker }
389*0e209d39SAndroid Build Coastguard Worker
390*0e209d39SAndroid Build Coastguard Worker UBool sawDelimiter = true;
391*0e209d39SAndroid Build Coastguard Worker for (;;) {
392*0e209d39SAndroid Build Coastguard Worker SingleID* single = parseSingleID(id, pos, dir, ec);
393*0e209d39SAndroid Build Coastguard Worker if (single == nullptr) {
394*0e209d39SAndroid Build Coastguard Worker break;
395*0e209d39SAndroid Build Coastguard Worker }
396*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
397*0e209d39SAndroid Build Coastguard Worker list.adoptElement(single, ec);
398*0e209d39SAndroid Build Coastguard Worker } else {
399*0e209d39SAndroid Build Coastguard Worker list.insertElementAt(single, 0, ec);
400*0e209d39SAndroid Build Coastguard Worker }
401*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
402*0e209d39SAndroid Build Coastguard Worker goto FAIL;
403*0e209d39SAndroid Build Coastguard Worker }
404*0e209d39SAndroid Build Coastguard Worker if (!ICU_Utility::parseChar(id, pos, ID_DELIM)) {
405*0e209d39SAndroid Build Coastguard Worker sawDelimiter = false;
406*0e209d39SAndroid Build Coastguard Worker break;
407*0e209d39SAndroid Build Coastguard Worker }
408*0e209d39SAndroid Build Coastguard Worker }
409*0e209d39SAndroid Build Coastguard Worker
410*0e209d39SAndroid Build Coastguard Worker if (list.size() == 0) {
411*0e209d39SAndroid Build Coastguard Worker goto FAIL;
412*0e209d39SAndroid Build Coastguard Worker }
413*0e209d39SAndroid Build Coastguard Worker
414*0e209d39SAndroid Build Coastguard Worker // Construct canonical ID
415*0e209d39SAndroid Build Coastguard Worker for (i=0; i<list.size(); ++i) {
416*0e209d39SAndroid Build Coastguard Worker SingleID* single = (SingleID*) list.elementAt(i);
417*0e209d39SAndroid Build Coastguard Worker canonID.append(single->canonID);
418*0e209d39SAndroid Build Coastguard Worker if (i != (list.size()-1)) {
419*0e209d39SAndroid Build Coastguard Worker canonID.append(ID_DELIM);
420*0e209d39SAndroid Build Coastguard Worker }
421*0e209d39SAndroid Build Coastguard Worker }
422*0e209d39SAndroid Build Coastguard Worker
423*0e209d39SAndroid Build Coastguard Worker // Parse trailing global filter, if any, and only if we saw
424*0e209d39SAndroid Build Coastguard Worker // a trailing delimiter after the IDs.
425*0e209d39SAndroid Build Coastguard Worker if (sawDelimiter) {
426*0e209d39SAndroid Build Coastguard Worker withParens = 1; // parens required
427*0e209d39SAndroid Build Coastguard Worker filter = parseGlobalFilter(id, pos, dir, withParens, &canonID);
428*0e209d39SAndroid Build Coastguard Worker if (filter != nullptr) {
429*0e209d39SAndroid Build Coastguard Worker // Don't require trailing ';', but parse it if present
430*0e209d39SAndroid Build Coastguard Worker ICU_Utility::parseChar(id, pos, ID_DELIM);
431*0e209d39SAndroid Build Coastguard Worker
432*0e209d39SAndroid Build Coastguard Worker if (dir == REVERSE) {
433*0e209d39SAndroid Build Coastguard Worker globalFilter = filter;
434*0e209d39SAndroid Build Coastguard Worker } else {
435*0e209d39SAndroid Build Coastguard Worker delete filter;
436*0e209d39SAndroid Build Coastguard Worker }
437*0e209d39SAndroid Build Coastguard Worker filter = nullptr;
438*0e209d39SAndroid Build Coastguard Worker }
439*0e209d39SAndroid Build Coastguard Worker }
440*0e209d39SAndroid Build Coastguard Worker
441*0e209d39SAndroid Build Coastguard Worker // Trailing unparsed text is a syntax error
442*0e209d39SAndroid Build Coastguard Worker ICU_Utility::skipWhitespace(id, pos, true);
443*0e209d39SAndroid Build Coastguard Worker if (pos != id.length()) {
444*0e209d39SAndroid Build Coastguard Worker goto FAIL;
445*0e209d39SAndroid Build Coastguard Worker }
446*0e209d39SAndroid Build Coastguard Worker
447*0e209d39SAndroid Build Coastguard Worker list.setDeleter(save);
448*0e209d39SAndroid Build Coastguard Worker return true;
449*0e209d39SAndroid Build Coastguard Worker
450*0e209d39SAndroid Build Coastguard Worker FAIL:
451*0e209d39SAndroid Build Coastguard Worker list.removeAllElements();
452*0e209d39SAndroid Build Coastguard Worker list.setDeleter(save);
453*0e209d39SAndroid Build Coastguard Worker delete globalFilter;
454*0e209d39SAndroid Build Coastguard Worker globalFilter = nullptr;
455*0e209d39SAndroid Build Coastguard Worker return false;
456*0e209d39SAndroid Build Coastguard Worker }
457*0e209d39SAndroid Build Coastguard Worker
458*0e209d39SAndroid Build Coastguard Worker /**
459*0e209d39SAndroid Build Coastguard Worker * Convert the elements of the 'list' vector, which are SingleID
460*0e209d39SAndroid Build Coastguard Worker * objects, into actual Transliterator objects. In the course of
461*0e209d39SAndroid Build Coastguard Worker * this, some (or all) entries may be removed. If all entries
462*0e209d39SAndroid Build Coastguard Worker * are removed, the nullptr transliterator will be added.
463*0e209d39SAndroid Build Coastguard Worker *
464*0e209d39SAndroid Build Coastguard Worker * Delete entries with empty basicIDs; these are generated by
465*0e209d39SAndroid Build Coastguard Worker * elements like "(A)" in the forward direction, or "A()" in
466*0e209d39SAndroid Build Coastguard Worker * the reverse. THIS MAY RESULT IN AN EMPTY VECTOR. Convert
467*0e209d39SAndroid Build Coastguard Worker * SingleID entries to actual transliterators.
468*0e209d39SAndroid Build Coastguard Worker *
469*0e209d39SAndroid Build Coastguard Worker * @param list vector of SingleID objects. On exit, vector
470*0e209d39SAndroid Build Coastguard Worker * of one or more Transliterators.
471*0e209d39SAndroid Build Coastguard Worker * @return new value of insertIndex. The index will shift if
472*0e209d39SAndroid Build Coastguard Worker * there are empty items, like "(Lower)", with indices less than
473*0e209d39SAndroid Build Coastguard Worker * insertIndex.
474*0e209d39SAndroid Build Coastguard Worker */
instantiateList(UVector & list,UErrorCode & ec)475*0e209d39SAndroid Build Coastguard Worker void TransliteratorIDParser::instantiateList(UVector& list,
476*0e209d39SAndroid Build Coastguard Worker UErrorCode& ec) {
477*0e209d39SAndroid Build Coastguard Worker UVector tlist(ec);
478*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
479*0e209d39SAndroid Build Coastguard Worker goto RETURN;
480*0e209d39SAndroid Build Coastguard Worker }
481*0e209d39SAndroid Build Coastguard Worker tlist.setDeleter(_deleteTransliteratorTrIDPars);
482*0e209d39SAndroid Build Coastguard Worker
483*0e209d39SAndroid Build Coastguard Worker Transliterator* t;
484*0e209d39SAndroid Build Coastguard Worker int32_t i;
485*0e209d39SAndroid Build Coastguard Worker for (i=0; i<=list.size(); ++i) { // [sic]: i<=list.size()
486*0e209d39SAndroid Build Coastguard Worker // We run the loop too long by one, so we can
487*0e209d39SAndroid Build Coastguard Worker // do an insert after the last element
488*0e209d39SAndroid Build Coastguard Worker if (i==list.size()) {
489*0e209d39SAndroid Build Coastguard Worker break;
490*0e209d39SAndroid Build Coastguard Worker }
491*0e209d39SAndroid Build Coastguard Worker
492*0e209d39SAndroid Build Coastguard Worker SingleID* single = (SingleID*) list.elementAt(i);
493*0e209d39SAndroid Build Coastguard Worker if (single->basicID.length() != 0) {
494*0e209d39SAndroid Build Coastguard Worker t = single->createInstance();
495*0e209d39SAndroid Build Coastguard Worker if (t == nullptr) {
496*0e209d39SAndroid Build Coastguard Worker ec = U_INVALID_ID;
497*0e209d39SAndroid Build Coastguard Worker goto RETURN;
498*0e209d39SAndroid Build Coastguard Worker }
499*0e209d39SAndroid Build Coastguard Worker tlist.adoptElement(t, ec);
500*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
501*0e209d39SAndroid Build Coastguard Worker goto RETURN;
502*0e209d39SAndroid Build Coastguard Worker }
503*0e209d39SAndroid Build Coastguard Worker }
504*0e209d39SAndroid Build Coastguard Worker }
505*0e209d39SAndroid Build Coastguard Worker
506*0e209d39SAndroid Build Coastguard Worker // An empty list is equivalent to a nullptr transliterator.
507*0e209d39SAndroid Build Coastguard Worker if (tlist.size() == 0) {
508*0e209d39SAndroid Build Coastguard Worker t = createBasicInstance(UnicodeString(true, ANY_NULL, 8), nullptr);
509*0e209d39SAndroid Build Coastguard Worker if (t == nullptr) {
510*0e209d39SAndroid Build Coastguard Worker // Should never happen
511*0e209d39SAndroid Build Coastguard Worker ec = U_INTERNAL_TRANSLITERATOR_ERROR;
512*0e209d39SAndroid Build Coastguard Worker }
513*0e209d39SAndroid Build Coastguard Worker tlist.adoptElement(t, ec);
514*0e209d39SAndroid Build Coastguard Worker }
515*0e209d39SAndroid Build Coastguard Worker
516*0e209d39SAndroid Build Coastguard Worker RETURN:
517*0e209d39SAndroid Build Coastguard Worker
518*0e209d39SAndroid Build Coastguard Worker UObjectDeleter *save = list.setDeleter(_deleteSingleID);
519*0e209d39SAndroid Build Coastguard Worker list.removeAllElements();
520*0e209d39SAndroid Build Coastguard Worker
521*0e209d39SAndroid Build Coastguard Worker if (U_SUCCESS(ec)) {
522*0e209d39SAndroid Build Coastguard Worker list.setDeleter(_deleteTransliteratorTrIDPars);
523*0e209d39SAndroid Build Coastguard Worker
524*0e209d39SAndroid Build Coastguard Worker while (tlist.size() > 0) {
525*0e209d39SAndroid Build Coastguard Worker t = (Transliterator*) tlist.orphanElementAt(0);
526*0e209d39SAndroid Build Coastguard Worker list.adoptElement(t, ec);
527*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
528*0e209d39SAndroid Build Coastguard Worker list.removeAllElements();
529*0e209d39SAndroid Build Coastguard Worker break;
530*0e209d39SAndroid Build Coastguard Worker }
531*0e209d39SAndroid Build Coastguard Worker }
532*0e209d39SAndroid Build Coastguard Worker }
533*0e209d39SAndroid Build Coastguard Worker
534*0e209d39SAndroid Build Coastguard Worker list.setDeleter(save);
535*0e209d39SAndroid Build Coastguard Worker }
536*0e209d39SAndroid Build Coastguard Worker
537*0e209d39SAndroid Build Coastguard Worker /**
538*0e209d39SAndroid Build Coastguard Worker * Parse an ID into pieces. Take IDs of the form T, T/V, S-T,
539*0e209d39SAndroid Build Coastguard Worker * S-T/V, or S/V-T. If the source is missing, return a source of
540*0e209d39SAndroid Build Coastguard Worker * ANY.
541*0e209d39SAndroid Build Coastguard Worker * @param id the id string, in any of several forms
542*0e209d39SAndroid Build Coastguard Worker * @return an array of 4 strings: source, target, variant, and
543*0e209d39SAndroid Build Coastguard Worker * isSourcePresent. If the source is not present, ANY will be
544*0e209d39SAndroid Build Coastguard Worker * given as the source, and isSourcePresent will be nullptr. Otherwise
545*0e209d39SAndroid Build Coastguard Worker * isSourcePresent will be non-nullptr. The target may be empty if the
546*0e209d39SAndroid Build Coastguard Worker * id is not well-formed. The variant may be empty.
547*0e209d39SAndroid Build Coastguard Worker */
IDtoSTV(const UnicodeString & id,UnicodeString & source,UnicodeString & target,UnicodeString & variant,UBool & isSourcePresent)548*0e209d39SAndroid Build Coastguard Worker void TransliteratorIDParser::IDtoSTV(const UnicodeString& id,
549*0e209d39SAndroid Build Coastguard Worker UnicodeString& source,
550*0e209d39SAndroid Build Coastguard Worker UnicodeString& target,
551*0e209d39SAndroid Build Coastguard Worker UnicodeString& variant,
552*0e209d39SAndroid Build Coastguard Worker UBool& isSourcePresent) {
553*0e209d39SAndroid Build Coastguard Worker source.setTo(ANY, 3);
554*0e209d39SAndroid Build Coastguard Worker target.truncate(0);
555*0e209d39SAndroid Build Coastguard Worker variant.truncate(0);
556*0e209d39SAndroid Build Coastguard Worker
557*0e209d39SAndroid Build Coastguard Worker int32_t sep = id.indexOf(TARGET_SEP);
558*0e209d39SAndroid Build Coastguard Worker int32_t var = id.indexOf(VARIANT_SEP);
559*0e209d39SAndroid Build Coastguard Worker if (var < 0) {
560*0e209d39SAndroid Build Coastguard Worker var = id.length();
561*0e209d39SAndroid Build Coastguard Worker }
562*0e209d39SAndroid Build Coastguard Worker isSourcePresent = false;
563*0e209d39SAndroid Build Coastguard Worker
564*0e209d39SAndroid Build Coastguard Worker if (sep < 0) {
565*0e209d39SAndroid Build Coastguard Worker // Form: T/V or T (or /V)
566*0e209d39SAndroid Build Coastguard Worker id.extractBetween(0, var, target);
567*0e209d39SAndroid Build Coastguard Worker id.extractBetween(var, id.length(), variant);
568*0e209d39SAndroid Build Coastguard Worker } else if (sep < var) {
569*0e209d39SAndroid Build Coastguard Worker // Form: S-T/V or S-T (or -T/V or -T)
570*0e209d39SAndroid Build Coastguard Worker if (sep > 0) {
571*0e209d39SAndroid Build Coastguard Worker id.extractBetween(0, sep, source);
572*0e209d39SAndroid Build Coastguard Worker isSourcePresent = true;
573*0e209d39SAndroid Build Coastguard Worker }
574*0e209d39SAndroid Build Coastguard Worker id.extractBetween(++sep, var, target);
575*0e209d39SAndroid Build Coastguard Worker id.extractBetween(var, id.length(), variant);
576*0e209d39SAndroid Build Coastguard Worker } else {
577*0e209d39SAndroid Build Coastguard Worker // Form: (S/V-T or /V-T)
578*0e209d39SAndroid Build Coastguard Worker if (var > 0) {
579*0e209d39SAndroid Build Coastguard Worker id.extractBetween(0, var, source);
580*0e209d39SAndroid Build Coastguard Worker isSourcePresent = true;
581*0e209d39SAndroid Build Coastguard Worker }
582*0e209d39SAndroid Build Coastguard Worker id.extractBetween(var, sep++, variant);
583*0e209d39SAndroid Build Coastguard Worker id.extractBetween(sep, id.length(), target);
584*0e209d39SAndroid Build Coastguard Worker }
585*0e209d39SAndroid Build Coastguard Worker
586*0e209d39SAndroid Build Coastguard Worker if (variant.length() > 0) {
587*0e209d39SAndroid Build Coastguard Worker variant.remove(0, 1);
588*0e209d39SAndroid Build Coastguard Worker }
589*0e209d39SAndroid Build Coastguard Worker }
590*0e209d39SAndroid Build Coastguard Worker
591*0e209d39SAndroid Build Coastguard Worker /**
592*0e209d39SAndroid Build Coastguard Worker * Given source, target, and variant strings, concatenate them into a
593*0e209d39SAndroid Build Coastguard Worker * full ID. If the source is empty, then "Any" will be used for the
594*0e209d39SAndroid Build Coastguard Worker * source, so the ID will always be of the form s-t/v or s-t.
595*0e209d39SAndroid Build Coastguard Worker */
STVtoID(const UnicodeString & source,const UnicodeString & target,const UnicodeString & variant,UnicodeString & id)596*0e209d39SAndroid Build Coastguard Worker void TransliteratorIDParser::STVtoID(const UnicodeString& source,
597*0e209d39SAndroid Build Coastguard Worker const UnicodeString& target,
598*0e209d39SAndroid Build Coastguard Worker const UnicodeString& variant,
599*0e209d39SAndroid Build Coastguard Worker UnicodeString& id) {
600*0e209d39SAndroid Build Coastguard Worker id = source;
601*0e209d39SAndroid Build Coastguard Worker if (id.length() == 0) {
602*0e209d39SAndroid Build Coastguard Worker id.setTo(ANY, 3);
603*0e209d39SAndroid Build Coastguard Worker }
604*0e209d39SAndroid Build Coastguard Worker id.append(TARGET_SEP).append(target);
605*0e209d39SAndroid Build Coastguard Worker if (variant.length() != 0) {
606*0e209d39SAndroid Build Coastguard Worker id.append(VARIANT_SEP).append(variant);
607*0e209d39SAndroid Build Coastguard Worker }
608*0e209d39SAndroid Build Coastguard Worker // NUL-terminate the ID string for getTerminatedBuffer.
609*0e209d39SAndroid Build Coastguard Worker // This prevents valgrind and Purify warnings.
610*0e209d39SAndroid Build Coastguard Worker id.append((char16_t)0);
611*0e209d39SAndroid Build Coastguard Worker id.truncate(id.length()-1);
612*0e209d39SAndroid Build Coastguard Worker }
613*0e209d39SAndroid Build Coastguard Worker
614*0e209d39SAndroid Build Coastguard Worker /**
615*0e209d39SAndroid Build Coastguard Worker * Register two targets as being inverses of one another. For
616*0e209d39SAndroid Build Coastguard Worker * example, calling registerSpecialInverse("NFC", "NFD", true) causes
617*0e209d39SAndroid Build Coastguard Worker * Transliterator to form the following inverse relationships:
618*0e209d39SAndroid Build Coastguard Worker *
619*0e209d39SAndroid Build Coastguard Worker * <pre>NFC => NFD
620*0e209d39SAndroid Build Coastguard Worker * Any-NFC => Any-NFD
621*0e209d39SAndroid Build Coastguard Worker * NFD => NFC
622*0e209d39SAndroid Build Coastguard Worker * Any-NFD => Any-NFC</pre>
623*0e209d39SAndroid Build Coastguard Worker *
624*0e209d39SAndroid Build Coastguard Worker * (Without the special inverse registration, the inverse of NFC
625*0e209d39SAndroid Build Coastguard Worker * would be NFC-Any.) Note that NFD is shorthand for Any-NFD, but
626*0e209d39SAndroid Build Coastguard Worker * that the presence or absence of "Any-" is preserved.
627*0e209d39SAndroid Build Coastguard Worker *
628*0e209d39SAndroid Build Coastguard Worker * <p>The relationship is symmetrical; registering (a, b) is
629*0e209d39SAndroid Build Coastguard Worker * equivalent to registering (b, a).
630*0e209d39SAndroid Build Coastguard Worker *
631*0e209d39SAndroid Build Coastguard Worker * <p>The relevant IDs must still be registered separately as
632*0e209d39SAndroid Build Coastguard Worker * factories or classes.
633*0e209d39SAndroid Build Coastguard Worker *
634*0e209d39SAndroid Build Coastguard Worker * <p>Only the targets are specified. Special inverses always
635*0e209d39SAndroid Build Coastguard Worker * have the form Any-Target1 <=> Any-Target2. The target should
636*0e209d39SAndroid Build Coastguard Worker * have canonical casing (the casing desired to be produced when
637*0e209d39SAndroid Build Coastguard Worker * an inverse is formed) and should contain no whitespace or other
638*0e209d39SAndroid Build Coastguard Worker * extraneous characters.
639*0e209d39SAndroid Build Coastguard Worker *
640*0e209d39SAndroid Build Coastguard Worker * @param target the target against which to register the inverse
641*0e209d39SAndroid Build Coastguard Worker * @param inverseTarget the inverse of target, that is
642*0e209d39SAndroid Build Coastguard Worker * Any-target.getInverse() => Any-inverseTarget
643*0e209d39SAndroid Build Coastguard Worker * @param bidirectional if true, register the reverse relation
644*0e209d39SAndroid Build Coastguard Worker * as well, that is, Any-inverseTarget.getInverse() => Any-target
645*0e209d39SAndroid Build Coastguard Worker */
registerSpecialInverse(const UnicodeString & target,const UnicodeString & inverseTarget,UBool bidirectional,UErrorCode & status)646*0e209d39SAndroid Build Coastguard Worker void TransliteratorIDParser::registerSpecialInverse(const UnicodeString& target,
647*0e209d39SAndroid Build Coastguard Worker const UnicodeString& inverseTarget,
648*0e209d39SAndroid Build Coastguard Worker UBool bidirectional,
649*0e209d39SAndroid Build Coastguard Worker UErrorCode &status) {
650*0e209d39SAndroid Build Coastguard Worker umtx_initOnce(gSpecialInversesInitOnce, init, status);
651*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(status)) {
652*0e209d39SAndroid Build Coastguard Worker return;
653*0e209d39SAndroid Build Coastguard Worker }
654*0e209d39SAndroid Build Coastguard Worker
655*0e209d39SAndroid Build Coastguard Worker // If target == inverseTarget then force bidirectional => false
656*0e209d39SAndroid Build Coastguard Worker if (bidirectional && 0==target.caseCompare(inverseTarget, U_FOLD_CASE_DEFAULT)) {
657*0e209d39SAndroid Build Coastguard Worker bidirectional = false;
658*0e209d39SAndroid Build Coastguard Worker }
659*0e209d39SAndroid Build Coastguard Worker
660*0e209d39SAndroid Build Coastguard Worker Mutex lock(&LOCK);
661*0e209d39SAndroid Build Coastguard Worker
662*0e209d39SAndroid Build Coastguard Worker UnicodeString *tempus = new UnicodeString(inverseTarget); // Used for null pointer check before usage.
663*0e209d39SAndroid Build Coastguard Worker if (tempus == nullptr) {
664*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
665*0e209d39SAndroid Build Coastguard Worker return;
666*0e209d39SAndroid Build Coastguard Worker }
667*0e209d39SAndroid Build Coastguard Worker SPECIAL_INVERSES->put(target, tempus, status);
668*0e209d39SAndroid Build Coastguard Worker if (bidirectional) {
669*0e209d39SAndroid Build Coastguard Worker tempus = new UnicodeString(target);
670*0e209d39SAndroid Build Coastguard Worker if (tempus == nullptr) {
671*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
672*0e209d39SAndroid Build Coastguard Worker return;
673*0e209d39SAndroid Build Coastguard Worker }
674*0e209d39SAndroid Build Coastguard Worker SPECIAL_INVERSES->put(inverseTarget, tempus, status);
675*0e209d39SAndroid Build Coastguard Worker }
676*0e209d39SAndroid Build Coastguard Worker }
677*0e209d39SAndroid Build Coastguard Worker
678*0e209d39SAndroid Build Coastguard Worker //----------------------------------------------------------------
679*0e209d39SAndroid Build Coastguard Worker // Private implementation
680*0e209d39SAndroid Build Coastguard Worker //----------------------------------------------------------------
681*0e209d39SAndroid Build Coastguard Worker
682*0e209d39SAndroid Build Coastguard Worker /**
683*0e209d39SAndroid Build Coastguard Worker * Parse an ID into component pieces. Take IDs of the form T,
684*0e209d39SAndroid Build Coastguard Worker * T/V, S-T, S-T/V, or S/V-T. If the source is missing, return a
685*0e209d39SAndroid Build Coastguard Worker * source of ANY.
686*0e209d39SAndroid Build Coastguard Worker * @param id the id string, in any of several forms
687*0e209d39SAndroid Build Coastguard Worker * @param pos INPUT-OUTPUT parameter. On input, pos is the
688*0e209d39SAndroid Build Coastguard Worker * offset of the first character to parse in id. On output,
689*0e209d39SAndroid Build Coastguard Worker * pos is the offset after the last parsed character. If the
690*0e209d39SAndroid Build Coastguard Worker * parse failed, pos will be unchanged.
691*0e209d39SAndroid Build Coastguard Worker * @param allowFilter2 if true, a UnicodeSet pattern is allowed
692*0e209d39SAndroid Build Coastguard Worker * at any location between specs or delimiters, and is returned
693*0e209d39SAndroid Build Coastguard Worker * as the fifth string in the array.
694*0e209d39SAndroid Build Coastguard Worker * @return a Specs object, or nullptr if the parse failed. If
695*0e209d39SAndroid Build Coastguard Worker * neither source nor target was seen in the parsed id, then the
696*0e209d39SAndroid Build Coastguard Worker * parse fails. If allowFilter is true, then the parsed filter
697*0e209d39SAndroid Build Coastguard Worker * pattern is returned in the Specs object, otherwise the returned
698*0e209d39SAndroid Build Coastguard Worker * filter reference is nullptr. If the parse fails for any reason
699*0e209d39SAndroid Build Coastguard Worker * nullptr is returned.
700*0e209d39SAndroid Build Coastguard Worker */
701*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::Specs*
parseFilterID(const UnicodeString & id,int32_t & pos,UBool allowFilter)702*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::parseFilterID(const UnicodeString& id, int32_t& pos,
703*0e209d39SAndroid Build Coastguard Worker UBool allowFilter) {
704*0e209d39SAndroid Build Coastguard Worker UnicodeString first;
705*0e209d39SAndroid Build Coastguard Worker UnicodeString source;
706*0e209d39SAndroid Build Coastguard Worker UnicodeString target;
707*0e209d39SAndroid Build Coastguard Worker UnicodeString variant;
708*0e209d39SAndroid Build Coastguard Worker UnicodeString filter;
709*0e209d39SAndroid Build Coastguard Worker char16_t delimiter = 0;
710*0e209d39SAndroid Build Coastguard Worker int32_t specCount = 0;
711*0e209d39SAndroid Build Coastguard Worker int32_t start = pos;
712*0e209d39SAndroid Build Coastguard Worker
713*0e209d39SAndroid Build Coastguard Worker // This loop parses one of the following things with each
714*0e209d39SAndroid Build Coastguard Worker // pass: a filter, a delimiter character (either '-' or '/'),
715*0e209d39SAndroid Build Coastguard Worker // or a spec (source, target, or variant).
716*0e209d39SAndroid Build Coastguard Worker for (;;) {
717*0e209d39SAndroid Build Coastguard Worker ICU_Utility::skipWhitespace(id, pos, true);
718*0e209d39SAndroid Build Coastguard Worker if (pos == id.length()) {
719*0e209d39SAndroid Build Coastguard Worker break;
720*0e209d39SAndroid Build Coastguard Worker }
721*0e209d39SAndroid Build Coastguard Worker
722*0e209d39SAndroid Build Coastguard Worker // Parse filters
723*0e209d39SAndroid Build Coastguard Worker if (allowFilter && filter.length() == 0 &&
724*0e209d39SAndroid Build Coastguard Worker UnicodeSet::resemblesPattern(id, pos)) {
725*0e209d39SAndroid Build Coastguard Worker
726*0e209d39SAndroid Build Coastguard Worker ParsePosition ppos(pos);
727*0e209d39SAndroid Build Coastguard Worker UErrorCode ec = U_ZERO_ERROR;
728*0e209d39SAndroid Build Coastguard Worker UnicodeSet set(id, ppos, USET_IGNORE_SPACE, nullptr, ec);
729*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(ec)) {
730*0e209d39SAndroid Build Coastguard Worker pos = start;
731*0e209d39SAndroid Build Coastguard Worker return nullptr;
732*0e209d39SAndroid Build Coastguard Worker }
733*0e209d39SAndroid Build Coastguard Worker id.extractBetween(pos, ppos.getIndex(), filter);
734*0e209d39SAndroid Build Coastguard Worker pos = ppos.getIndex();
735*0e209d39SAndroid Build Coastguard Worker continue;
736*0e209d39SAndroid Build Coastguard Worker }
737*0e209d39SAndroid Build Coastguard Worker
738*0e209d39SAndroid Build Coastguard Worker if (delimiter == 0) {
739*0e209d39SAndroid Build Coastguard Worker char16_t c = id.charAt(pos);
740*0e209d39SAndroid Build Coastguard Worker if ((c == TARGET_SEP && target.length() == 0) ||
741*0e209d39SAndroid Build Coastguard Worker (c == VARIANT_SEP && variant.length() == 0)) {
742*0e209d39SAndroid Build Coastguard Worker delimiter = c;
743*0e209d39SAndroid Build Coastguard Worker ++pos;
744*0e209d39SAndroid Build Coastguard Worker continue;
745*0e209d39SAndroid Build Coastguard Worker }
746*0e209d39SAndroid Build Coastguard Worker }
747*0e209d39SAndroid Build Coastguard Worker
748*0e209d39SAndroid Build Coastguard Worker // We are about to try to parse a spec with no delimiter
749*0e209d39SAndroid Build Coastguard Worker // when we can no longer do so (we can only do so at the
750*0e209d39SAndroid Build Coastguard Worker // start); break.
751*0e209d39SAndroid Build Coastguard Worker if (delimiter == 0 && specCount > 0) {
752*0e209d39SAndroid Build Coastguard Worker break;
753*0e209d39SAndroid Build Coastguard Worker }
754*0e209d39SAndroid Build Coastguard Worker
755*0e209d39SAndroid Build Coastguard Worker UnicodeString spec = ICU_Utility::parseUnicodeIdentifier(id, pos);
756*0e209d39SAndroid Build Coastguard Worker if (spec.length() == 0) {
757*0e209d39SAndroid Build Coastguard Worker // Note that if there was a trailing delimiter, we
758*0e209d39SAndroid Build Coastguard Worker // consume it. So Foo-, Foo/, Foo-Bar/, and Foo/Bar-
759*0e209d39SAndroid Build Coastguard Worker // are legal.
760*0e209d39SAndroid Build Coastguard Worker break;
761*0e209d39SAndroid Build Coastguard Worker }
762*0e209d39SAndroid Build Coastguard Worker
763*0e209d39SAndroid Build Coastguard Worker switch (delimiter) {
764*0e209d39SAndroid Build Coastguard Worker case 0:
765*0e209d39SAndroid Build Coastguard Worker first = spec;
766*0e209d39SAndroid Build Coastguard Worker break;
767*0e209d39SAndroid Build Coastguard Worker case TARGET_SEP:
768*0e209d39SAndroid Build Coastguard Worker target = spec;
769*0e209d39SAndroid Build Coastguard Worker break;
770*0e209d39SAndroid Build Coastguard Worker case VARIANT_SEP:
771*0e209d39SAndroid Build Coastguard Worker variant = spec;
772*0e209d39SAndroid Build Coastguard Worker break;
773*0e209d39SAndroid Build Coastguard Worker }
774*0e209d39SAndroid Build Coastguard Worker ++specCount;
775*0e209d39SAndroid Build Coastguard Worker delimiter = 0;
776*0e209d39SAndroid Build Coastguard Worker }
777*0e209d39SAndroid Build Coastguard Worker
778*0e209d39SAndroid Build Coastguard Worker // A spec with no prior character is either source or target,
779*0e209d39SAndroid Build Coastguard Worker // depending on whether an explicit "-target" was seen.
780*0e209d39SAndroid Build Coastguard Worker if (first.length() != 0) {
781*0e209d39SAndroid Build Coastguard Worker if (target.length() == 0) {
782*0e209d39SAndroid Build Coastguard Worker target = first;
783*0e209d39SAndroid Build Coastguard Worker } else {
784*0e209d39SAndroid Build Coastguard Worker source = first;
785*0e209d39SAndroid Build Coastguard Worker }
786*0e209d39SAndroid Build Coastguard Worker }
787*0e209d39SAndroid Build Coastguard Worker
788*0e209d39SAndroid Build Coastguard Worker // Must have either source or target
789*0e209d39SAndroid Build Coastguard Worker if (source.length() == 0 && target.length() == 0) {
790*0e209d39SAndroid Build Coastguard Worker pos = start;
791*0e209d39SAndroid Build Coastguard Worker return nullptr;
792*0e209d39SAndroid Build Coastguard Worker }
793*0e209d39SAndroid Build Coastguard Worker
794*0e209d39SAndroid Build Coastguard Worker // Empty source or target defaults to ANY
795*0e209d39SAndroid Build Coastguard Worker UBool sawSource = true;
796*0e209d39SAndroid Build Coastguard Worker if (source.length() == 0) {
797*0e209d39SAndroid Build Coastguard Worker source.setTo(ANY, 3);
798*0e209d39SAndroid Build Coastguard Worker sawSource = false;
799*0e209d39SAndroid Build Coastguard Worker }
800*0e209d39SAndroid Build Coastguard Worker if (target.length() == 0) {
801*0e209d39SAndroid Build Coastguard Worker target.setTo(ANY, 3);
802*0e209d39SAndroid Build Coastguard Worker }
803*0e209d39SAndroid Build Coastguard Worker
804*0e209d39SAndroid Build Coastguard Worker return new Specs(source, target, variant, sawSource, filter);
805*0e209d39SAndroid Build Coastguard Worker }
806*0e209d39SAndroid Build Coastguard Worker
807*0e209d39SAndroid Build Coastguard Worker /**
808*0e209d39SAndroid Build Coastguard Worker * Givens a Spec object, convert it to a SingleID object. The
809*0e209d39SAndroid Build Coastguard Worker * Spec object is a more unprocessed parse result. The SingleID
810*0e209d39SAndroid Build Coastguard Worker * object contains information about canonical and basic IDs.
811*0e209d39SAndroid Build Coastguard Worker * @return a SingleID; never returns nullptr. Returned object always
812*0e209d39SAndroid Build Coastguard Worker * has 'filter' field of nullptr.
813*0e209d39SAndroid Build Coastguard Worker */
814*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID*
specsToID(const Specs * specs,int32_t dir)815*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::specsToID(const Specs* specs, int32_t dir) {
816*0e209d39SAndroid Build Coastguard Worker UnicodeString canonID;
817*0e209d39SAndroid Build Coastguard Worker UnicodeString basicID;
818*0e209d39SAndroid Build Coastguard Worker UnicodeString basicPrefix;
819*0e209d39SAndroid Build Coastguard Worker if (specs != nullptr) {
820*0e209d39SAndroid Build Coastguard Worker UnicodeString buf;
821*0e209d39SAndroid Build Coastguard Worker if (dir == FORWARD) {
822*0e209d39SAndroid Build Coastguard Worker if (specs->sawSource) {
823*0e209d39SAndroid Build Coastguard Worker buf.append(specs->source).append(TARGET_SEP);
824*0e209d39SAndroid Build Coastguard Worker } else {
825*0e209d39SAndroid Build Coastguard Worker basicPrefix = specs->source;
826*0e209d39SAndroid Build Coastguard Worker basicPrefix.append(TARGET_SEP);
827*0e209d39SAndroid Build Coastguard Worker }
828*0e209d39SAndroid Build Coastguard Worker buf.append(specs->target);
829*0e209d39SAndroid Build Coastguard Worker } else {
830*0e209d39SAndroid Build Coastguard Worker buf.append(specs->target).append(TARGET_SEP).append(specs->source);
831*0e209d39SAndroid Build Coastguard Worker }
832*0e209d39SAndroid Build Coastguard Worker if (specs->variant.length() != 0) {
833*0e209d39SAndroid Build Coastguard Worker buf.append(VARIANT_SEP).append(specs->variant);
834*0e209d39SAndroid Build Coastguard Worker }
835*0e209d39SAndroid Build Coastguard Worker basicID = basicPrefix;
836*0e209d39SAndroid Build Coastguard Worker basicID.append(buf);
837*0e209d39SAndroid Build Coastguard Worker if (specs->filter.length() != 0) {
838*0e209d39SAndroid Build Coastguard Worker buf.insert(0, specs->filter);
839*0e209d39SAndroid Build Coastguard Worker }
840*0e209d39SAndroid Build Coastguard Worker canonID = buf;
841*0e209d39SAndroid Build Coastguard Worker }
842*0e209d39SAndroid Build Coastguard Worker return new SingleID(canonID, basicID);
843*0e209d39SAndroid Build Coastguard Worker }
844*0e209d39SAndroid Build Coastguard Worker
845*0e209d39SAndroid Build Coastguard Worker /**
846*0e209d39SAndroid Build Coastguard Worker * Given a Specs object, return a SingleID representing the
847*0e209d39SAndroid Build Coastguard Worker * special inverse of that ID. If there is no special inverse
848*0e209d39SAndroid Build Coastguard Worker * then return nullptr.
849*0e209d39SAndroid Build Coastguard Worker * @return a SingleID or nullptr. Returned object always has
850*0e209d39SAndroid Build Coastguard Worker * 'filter' field of nullptr.
851*0e209d39SAndroid Build Coastguard Worker */
852*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::SingleID*
specsToSpecialInverse(const Specs & specs,UErrorCode & status)853*0e209d39SAndroid Build Coastguard Worker TransliteratorIDParser::specsToSpecialInverse(const Specs& specs, UErrorCode &status) {
854*0e209d39SAndroid Build Coastguard Worker if (0!=specs.source.caseCompare(ANY, 3, U_FOLD_CASE_DEFAULT)) {
855*0e209d39SAndroid Build Coastguard Worker return nullptr;
856*0e209d39SAndroid Build Coastguard Worker }
857*0e209d39SAndroid Build Coastguard Worker umtx_initOnce(gSpecialInversesInitOnce, init, status);
858*0e209d39SAndroid Build Coastguard Worker if (U_FAILURE(status)) {
859*0e209d39SAndroid Build Coastguard Worker return nullptr;
860*0e209d39SAndroid Build Coastguard Worker }
861*0e209d39SAndroid Build Coastguard Worker
862*0e209d39SAndroid Build Coastguard Worker UnicodeString* inverseTarget;
863*0e209d39SAndroid Build Coastguard Worker
864*0e209d39SAndroid Build Coastguard Worker umtx_lock(&LOCK);
865*0e209d39SAndroid Build Coastguard Worker inverseTarget = (UnicodeString*) SPECIAL_INVERSES->get(specs.target);
866*0e209d39SAndroid Build Coastguard Worker umtx_unlock(&LOCK);
867*0e209d39SAndroid Build Coastguard Worker
868*0e209d39SAndroid Build Coastguard Worker if (inverseTarget != nullptr) {
869*0e209d39SAndroid Build Coastguard Worker // If the original ID contained "Any-" then make the
870*0e209d39SAndroid Build Coastguard Worker // special inverse "Any-Foo"; otherwise make it "Foo".
871*0e209d39SAndroid Build Coastguard Worker // So "Any-NFC" => "Any-NFD" but "NFC" => "NFD".
872*0e209d39SAndroid Build Coastguard Worker UnicodeString buf;
873*0e209d39SAndroid Build Coastguard Worker if (specs.filter.length() != 0) {
874*0e209d39SAndroid Build Coastguard Worker buf.append(specs.filter);
875*0e209d39SAndroid Build Coastguard Worker }
876*0e209d39SAndroid Build Coastguard Worker if (specs.sawSource) {
877*0e209d39SAndroid Build Coastguard Worker buf.append(ANY, 3).append(TARGET_SEP);
878*0e209d39SAndroid Build Coastguard Worker }
879*0e209d39SAndroid Build Coastguard Worker buf.append(*inverseTarget);
880*0e209d39SAndroid Build Coastguard Worker
881*0e209d39SAndroid Build Coastguard Worker UnicodeString basicID(true, ANY, 3);
882*0e209d39SAndroid Build Coastguard Worker basicID.append(TARGET_SEP).append(*inverseTarget);
883*0e209d39SAndroid Build Coastguard Worker
884*0e209d39SAndroid Build Coastguard Worker if (specs.variant.length() != 0) {
885*0e209d39SAndroid Build Coastguard Worker buf.append(VARIANT_SEP).append(specs.variant);
886*0e209d39SAndroid Build Coastguard Worker basicID.append(VARIANT_SEP).append(specs.variant);
887*0e209d39SAndroid Build Coastguard Worker }
888*0e209d39SAndroid Build Coastguard Worker return new SingleID(buf, basicID);
889*0e209d39SAndroid Build Coastguard Worker }
890*0e209d39SAndroid Build Coastguard Worker return nullptr;
891*0e209d39SAndroid Build Coastguard Worker }
892*0e209d39SAndroid Build Coastguard Worker
893*0e209d39SAndroid Build Coastguard Worker /**
894*0e209d39SAndroid Build Coastguard Worker * Glue method to get around access problems in C++. This would
895*0e209d39SAndroid Build Coastguard Worker * ideally be inline but we want to avoid a circular header
896*0e209d39SAndroid Build Coastguard Worker * dependency.
897*0e209d39SAndroid Build Coastguard Worker */
createBasicInstance(const UnicodeString & id,const UnicodeString * canonID)898*0e209d39SAndroid Build Coastguard Worker Transliterator* TransliteratorIDParser::createBasicInstance(const UnicodeString& id, const UnicodeString* canonID) {
899*0e209d39SAndroid Build Coastguard Worker return Transliterator::createBasicInstance(id, canonID);
900*0e209d39SAndroid Build Coastguard Worker }
901*0e209d39SAndroid Build Coastguard Worker
902*0e209d39SAndroid Build Coastguard Worker /**
903*0e209d39SAndroid Build Coastguard Worker * Initialize static memory. Called through umtx_initOnce only.
904*0e209d39SAndroid Build Coastguard Worker */
init(UErrorCode & status)905*0e209d39SAndroid Build Coastguard Worker void U_CALLCONV TransliteratorIDParser::init(UErrorCode &status) {
906*0e209d39SAndroid Build Coastguard Worker U_ASSERT(SPECIAL_INVERSES == nullptr);
907*0e209d39SAndroid Build Coastguard Worker ucln_i18n_registerCleanup(UCLN_I18N_TRANSLITERATOR, utrans_transliterator_cleanup);
908*0e209d39SAndroid Build Coastguard Worker
909*0e209d39SAndroid Build Coastguard Worker SPECIAL_INVERSES = new Hashtable(true, status);
910*0e209d39SAndroid Build Coastguard Worker if (SPECIAL_INVERSES == nullptr) {
911*0e209d39SAndroid Build Coastguard Worker status = U_MEMORY_ALLOCATION_ERROR;
912*0e209d39SAndroid Build Coastguard Worker return;
913*0e209d39SAndroid Build Coastguard Worker }
914*0e209d39SAndroid Build Coastguard Worker SPECIAL_INVERSES->setValueDeleter(uprv_deleteUObject);
915*0e209d39SAndroid Build Coastguard Worker }
916*0e209d39SAndroid Build Coastguard Worker
917*0e209d39SAndroid Build Coastguard Worker /**
918*0e209d39SAndroid Build Coastguard Worker * Free static memory.
919*0e209d39SAndroid Build Coastguard Worker */
cleanup()920*0e209d39SAndroid Build Coastguard Worker void TransliteratorIDParser::cleanup() {
921*0e209d39SAndroid Build Coastguard Worker if (SPECIAL_INVERSES) {
922*0e209d39SAndroid Build Coastguard Worker delete SPECIAL_INVERSES;
923*0e209d39SAndroid Build Coastguard Worker SPECIAL_INVERSES = nullptr;
924*0e209d39SAndroid Build Coastguard Worker }
925*0e209d39SAndroid Build Coastguard Worker gSpecialInversesInitOnce.reset();
926*0e209d39SAndroid Build Coastguard Worker }
927*0e209d39SAndroid Build Coastguard Worker
928*0e209d39SAndroid Build Coastguard Worker U_NAMESPACE_END
929*0e209d39SAndroid Build Coastguard Worker
930*0e209d39SAndroid Build Coastguard Worker #endif /* #if !UCONFIG_NO_TRANSLITERATION */
931*0e209d39SAndroid Build Coastguard Worker
932*0e209d39SAndroid Build Coastguard Worker //eof
933