xref: /aosp_15_r20/external/libchrome/base/i18n/rtl.cc (revision 635a864187cb8b6c713ff48b7e790a6b21769273)
1*635a8641SAndroid Build Coastguard Worker // Copyright (c) 2011 The Chromium Authors. All rights reserved.
2*635a8641SAndroid Build Coastguard Worker // Use of this source code is governed by a BSD-style license that can be
3*635a8641SAndroid Build Coastguard Worker // found in the LICENSE file.
4*635a8641SAndroid Build Coastguard Worker 
5*635a8641SAndroid Build Coastguard Worker #include "base/i18n/rtl.h"
6*635a8641SAndroid Build Coastguard Worker 
7*635a8641SAndroid Build Coastguard Worker #include <stddef.h>
8*635a8641SAndroid Build Coastguard Worker #include <stdint.h>
9*635a8641SAndroid Build Coastguard Worker 
10*635a8641SAndroid Build Coastguard Worker #include <algorithm>
11*635a8641SAndroid Build Coastguard Worker 
12*635a8641SAndroid Build Coastguard Worker #include "base/command_line.h"
13*635a8641SAndroid Build Coastguard Worker #include "base/files/file_path.h"
14*635a8641SAndroid Build Coastguard Worker #include "base/i18n/base_i18n_switches.h"
15*635a8641SAndroid Build Coastguard Worker #include "base/logging.h"
16*635a8641SAndroid Build Coastguard Worker #include "base/macros.h"
17*635a8641SAndroid Build Coastguard Worker #include "base/strings/string_split.h"
18*635a8641SAndroid Build Coastguard Worker #include "base/strings/string_util.h"
19*635a8641SAndroid Build Coastguard Worker #include "base/strings/sys_string_conversions.h"
20*635a8641SAndroid Build Coastguard Worker #include "base/strings/utf_string_conversions.h"
21*635a8641SAndroid Build Coastguard Worker #include "build/build_config.h"
22*635a8641SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/locid.h"
23*635a8641SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/uchar.h"
24*635a8641SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/uscript.h"
25*635a8641SAndroid Build Coastguard Worker #include "third_party/icu/source/i18n/unicode/coll.h"
26*635a8641SAndroid Build Coastguard Worker 
27*635a8641SAndroid Build Coastguard Worker #if defined(OS_IOS)
28*635a8641SAndroid Build Coastguard Worker #include "base/debug/crash_logging.h"
29*635a8641SAndroid Build Coastguard Worker #include "base/ios/ios_util.h"
30*635a8641SAndroid Build Coastguard Worker #endif
31*635a8641SAndroid Build Coastguard Worker 
32*635a8641SAndroid Build Coastguard Worker namespace {
33*635a8641SAndroid Build Coastguard Worker 
34*635a8641SAndroid Build Coastguard Worker // Extract language, country and variant, but ignore keywords.  For example,
35*635a8641SAndroid Build Coastguard Worker // en-US, ca@valencia, ca-ES@valencia.
GetLocaleString(const icu::Locale & locale)36*635a8641SAndroid Build Coastguard Worker std::string GetLocaleString(const icu::Locale& locale) {
37*635a8641SAndroid Build Coastguard Worker   const char* language = locale.getLanguage();
38*635a8641SAndroid Build Coastguard Worker   const char* country = locale.getCountry();
39*635a8641SAndroid Build Coastguard Worker   const char* variant = locale.getVariant();
40*635a8641SAndroid Build Coastguard Worker 
41*635a8641SAndroid Build Coastguard Worker   std::string result =
42*635a8641SAndroid Build Coastguard Worker       (language != nullptr && *language != '\0') ? language : "und";
43*635a8641SAndroid Build Coastguard Worker 
44*635a8641SAndroid Build Coastguard Worker   if (country != nullptr && *country != '\0') {
45*635a8641SAndroid Build Coastguard Worker     result += '-';
46*635a8641SAndroid Build Coastguard Worker     result += country;
47*635a8641SAndroid Build Coastguard Worker   }
48*635a8641SAndroid Build Coastguard Worker 
49*635a8641SAndroid Build Coastguard Worker   if (variant != nullptr && *variant != '\0')
50*635a8641SAndroid Build Coastguard Worker     result += '@' + base::ToLowerASCII(variant);
51*635a8641SAndroid Build Coastguard Worker 
52*635a8641SAndroid Build Coastguard Worker   return result;
53*635a8641SAndroid Build Coastguard Worker }
54*635a8641SAndroid Build Coastguard Worker 
55*635a8641SAndroid Build Coastguard Worker // Returns LEFT_TO_RIGHT or RIGHT_TO_LEFT if |character| has strong
56*635a8641SAndroid Build Coastguard Worker // directionality, returns UNKNOWN_DIRECTION if it doesn't. Please refer to
57*635a8641SAndroid Build Coastguard Worker // http://unicode.org/reports/tr9/ for more information.
GetCharacterDirection(UChar32 character)58*635a8641SAndroid Build Coastguard Worker base::i18n::TextDirection GetCharacterDirection(UChar32 character) {
59*635a8641SAndroid Build Coastguard Worker   static bool has_switch = base::CommandLine::ForCurrentProcess()->HasSwitch(
60*635a8641SAndroid Build Coastguard Worker       switches::kForceTextDirection);
61*635a8641SAndroid Build Coastguard Worker   if (has_switch) {
62*635a8641SAndroid Build Coastguard Worker     base::CommandLine* command_line = base::CommandLine::ForCurrentProcess();
63*635a8641SAndroid Build Coastguard Worker     std::string force_flag =
64*635a8641SAndroid Build Coastguard Worker         command_line->GetSwitchValueASCII(switches::kForceTextDirection);
65*635a8641SAndroid Build Coastguard Worker 
66*635a8641SAndroid Build Coastguard Worker     if (force_flag == switches::kForceDirectionRTL)
67*635a8641SAndroid Build Coastguard Worker       return base::i18n::RIGHT_TO_LEFT;
68*635a8641SAndroid Build Coastguard Worker     if (force_flag == switches::kForceDirectionLTR)
69*635a8641SAndroid Build Coastguard Worker       return base::i18n::LEFT_TO_RIGHT;
70*635a8641SAndroid Build Coastguard Worker   }
71*635a8641SAndroid Build Coastguard Worker   // Now that we have the character, we use ICU in order to query for the
72*635a8641SAndroid Build Coastguard Worker   // appropriate Unicode BiDi character type.
73*635a8641SAndroid Build Coastguard Worker   int32_t property = u_getIntPropertyValue(character, UCHAR_BIDI_CLASS);
74*635a8641SAndroid Build Coastguard Worker   if ((property == U_RIGHT_TO_LEFT) ||
75*635a8641SAndroid Build Coastguard Worker       (property == U_RIGHT_TO_LEFT_ARABIC) ||
76*635a8641SAndroid Build Coastguard Worker       (property == U_RIGHT_TO_LEFT_EMBEDDING) ||
77*635a8641SAndroid Build Coastguard Worker       (property == U_RIGHT_TO_LEFT_OVERRIDE)) {
78*635a8641SAndroid Build Coastguard Worker     return base::i18n::RIGHT_TO_LEFT;
79*635a8641SAndroid Build Coastguard Worker   } else if ((property == U_LEFT_TO_RIGHT) ||
80*635a8641SAndroid Build Coastguard Worker              (property == U_LEFT_TO_RIGHT_EMBEDDING) ||
81*635a8641SAndroid Build Coastguard Worker              (property == U_LEFT_TO_RIGHT_OVERRIDE)) {
82*635a8641SAndroid Build Coastguard Worker     return base::i18n::LEFT_TO_RIGHT;
83*635a8641SAndroid Build Coastguard Worker   }
84*635a8641SAndroid Build Coastguard Worker   return base::i18n::UNKNOWN_DIRECTION;
85*635a8641SAndroid Build Coastguard Worker }
86*635a8641SAndroid Build Coastguard Worker 
87*635a8641SAndroid Build Coastguard Worker }  // namespace
88*635a8641SAndroid Build Coastguard Worker 
89*635a8641SAndroid Build Coastguard Worker namespace base {
90*635a8641SAndroid Build Coastguard Worker namespace i18n {
91*635a8641SAndroid Build Coastguard Worker 
92*635a8641SAndroid Build Coastguard Worker // Represents the locale-specific ICU text direction.
93*635a8641SAndroid Build Coastguard Worker static TextDirection g_icu_text_direction = UNKNOWN_DIRECTION;
94*635a8641SAndroid Build Coastguard Worker 
95*635a8641SAndroid Build Coastguard Worker // Convert the ICU default locale to a string.
GetConfiguredLocale()96*635a8641SAndroid Build Coastguard Worker std::string GetConfiguredLocale() {
97*635a8641SAndroid Build Coastguard Worker   return GetLocaleString(icu::Locale::getDefault());
98*635a8641SAndroid Build Coastguard Worker }
99*635a8641SAndroid Build Coastguard Worker 
100*635a8641SAndroid Build Coastguard Worker // Convert the ICU canonicalized locale to a string.
GetCanonicalLocale(const std::string & locale)101*635a8641SAndroid Build Coastguard Worker std::string GetCanonicalLocale(const std::string& locale) {
102*635a8641SAndroid Build Coastguard Worker   return GetLocaleString(icu::Locale::createCanonical(locale.c_str()));
103*635a8641SAndroid Build Coastguard Worker }
104*635a8641SAndroid Build Coastguard Worker 
105*635a8641SAndroid Build Coastguard Worker // Convert Chrome locale name to ICU locale name
ICULocaleName(const std::string & locale_string)106*635a8641SAndroid Build Coastguard Worker std::string ICULocaleName(const std::string& locale_string) {
107*635a8641SAndroid Build Coastguard Worker   // If not Spanish, just return it.
108*635a8641SAndroid Build Coastguard Worker   if (locale_string.substr(0, 2) != "es")
109*635a8641SAndroid Build Coastguard Worker     return locale_string;
110*635a8641SAndroid Build Coastguard Worker   // Expand es to es-ES.
111*635a8641SAndroid Build Coastguard Worker   if (LowerCaseEqualsASCII(locale_string, "es"))
112*635a8641SAndroid Build Coastguard Worker     return "es-ES";
113*635a8641SAndroid Build Coastguard Worker   // Map es-419 (Latin American Spanish) to es-FOO depending on the system
114*635a8641SAndroid Build Coastguard Worker   // locale.  If it's es-RR other than es-ES, map to es-RR. Otherwise, map
115*635a8641SAndroid Build Coastguard Worker   // to es-MX (the most populous in Spanish-speaking Latin America).
116*635a8641SAndroid Build Coastguard Worker   if (LowerCaseEqualsASCII(locale_string, "es-419")) {
117*635a8641SAndroid Build Coastguard Worker     const icu::Locale& locale = icu::Locale::getDefault();
118*635a8641SAndroid Build Coastguard Worker     std::string language = locale.getLanguage();
119*635a8641SAndroid Build Coastguard Worker     const char* country = locale.getCountry();
120*635a8641SAndroid Build Coastguard Worker     if (LowerCaseEqualsASCII(language, "es") &&
121*635a8641SAndroid Build Coastguard Worker       !LowerCaseEqualsASCII(country, "es")) {
122*635a8641SAndroid Build Coastguard Worker         language += '-';
123*635a8641SAndroid Build Coastguard Worker         language += country;
124*635a8641SAndroid Build Coastguard Worker         return language;
125*635a8641SAndroid Build Coastguard Worker     }
126*635a8641SAndroid Build Coastguard Worker     return "es-MX";
127*635a8641SAndroid Build Coastguard Worker   }
128*635a8641SAndroid Build Coastguard Worker   // Currently, Chrome has only "es" and "es-419", but later we may have
129*635a8641SAndroid Build Coastguard Worker   // more specific "es-RR".
130*635a8641SAndroid Build Coastguard Worker   return locale_string;
131*635a8641SAndroid Build Coastguard Worker }
132*635a8641SAndroid Build Coastguard Worker 
SetICUDefaultLocale(const std::string & locale_string)133*635a8641SAndroid Build Coastguard Worker void SetICUDefaultLocale(const std::string& locale_string) {
134*635a8641SAndroid Build Coastguard Worker #if defined(OS_IOS)
135*635a8641SAndroid Build Coastguard Worker   static base::debug::CrashKeyString* crash_key_locale =
136*635a8641SAndroid Build Coastguard Worker       base::debug::AllocateCrashKeyString("icu_locale_input",
137*635a8641SAndroid Build Coastguard Worker                                           base::debug::CrashKeySize::Size256);
138*635a8641SAndroid Build Coastguard Worker   base::debug::SetCrashKeyString(crash_key_locale, locale_string);
139*635a8641SAndroid Build Coastguard Worker #endif
140*635a8641SAndroid Build Coastguard Worker   icu::Locale locale(ICULocaleName(locale_string).c_str());
141*635a8641SAndroid Build Coastguard Worker   UErrorCode error_code = U_ZERO_ERROR;
142*635a8641SAndroid Build Coastguard Worker   const char* lang = locale.getLanguage();
143*635a8641SAndroid Build Coastguard Worker   if (lang != nullptr && *lang != '\0') {
144*635a8641SAndroid Build Coastguard Worker     icu::Locale::setDefault(locale, error_code);
145*635a8641SAndroid Build Coastguard Worker   } else {
146*635a8641SAndroid Build Coastguard Worker     LOG(ERROR) << "Failed to set the ICU default locale to " << locale_string
147*635a8641SAndroid Build Coastguard Worker                << ". Falling back to en-US.";
148*635a8641SAndroid Build Coastguard Worker     icu::Locale::setDefault(icu::Locale::getUS(), error_code);
149*635a8641SAndroid Build Coastguard Worker   }
150*635a8641SAndroid Build Coastguard Worker   g_icu_text_direction = UNKNOWN_DIRECTION;
151*635a8641SAndroid Build Coastguard Worker }
152*635a8641SAndroid Build Coastguard Worker 
IsRTL()153*635a8641SAndroid Build Coastguard Worker bool IsRTL() {
154*635a8641SAndroid Build Coastguard Worker   return ICUIsRTL();
155*635a8641SAndroid Build Coastguard Worker }
156*635a8641SAndroid Build Coastguard Worker 
SetRTLForTesting(bool rtl)157*635a8641SAndroid Build Coastguard Worker void SetRTLForTesting(bool rtl) {
158*635a8641SAndroid Build Coastguard Worker   SetICUDefaultLocale(rtl ? "he" : "en");
159*635a8641SAndroid Build Coastguard Worker   DCHECK_EQ(rtl, IsRTL());
160*635a8641SAndroid Build Coastguard Worker }
161*635a8641SAndroid Build Coastguard Worker 
ICUIsRTL()162*635a8641SAndroid Build Coastguard Worker bool ICUIsRTL() {
163*635a8641SAndroid Build Coastguard Worker   if (g_icu_text_direction == UNKNOWN_DIRECTION) {
164*635a8641SAndroid Build Coastguard Worker     const icu::Locale& locale = icu::Locale::getDefault();
165*635a8641SAndroid Build Coastguard Worker     g_icu_text_direction = GetTextDirectionForLocaleInStartUp(locale.getName());
166*635a8641SAndroid Build Coastguard Worker   }
167*635a8641SAndroid Build Coastguard Worker   return g_icu_text_direction == RIGHT_TO_LEFT;
168*635a8641SAndroid Build Coastguard Worker }
169*635a8641SAndroid Build Coastguard Worker 
GetForcedTextDirection()170*635a8641SAndroid Build Coastguard Worker TextDirection GetForcedTextDirection() {
171*635a8641SAndroid Build Coastguard Worker // On iOS, check for RTL forcing.
172*635a8641SAndroid Build Coastguard Worker #if defined(OS_IOS)
173*635a8641SAndroid Build Coastguard Worker   if (base::ios::IsInForcedRTL())
174*635a8641SAndroid Build Coastguard Worker     return base::i18n::RIGHT_TO_LEFT;
175*635a8641SAndroid Build Coastguard Worker #endif
176*635a8641SAndroid Build Coastguard Worker 
177*635a8641SAndroid Build Coastguard Worker   base::CommandLine* command_line = base::CommandLine::ForCurrentProcess();
178*635a8641SAndroid Build Coastguard Worker   if (command_line->HasSwitch(switches::kForceUIDirection)) {
179*635a8641SAndroid Build Coastguard Worker     std::string force_flag =
180*635a8641SAndroid Build Coastguard Worker         command_line->GetSwitchValueASCII(switches::kForceUIDirection);
181*635a8641SAndroid Build Coastguard Worker 
182*635a8641SAndroid Build Coastguard Worker     if (force_flag == switches::kForceDirectionLTR)
183*635a8641SAndroid Build Coastguard Worker       return base::i18n::LEFT_TO_RIGHT;
184*635a8641SAndroid Build Coastguard Worker 
185*635a8641SAndroid Build Coastguard Worker     if (force_flag == switches::kForceDirectionRTL)
186*635a8641SAndroid Build Coastguard Worker       return base::i18n::RIGHT_TO_LEFT;
187*635a8641SAndroid Build Coastguard Worker   }
188*635a8641SAndroid Build Coastguard Worker 
189*635a8641SAndroid Build Coastguard Worker   return base::i18n::UNKNOWN_DIRECTION;
190*635a8641SAndroid Build Coastguard Worker }
191*635a8641SAndroid Build Coastguard Worker 
GetTextDirectionForLocaleInStartUp(const char * locale_name)192*635a8641SAndroid Build Coastguard Worker TextDirection GetTextDirectionForLocaleInStartUp(const char* locale_name) {
193*635a8641SAndroid Build Coastguard Worker   // Check for direction forcing.
194*635a8641SAndroid Build Coastguard Worker   TextDirection forced_direction = GetForcedTextDirection();
195*635a8641SAndroid Build Coastguard Worker   if (forced_direction != UNKNOWN_DIRECTION)
196*635a8641SAndroid Build Coastguard Worker     return forced_direction;
197*635a8641SAndroid Build Coastguard Worker 
198*635a8641SAndroid Build Coastguard Worker   // This list needs to be updated in alphabetical order if we add more RTL
199*635a8641SAndroid Build Coastguard Worker   // locales.
200*635a8641SAndroid Build Coastguard Worker   static const char kRTLLanguageCodes[][3] = {"ar", "fa", "he", "iw", "ur"};
201*635a8641SAndroid Build Coastguard Worker   std::vector<StringPiece> locale_split =
202*635a8641SAndroid Build Coastguard Worker       SplitStringPiece(locale_name, "-_", KEEP_WHITESPACE, SPLIT_WANT_ALL);
203*635a8641SAndroid Build Coastguard Worker   const StringPiece& language_code = locale_split[0];
204*635a8641SAndroid Build Coastguard Worker   if (std::binary_search(kRTLLanguageCodes,
205*635a8641SAndroid Build Coastguard Worker                          kRTLLanguageCodes + arraysize(kRTLLanguageCodes),
206*635a8641SAndroid Build Coastguard Worker                          language_code))
207*635a8641SAndroid Build Coastguard Worker     return RIGHT_TO_LEFT;
208*635a8641SAndroid Build Coastguard Worker   return LEFT_TO_RIGHT;
209*635a8641SAndroid Build Coastguard Worker }
210*635a8641SAndroid Build Coastguard Worker 
GetTextDirectionForLocale(const char * locale_name)211*635a8641SAndroid Build Coastguard Worker TextDirection GetTextDirectionForLocale(const char* locale_name) {
212*635a8641SAndroid Build Coastguard Worker   // Check for direction forcing.
213*635a8641SAndroid Build Coastguard Worker   TextDirection forced_direction = GetForcedTextDirection();
214*635a8641SAndroid Build Coastguard Worker   if (forced_direction != UNKNOWN_DIRECTION)
215*635a8641SAndroid Build Coastguard Worker     return forced_direction;
216*635a8641SAndroid Build Coastguard Worker 
217*635a8641SAndroid Build Coastguard Worker   UErrorCode status = U_ZERO_ERROR;
218*635a8641SAndroid Build Coastguard Worker   ULayoutType layout_dir = uloc_getCharacterOrientation(locale_name, &status);
219*635a8641SAndroid Build Coastguard Worker   DCHECK(U_SUCCESS(status));
220*635a8641SAndroid Build Coastguard Worker   // Treat anything other than RTL as LTR.
221*635a8641SAndroid Build Coastguard Worker   return (layout_dir != ULOC_LAYOUT_RTL) ? LEFT_TO_RIGHT : RIGHT_TO_LEFT;
222*635a8641SAndroid Build Coastguard Worker }
223*635a8641SAndroid Build Coastguard Worker 
GetFirstStrongCharacterDirection(const string16 & text)224*635a8641SAndroid Build Coastguard Worker TextDirection GetFirstStrongCharacterDirection(const string16& text) {
225*635a8641SAndroid Build Coastguard Worker   const UChar* string = text.c_str();
226*635a8641SAndroid Build Coastguard Worker   size_t length = text.length();
227*635a8641SAndroid Build Coastguard Worker   size_t position = 0;
228*635a8641SAndroid Build Coastguard Worker   while (position < length) {
229*635a8641SAndroid Build Coastguard Worker     UChar32 character;
230*635a8641SAndroid Build Coastguard Worker     size_t next_position = position;
231*635a8641SAndroid Build Coastguard Worker     U16_NEXT(string, next_position, length, character);
232*635a8641SAndroid Build Coastguard Worker     TextDirection direction = GetCharacterDirection(character);
233*635a8641SAndroid Build Coastguard Worker     if (direction != UNKNOWN_DIRECTION)
234*635a8641SAndroid Build Coastguard Worker       return direction;
235*635a8641SAndroid Build Coastguard Worker     position = next_position;
236*635a8641SAndroid Build Coastguard Worker   }
237*635a8641SAndroid Build Coastguard Worker   return LEFT_TO_RIGHT;
238*635a8641SAndroid Build Coastguard Worker }
239*635a8641SAndroid Build Coastguard Worker 
GetLastStrongCharacterDirection(const string16 & text)240*635a8641SAndroid Build Coastguard Worker TextDirection GetLastStrongCharacterDirection(const string16& text) {
241*635a8641SAndroid Build Coastguard Worker   const UChar* string = text.c_str();
242*635a8641SAndroid Build Coastguard Worker   size_t position = text.length();
243*635a8641SAndroid Build Coastguard Worker   while (position > 0) {
244*635a8641SAndroid Build Coastguard Worker     UChar32 character;
245*635a8641SAndroid Build Coastguard Worker     size_t prev_position = position;
246*635a8641SAndroid Build Coastguard Worker     U16_PREV(string, 0, prev_position, character);
247*635a8641SAndroid Build Coastguard Worker     TextDirection direction = GetCharacterDirection(character);
248*635a8641SAndroid Build Coastguard Worker     if (direction != UNKNOWN_DIRECTION)
249*635a8641SAndroid Build Coastguard Worker       return direction;
250*635a8641SAndroid Build Coastguard Worker     position = prev_position;
251*635a8641SAndroid Build Coastguard Worker   }
252*635a8641SAndroid Build Coastguard Worker   return LEFT_TO_RIGHT;
253*635a8641SAndroid Build Coastguard Worker }
254*635a8641SAndroid Build Coastguard Worker 
GetStringDirection(const string16 & text)255*635a8641SAndroid Build Coastguard Worker TextDirection GetStringDirection(const string16& text) {
256*635a8641SAndroid Build Coastguard Worker   const UChar* string = text.c_str();
257*635a8641SAndroid Build Coastguard Worker   size_t length = text.length();
258*635a8641SAndroid Build Coastguard Worker   size_t position = 0;
259*635a8641SAndroid Build Coastguard Worker 
260*635a8641SAndroid Build Coastguard Worker   TextDirection result(UNKNOWN_DIRECTION);
261*635a8641SAndroid Build Coastguard Worker   while (position < length) {
262*635a8641SAndroid Build Coastguard Worker     UChar32 character;
263*635a8641SAndroid Build Coastguard Worker     size_t next_position = position;
264*635a8641SAndroid Build Coastguard Worker     U16_NEXT(string, next_position, length, character);
265*635a8641SAndroid Build Coastguard Worker     TextDirection direction = GetCharacterDirection(character);
266*635a8641SAndroid Build Coastguard Worker     if (direction != UNKNOWN_DIRECTION) {
267*635a8641SAndroid Build Coastguard Worker       if (result != UNKNOWN_DIRECTION && result != direction)
268*635a8641SAndroid Build Coastguard Worker         return UNKNOWN_DIRECTION;
269*635a8641SAndroid Build Coastguard Worker       result = direction;
270*635a8641SAndroid Build Coastguard Worker     }
271*635a8641SAndroid Build Coastguard Worker     position = next_position;
272*635a8641SAndroid Build Coastguard Worker   }
273*635a8641SAndroid Build Coastguard Worker 
274*635a8641SAndroid Build Coastguard Worker   // Handle the case of a string not containing any strong directionality
275*635a8641SAndroid Build Coastguard Worker   // characters defaulting to LEFT_TO_RIGHT.
276*635a8641SAndroid Build Coastguard Worker   if (result == UNKNOWN_DIRECTION)
277*635a8641SAndroid Build Coastguard Worker     return LEFT_TO_RIGHT;
278*635a8641SAndroid Build Coastguard Worker 
279*635a8641SAndroid Build Coastguard Worker   return result;
280*635a8641SAndroid Build Coastguard Worker }
281*635a8641SAndroid Build Coastguard Worker 
282*635a8641SAndroid Build Coastguard Worker #if defined(OS_WIN)
AdjustStringForLocaleDirection(string16 * text)283*635a8641SAndroid Build Coastguard Worker bool AdjustStringForLocaleDirection(string16* text) {
284*635a8641SAndroid Build Coastguard Worker   if (!IsRTL() || text->empty())
285*635a8641SAndroid Build Coastguard Worker     return false;
286*635a8641SAndroid Build Coastguard Worker 
287*635a8641SAndroid Build Coastguard Worker   // Marking the string as LTR if the locale is RTL and the string does not
288*635a8641SAndroid Build Coastguard Worker   // contain strong RTL characters. Otherwise, mark the string as RTL.
289*635a8641SAndroid Build Coastguard Worker   bool has_rtl_chars = StringContainsStrongRTLChars(*text);
290*635a8641SAndroid Build Coastguard Worker   if (!has_rtl_chars)
291*635a8641SAndroid Build Coastguard Worker     WrapStringWithLTRFormatting(text);
292*635a8641SAndroid Build Coastguard Worker   else
293*635a8641SAndroid Build Coastguard Worker     WrapStringWithRTLFormatting(text);
294*635a8641SAndroid Build Coastguard Worker 
295*635a8641SAndroid Build Coastguard Worker   return true;
296*635a8641SAndroid Build Coastguard Worker }
297*635a8641SAndroid Build Coastguard Worker 
UnadjustStringForLocaleDirection(string16 * text)298*635a8641SAndroid Build Coastguard Worker bool UnadjustStringForLocaleDirection(string16* text) {
299*635a8641SAndroid Build Coastguard Worker   if (!IsRTL() || text->empty())
300*635a8641SAndroid Build Coastguard Worker     return false;
301*635a8641SAndroid Build Coastguard Worker 
302*635a8641SAndroid Build Coastguard Worker   *text = StripWrappingBidiControlCharacters(*text);
303*635a8641SAndroid Build Coastguard Worker   return true;
304*635a8641SAndroid Build Coastguard Worker }
305*635a8641SAndroid Build Coastguard Worker #else
AdjustStringForLocaleDirection(string16 * text)306*635a8641SAndroid Build Coastguard Worker bool AdjustStringForLocaleDirection(string16* text) {
307*635a8641SAndroid Build Coastguard Worker   // On OS X & GTK the directionality of a label is determined by the first
308*635a8641SAndroid Build Coastguard Worker   // strongly directional character.
309*635a8641SAndroid Build Coastguard Worker   // However, we want to make sure that in an LTR-language-UI all strings are
310*635a8641SAndroid Build Coastguard Worker   // left aligned and vice versa.
311*635a8641SAndroid Build Coastguard Worker   // A problem can arise if we display a string which starts with user input.
312*635a8641SAndroid Build Coastguard Worker   // User input may be of the opposite directionality to the UI. So the whole
313*635a8641SAndroid Build Coastguard Worker   // string will be displayed in the opposite directionality, e.g. if we want to
314*635a8641SAndroid Build Coastguard Worker   // display in an LTR UI [such as US English]:
315*635a8641SAndroid Build Coastguard Worker   //
316*635a8641SAndroid Build Coastguard Worker   // EMAN_NOISNETXE is now installed.
317*635a8641SAndroid Build Coastguard Worker   //
318*635a8641SAndroid Build Coastguard Worker   // Since EXTENSION_NAME begins with a strong RTL char, the label's
319*635a8641SAndroid Build Coastguard Worker   // directionality will be set to RTL and the string will be displayed visually
320*635a8641SAndroid Build Coastguard Worker   // as:
321*635a8641SAndroid Build Coastguard Worker   //
322*635a8641SAndroid Build Coastguard Worker   // .is now installed EMAN_NOISNETXE
323*635a8641SAndroid Build Coastguard Worker   //
324*635a8641SAndroid Build Coastguard Worker   // In order to solve this issue, we prepend an LRM to the string. An LRM is a
325*635a8641SAndroid Build Coastguard Worker   // strongly directional LTR char.
326*635a8641SAndroid Build Coastguard Worker   // We also append an LRM at the end, which ensures that we're in an LTR
327*635a8641SAndroid Build Coastguard Worker   // context.
328*635a8641SAndroid Build Coastguard Worker 
329*635a8641SAndroid Build Coastguard Worker   // Unlike Windows, Linux and OS X can correctly display RTL glyphs out of the
330*635a8641SAndroid Build Coastguard Worker   // box so there is no issue with displaying zero-width bidi control characters
331*635a8641SAndroid Build Coastguard Worker   // on any system.  Thus no need for the !IsRTL() check here.
332*635a8641SAndroid Build Coastguard Worker   if (text->empty())
333*635a8641SAndroid Build Coastguard Worker     return false;
334*635a8641SAndroid Build Coastguard Worker 
335*635a8641SAndroid Build Coastguard Worker   bool ui_direction_is_rtl = IsRTL();
336*635a8641SAndroid Build Coastguard Worker 
337*635a8641SAndroid Build Coastguard Worker   bool has_rtl_chars = StringContainsStrongRTLChars(*text);
338*635a8641SAndroid Build Coastguard Worker   if (!ui_direction_is_rtl && has_rtl_chars) {
339*635a8641SAndroid Build Coastguard Worker     WrapStringWithRTLFormatting(text);
340*635a8641SAndroid Build Coastguard Worker     text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
341*635a8641SAndroid Build Coastguard Worker                  kLeftToRightMark);
342*635a8641SAndroid Build Coastguard Worker     text->push_back(kLeftToRightMark);
343*635a8641SAndroid Build Coastguard Worker   } else if (ui_direction_is_rtl && has_rtl_chars) {
344*635a8641SAndroid Build Coastguard Worker     WrapStringWithRTLFormatting(text);
345*635a8641SAndroid Build Coastguard Worker     text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
346*635a8641SAndroid Build Coastguard Worker                  kRightToLeftMark);
347*635a8641SAndroid Build Coastguard Worker     text->push_back(kRightToLeftMark);
348*635a8641SAndroid Build Coastguard Worker   } else if (ui_direction_is_rtl) {
349*635a8641SAndroid Build Coastguard Worker     WrapStringWithLTRFormatting(text);
350*635a8641SAndroid Build Coastguard Worker     text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
351*635a8641SAndroid Build Coastguard Worker                  kRightToLeftMark);
352*635a8641SAndroid Build Coastguard Worker     text->push_back(kRightToLeftMark);
353*635a8641SAndroid Build Coastguard Worker   } else {
354*635a8641SAndroid Build Coastguard Worker     return false;
355*635a8641SAndroid Build Coastguard Worker   }
356*635a8641SAndroid Build Coastguard Worker 
357*635a8641SAndroid Build Coastguard Worker   return true;
358*635a8641SAndroid Build Coastguard Worker }
359*635a8641SAndroid Build Coastguard Worker 
UnadjustStringForLocaleDirection(string16 * text)360*635a8641SAndroid Build Coastguard Worker bool UnadjustStringForLocaleDirection(string16* text) {
361*635a8641SAndroid Build Coastguard Worker   if (text->empty())
362*635a8641SAndroid Build Coastguard Worker     return false;
363*635a8641SAndroid Build Coastguard Worker 
364*635a8641SAndroid Build Coastguard Worker   size_t begin_index = 0;
365*635a8641SAndroid Build Coastguard Worker   char16 begin = text->at(begin_index);
366*635a8641SAndroid Build Coastguard Worker   if (begin == kLeftToRightMark ||
367*635a8641SAndroid Build Coastguard Worker       begin == kRightToLeftMark) {
368*635a8641SAndroid Build Coastguard Worker     ++begin_index;
369*635a8641SAndroid Build Coastguard Worker   }
370*635a8641SAndroid Build Coastguard Worker 
371*635a8641SAndroid Build Coastguard Worker   size_t end_index = text->length() - 1;
372*635a8641SAndroid Build Coastguard Worker   char16 end = text->at(end_index);
373*635a8641SAndroid Build Coastguard Worker   if (end == kLeftToRightMark ||
374*635a8641SAndroid Build Coastguard Worker       end == kRightToLeftMark) {
375*635a8641SAndroid Build Coastguard Worker     --end_index;
376*635a8641SAndroid Build Coastguard Worker   }
377*635a8641SAndroid Build Coastguard Worker 
378*635a8641SAndroid Build Coastguard Worker   string16 unmarked_text =
379*635a8641SAndroid Build Coastguard Worker       text->substr(begin_index, end_index - begin_index + 1);
380*635a8641SAndroid Build Coastguard Worker   *text = StripWrappingBidiControlCharacters(unmarked_text);
381*635a8641SAndroid Build Coastguard Worker   return true;
382*635a8641SAndroid Build Coastguard Worker }
383*635a8641SAndroid Build Coastguard Worker 
384*635a8641SAndroid Build Coastguard Worker #endif  // !OS_WIN
385*635a8641SAndroid Build Coastguard Worker 
EnsureTerminatedDirectionalFormatting(string16 * text)386*635a8641SAndroid Build Coastguard Worker void EnsureTerminatedDirectionalFormatting(string16* text) {
387*635a8641SAndroid Build Coastguard Worker   int count = 0;
388*635a8641SAndroid Build Coastguard Worker   for (auto c : *text) {
389*635a8641SAndroid Build Coastguard Worker     if (c == kLeftToRightEmbeddingMark || c == kRightToLeftEmbeddingMark ||
390*635a8641SAndroid Build Coastguard Worker         c == kLeftToRightOverride || c == kRightToLeftOverride) {
391*635a8641SAndroid Build Coastguard Worker       ++count;
392*635a8641SAndroid Build Coastguard Worker     } else if (c == kPopDirectionalFormatting && count > 0) {
393*635a8641SAndroid Build Coastguard Worker       --count;
394*635a8641SAndroid Build Coastguard Worker     }
395*635a8641SAndroid Build Coastguard Worker   }
396*635a8641SAndroid Build Coastguard Worker   for (int j = 0; j < count; j++)
397*635a8641SAndroid Build Coastguard Worker     text->push_back(kPopDirectionalFormatting);
398*635a8641SAndroid Build Coastguard Worker }
399*635a8641SAndroid Build Coastguard Worker 
SanitizeUserSuppliedString(string16 * text)400*635a8641SAndroid Build Coastguard Worker void SanitizeUserSuppliedString(string16* text) {
401*635a8641SAndroid Build Coastguard Worker   EnsureTerminatedDirectionalFormatting(text);
402*635a8641SAndroid Build Coastguard Worker   AdjustStringForLocaleDirection(text);
403*635a8641SAndroid Build Coastguard Worker }
404*635a8641SAndroid Build Coastguard Worker 
StringContainsStrongRTLChars(const string16 & text)405*635a8641SAndroid Build Coastguard Worker bool StringContainsStrongRTLChars(const string16& text) {
406*635a8641SAndroid Build Coastguard Worker   const UChar* string = text.c_str();
407*635a8641SAndroid Build Coastguard Worker   size_t length = text.length();
408*635a8641SAndroid Build Coastguard Worker   size_t position = 0;
409*635a8641SAndroid Build Coastguard Worker   while (position < length) {
410*635a8641SAndroid Build Coastguard Worker     UChar32 character;
411*635a8641SAndroid Build Coastguard Worker     size_t next_position = position;
412*635a8641SAndroid Build Coastguard Worker     U16_NEXT(string, next_position, length, character);
413*635a8641SAndroid Build Coastguard Worker 
414*635a8641SAndroid Build Coastguard Worker     // Now that we have the character, we use ICU in order to query for the
415*635a8641SAndroid Build Coastguard Worker     // appropriate Unicode BiDi character type.
416*635a8641SAndroid Build Coastguard Worker     int32_t property = u_getIntPropertyValue(character, UCHAR_BIDI_CLASS);
417*635a8641SAndroid Build Coastguard Worker     if ((property == U_RIGHT_TO_LEFT) || (property == U_RIGHT_TO_LEFT_ARABIC))
418*635a8641SAndroid Build Coastguard Worker       return true;
419*635a8641SAndroid Build Coastguard Worker 
420*635a8641SAndroid Build Coastguard Worker     position = next_position;
421*635a8641SAndroid Build Coastguard Worker   }
422*635a8641SAndroid Build Coastguard Worker 
423*635a8641SAndroid Build Coastguard Worker   return false;
424*635a8641SAndroid Build Coastguard Worker }
425*635a8641SAndroid Build Coastguard Worker 
WrapStringWithLTRFormatting(string16 * text)426*635a8641SAndroid Build Coastguard Worker void WrapStringWithLTRFormatting(string16* text) {
427*635a8641SAndroid Build Coastguard Worker   if (text->empty())
428*635a8641SAndroid Build Coastguard Worker     return;
429*635a8641SAndroid Build Coastguard Worker 
430*635a8641SAndroid Build Coastguard Worker   // Inserting an LRE (Left-To-Right Embedding) mark as the first character.
431*635a8641SAndroid Build Coastguard Worker   text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
432*635a8641SAndroid Build Coastguard Worker                kLeftToRightEmbeddingMark);
433*635a8641SAndroid Build Coastguard Worker 
434*635a8641SAndroid Build Coastguard Worker   // Inserting a PDF (Pop Directional Formatting) mark as the last character.
435*635a8641SAndroid Build Coastguard Worker   text->push_back(kPopDirectionalFormatting);
436*635a8641SAndroid Build Coastguard Worker }
437*635a8641SAndroid Build Coastguard Worker 
WrapStringWithRTLFormatting(string16 * text)438*635a8641SAndroid Build Coastguard Worker void WrapStringWithRTLFormatting(string16* text) {
439*635a8641SAndroid Build Coastguard Worker   if (text->empty())
440*635a8641SAndroid Build Coastguard Worker     return;
441*635a8641SAndroid Build Coastguard Worker 
442*635a8641SAndroid Build Coastguard Worker   // Inserting an RLE (Right-To-Left Embedding) mark as the first character.
443*635a8641SAndroid Build Coastguard Worker   text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
444*635a8641SAndroid Build Coastguard Worker                kRightToLeftEmbeddingMark);
445*635a8641SAndroid Build Coastguard Worker 
446*635a8641SAndroid Build Coastguard Worker   // Inserting a PDF (Pop Directional Formatting) mark as the last character.
447*635a8641SAndroid Build Coastguard Worker   text->push_back(kPopDirectionalFormatting);
448*635a8641SAndroid Build Coastguard Worker }
449*635a8641SAndroid Build Coastguard Worker 
WrapPathWithLTRFormatting(const FilePath & path,string16 * rtl_safe_path)450*635a8641SAndroid Build Coastguard Worker void WrapPathWithLTRFormatting(const FilePath& path,
451*635a8641SAndroid Build Coastguard Worker                                string16* rtl_safe_path) {
452*635a8641SAndroid Build Coastguard Worker   // Wrap the overall path with LRE-PDF pair which essentialy marks the
453*635a8641SAndroid Build Coastguard Worker   // string as a Left-To-Right string.
454*635a8641SAndroid Build Coastguard Worker   // Inserting an LRE (Left-To-Right Embedding) mark as the first character.
455*635a8641SAndroid Build Coastguard Worker   rtl_safe_path->push_back(kLeftToRightEmbeddingMark);
456*635a8641SAndroid Build Coastguard Worker #if defined(OS_MACOSX)
457*635a8641SAndroid Build Coastguard Worker     rtl_safe_path->append(UTF8ToUTF16(path.value()));
458*635a8641SAndroid Build Coastguard Worker #elif defined(OS_WIN)
459*635a8641SAndroid Build Coastguard Worker     rtl_safe_path->append(path.value());
460*635a8641SAndroid Build Coastguard Worker #else  // defined(OS_POSIX) && !defined(OS_MACOSX)
461*635a8641SAndroid Build Coastguard Worker     std::wstring wide_path = base::SysNativeMBToWide(path.value());
462*635a8641SAndroid Build Coastguard Worker     rtl_safe_path->append(WideToUTF16(wide_path));
463*635a8641SAndroid Build Coastguard Worker #endif
464*635a8641SAndroid Build Coastguard Worker   // Inserting a PDF (Pop Directional Formatting) mark as the last character.
465*635a8641SAndroid Build Coastguard Worker   rtl_safe_path->push_back(kPopDirectionalFormatting);
466*635a8641SAndroid Build Coastguard Worker }
467*635a8641SAndroid Build Coastguard Worker 
GetDisplayStringInLTRDirectionality(const string16 & text)468*635a8641SAndroid Build Coastguard Worker string16 GetDisplayStringInLTRDirectionality(const string16& text) {
469*635a8641SAndroid Build Coastguard Worker   // Always wrap the string in RTL UI (it may be appended to RTL string).
470*635a8641SAndroid Build Coastguard Worker   // Also wrap strings with an RTL first strong character direction in LTR UI.
471*635a8641SAndroid Build Coastguard Worker   if (IsRTL() || GetFirstStrongCharacterDirection(text) == RIGHT_TO_LEFT) {
472*635a8641SAndroid Build Coastguard Worker     string16 text_mutable(text);
473*635a8641SAndroid Build Coastguard Worker     WrapStringWithLTRFormatting(&text_mutable);
474*635a8641SAndroid Build Coastguard Worker     return text_mutable;
475*635a8641SAndroid Build Coastguard Worker   }
476*635a8641SAndroid Build Coastguard Worker   return text;
477*635a8641SAndroid Build Coastguard Worker }
478*635a8641SAndroid Build Coastguard Worker 
StripWrappingBidiControlCharacters(const string16 & text)479*635a8641SAndroid Build Coastguard Worker string16 StripWrappingBidiControlCharacters(const string16& text) {
480*635a8641SAndroid Build Coastguard Worker   if (text.empty())
481*635a8641SAndroid Build Coastguard Worker     return text;
482*635a8641SAndroid Build Coastguard Worker   size_t begin_index = 0;
483*635a8641SAndroid Build Coastguard Worker   char16 begin = text[begin_index];
484*635a8641SAndroid Build Coastguard Worker   if (begin == kLeftToRightEmbeddingMark ||
485*635a8641SAndroid Build Coastguard Worker       begin == kRightToLeftEmbeddingMark ||
486*635a8641SAndroid Build Coastguard Worker       begin == kLeftToRightOverride ||
487*635a8641SAndroid Build Coastguard Worker       begin == kRightToLeftOverride)
488*635a8641SAndroid Build Coastguard Worker     ++begin_index;
489*635a8641SAndroid Build Coastguard Worker   size_t end_index = text.length() - 1;
490*635a8641SAndroid Build Coastguard Worker   if (text[end_index] == kPopDirectionalFormatting)
491*635a8641SAndroid Build Coastguard Worker     --end_index;
492*635a8641SAndroid Build Coastguard Worker   return text.substr(begin_index, end_index - begin_index + 1);
493*635a8641SAndroid Build Coastguard Worker }
494*635a8641SAndroid Build Coastguard Worker 
495*635a8641SAndroid Build Coastguard Worker }  // namespace i18n
496*635a8641SAndroid Build Coastguard Worker }  // namespace base
497