1*6777b538SAndroid Build Coastguard Worker // Copyright 2011 The Chromium Authors
2*6777b538SAndroid Build Coastguard Worker // Use of this source code is governed by a BSD-style license that can be
3*6777b538SAndroid Build Coastguard Worker // found in the LICENSE file.
4*6777b538SAndroid Build Coastguard Worker
5*6777b538SAndroid Build Coastguard Worker #include "base/i18n/rtl.h"
6*6777b538SAndroid Build Coastguard Worker
7*6777b538SAndroid Build Coastguard Worker #include <stddef.h>
8*6777b538SAndroid Build Coastguard Worker #include <stdint.h>
9*6777b538SAndroid Build Coastguard Worker
10*6777b538SAndroid Build Coastguard Worker #include <algorithm>
11*6777b538SAndroid Build Coastguard Worker #include <string_view>
12*6777b538SAndroid Build Coastguard Worker
13*6777b538SAndroid Build Coastguard Worker #include "base/check_op.h"
14*6777b538SAndroid Build Coastguard Worker #include "base/command_line.h"
15*6777b538SAndroid Build Coastguard Worker #include "base/files/file_path.h"
16*6777b538SAndroid Build Coastguard Worker #include "base/i18n/base_i18n_switches.h"
17*6777b538SAndroid Build Coastguard Worker #include "base/logging.h"
18*6777b538SAndroid Build Coastguard Worker #include "base/strings/string_split.h"
19*6777b538SAndroid Build Coastguard Worker #include "base/strings/string_util.h"
20*6777b538SAndroid Build Coastguard Worker #include "base/strings/sys_string_conversions.h"
21*6777b538SAndroid Build Coastguard Worker #include "base/strings/utf_string_conversions.h"
22*6777b538SAndroid Build Coastguard Worker #include "build/build_config.h"
23*6777b538SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/locid.h"
24*6777b538SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/uchar.h"
25*6777b538SAndroid Build Coastguard Worker #include "third_party/icu/source/common/unicode/uscript.h"
26*6777b538SAndroid Build Coastguard Worker #include "third_party/icu/source/i18n/unicode/coll.h"
27*6777b538SAndroid Build Coastguard Worker
28*6777b538SAndroid Build Coastguard Worker #if BUILDFLAG(IS_IOS)
29*6777b538SAndroid Build Coastguard Worker #include "base/debug/crash_logging.h"
30*6777b538SAndroid Build Coastguard Worker #include "base/ios/ios_util.h"
31*6777b538SAndroid Build Coastguard Worker #endif
32*6777b538SAndroid Build Coastguard Worker
33*6777b538SAndroid Build Coastguard Worker namespace {
34*6777b538SAndroid Build Coastguard Worker
35*6777b538SAndroid Build Coastguard Worker // Extract language, country and variant, but ignore keywords. For example,
36*6777b538SAndroid Build Coastguard Worker // en-US, ca@valencia, ca-ES@valencia.
GetLocaleString(const icu::Locale & locale)37*6777b538SAndroid Build Coastguard Worker std::string GetLocaleString(const icu::Locale& locale) {
38*6777b538SAndroid Build Coastguard Worker const char* language = locale.getLanguage();
39*6777b538SAndroid Build Coastguard Worker const char* country = locale.getCountry();
40*6777b538SAndroid Build Coastguard Worker const char* variant = locale.getVariant();
41*6777b538SAndroid Build Coastguard Worker const char* script = locale.getScript();
42*6777b538SAndroid Build Coastguard Worker
43*6777b538SAndroid Build Coastguard Worker std::string result =
44*6777b538SAndroid Build Coastguard Worker (language != nullptr && *language != '\0') ? language : "und";
45*6777b538SAndroid Build Coastguard Worker
46*6777b538SAndroid Build Coastguard Worker if (script != nullptr && *script != '\0') {
47*6777b538SAndroid Build Coastguard Worker result += '-';
48*6777b538SAndroid Build Coastguard Worker result += script;
49*6777b538SAndroid Build Coastguard Worker }
50*6777b538SAndroid Build Coastguard Worker
51*6777b538SAndroid Build Coastguard Worker if (country != nullptr && *country != '\0') {
52*6777b538SAndroid Build Coastguard Worker result += '-';
53*6777b538SAndroid Build Coastguard Worker result += country;
54*6777b538SAndroid Build Coastguard Worker }
55*6777b538SAndroid Build Coastguard Worker
56*6777b538SAndroid Build Coastguard Worker if (variant != nullptr && *variant != '\0')
57*6777b538SAndroid Build Coastguard Worker result += '@' + base::ToLowerASCII(variant);
58*6777b538SAndroid Build Coastguard Worker
59*6777b538SAndroid Build Coastguard Worker return result;
60*6777b538SAndroid Build Coastguard Worker }
61*6777b538SAndroid Build Coastguard Worker
62*6777b538SAndroid Build Coastguard Worker // Returns LEFT_TO_RIGHT or RIGHT_TO_LEFT if |character| has strong
63*6777b538SAndroid Build Coastguard Worker // directionality, returns UNKNOWN_DIRECTION if it doesn't. Please refer to
64*6777b538SAndroid Build Coastguard Worker // http://unicode.org/reports/tr9/ for more information.
GetCharacterDirection(UChar32 character)65*6777b538SAndroid Build Coastguard Worker base::i18n::TextDirection GetCharacterDirection(UChar32 character) {
66*6777b538SAndroid Build Coastguard Worker static bool has_switch = base::CommandLine::ForCurrentProcess()->HasSwitch(
67*6777b538SAndroid Build Coastguard Worker switches::kForceTextDirection);
68*6777b538SAndroid Build Coastguard Worker if (has_switch) {
69*6777b538SAndroid Build Coastguard Worker base::CommandLine* command_line = base::CommandLine::ForCurrentProcess();
70*6777b538SAndroid Build Coastguard Worker std::string force_flag =
71*6777b538SAndroid Build Coastguard Worker command_line->GetSwitchValueASCII(switches::kForceTextDirection);
72*6777b538SAndroid Build Coastguard Worker
73*6777b538SAndroid Build Coastguard Worker if (force_flag == switches::kForceDirectionRTL)
74*6777b538SAndroid Build Coastguard Worker return base::i18n::RIGHT_TO_LEFT;
75*6777b538SAndroid Build Coastguard Worker if (force_flag == switches::kForceDirectionLTR)
76*6777b538SAndroid Build Coastguard Worker return base::i18n::LEFT_TO_RIGHT;
77*6777b538SAndroid Build Coastguard Worker }
78*6777b538SAndroid Build Coastguard Worker // Now that we have the character, we use ICU in order to query for the
79*6777b538SAndroid Build Coastguard Worker // appropriate Unicode BiDi character type.
80*6777b538SAndroid Build Coastguard Worker int32_t property = u_getIntPropertyValue(character, UCHAR_BIDI_CLASS);
81*6777b538SAndroid Build Coastguard Worker switch (property) {
82*6777b538SAndroid Build Coastguard Worker case U_RIGHT_TO_LEFT:
83*6777b538SAndroid Build Coastguard Worker case U_RIGHT_TO_LEFT_ARABIC:
84*6777b538SAndroid Build Coastguard Worker case U_RIGHT_TO_LEFT_EMBEDDING:
85*6777b538SAndroid Build Coastguard Worker case U_RIGHT_TO_LEFT_OVERRIDE:
86*6777b538SAndroid Build Coastguard Worker return base::i18n::RIGHT_TO_LEFT;
87*6777b538SAndroid Build Coastguard Worker case U_LEFT_TO_RIGHT:
88*6777b538SAndroid Build Coastguard Worker case U_LEFT_TO_RIGHT_EMBEDDING:
89*6777b538SAndroid Build Coastguard Worker case U_LEFT_TO_RIGHT_OVERRIDE:
90*6777b538SAndroid Build Coastguard Worker return base::i18n::LEFT_TO_RIGHT;
91*6777b538SAndroid Build Coastguard Worker }
92*6777b538SAndroid Build Coastguard Worker return base::i18n::UNKNOWN_DIRECTION;
93*6777b538SAndroid Build Coastguard Worker }
94*6777b538SAndroid Build Coastguard Worker
95*6777b538SAndroid Build Coastguard Worker } // namespace
96*6777b538SAndroid Build Coastguard Worker
97*6777b538SAndroid Build Coastguard Worker namespace base {
98*6777b538SAndroid Build Coastguard Worker namespace i18n {
99*6777b538SAndroid Build Coastguard Worker
100*6777b538SAndroid Build Coastguard Worker // Represents the locale-specific ICU text direction.
101*6777b538SAndroid Build Coastguard Worker static TextDirection g_icu_text_direction = UNKNOWN_DIRECTION;
102*6777b538SAndroid Build Coastguard Worker
103*6777b538SAndroid Build Coastguard Worker // Convert the ICU default locale to a string.
GetConfiguredLocale()104*6777b538SAndroid Build Coastguard Worker std::string GetConfiguredLocale() {
105*6777b538SAndroid Build Coastguard Worker return GetLocaleString(icu::Locale::getDefault());
106*6777b538SAndroid Build Coastguard Worker }
107*6777b538SAndroid Build Coastguard Worker
108*6777b538SAndroid Build Coastguard Worker // Convert the ICU canonicalized locale to a string.
GetCanonicalLocale(const std::string & locale)109*6777b538SAndroid Build Coastguard Worker std::string GetCanonicalLocale(const std::string& locale) {
110*6777b538SAndroid Build Coastguard Worker return GetLocaleString(icu::Locale::createCanonical(locale.c_str()));
111*6777b538SAndroid Build Coastguard Worker }
112*6777b538SAndroid Build Coastguard Worker
113*6777b538SAndroid Build Coastguard Worker // Convert Chrome locale name to ICU locale name
ICULocaleName(const std::string & locale_string)114*6777b538SAndroid Build Coastguard Worker std::string ICULocaleName(const std::string& locale_string) {
115*6777b538SAndroid Build Coastguard Worker // If not Spanish, just return it.
116*6777b538SAndroid Build Coastguard Worker if (locale_string.substr(0, 2) != "es")
117*6777b538SAndroid Build Coastguard Worker return locale_string;
118*6777b538SAndroid Build Coastguard Worker // Expand es to es-ES.
119*6777b538SAndroid Build Coastguard Worker if (EqualsCaseInsensitiveASCII(locale_string, "es"))
120*6777b538SAndroid Build Coastguard Worker return "es-ES";
121*6777b538SAndroid Build Coastguard Worker // Map es-419 (Latin American Spanish) to es-FOO depending on the system
122*6777b538SAndroid Build Coastguard Worker // locale. If it's es-RR other than es-ES, map to es-RR. Otherwise, map
123*6777b538SAndroid Build Coastguard Worker // to es-MX (the most populous in Spanish-speaking Latin America).
124*6777b538SAndroid Build Coastguard Worker if (EqualsCaseInsensitiveASCII(locale_string, "es-419")) {
125*6777b538SAndroid Build Coastguard Worker const icu::Locale& locale = icu::Locale::getDefault();
126*6777b538SAndroid Build Coastguard Worker std::string language = locale.getLanguage();
127*6777b538SAndroid Build Coastguard Worker const char* country = locale.getCountry();
128*6777b538SAndroid Build Coastguard Worker if (EqualsCaseInsensitiveASCII(language, "es") &&
129*6777b538SAndroid Build Coastguard Worker !EqualsCaseInsensitiveASCII(country, "es")) {
130*6777b538SAndroid Build Coastguard Worker language += '-';
131*6777b538SAndroid Build Coastguard Worker language += country;
132*6777b538SAndroid Build Coastguard Worker return language;
133*6777b538SAndroid Build Coastguard Worker }
134*6777b538SAndroid Build Coastguard Worker return "es-MX";
135*6777b538SAndroid Build Coastguard Worker }
136*6777b538SAndroid Build Coastguard Worker // Currently, Chrome has only "es" and "es-419", but later we may have
137*6777b538SAndroid Build Coastguard Worker // more specific "es-RR".
138*6777b538SAndroid Build Coastguard Worker return locale_string;
139*6777b538SAndroid Build Coastguard Worker }
140*6777b538SAndroid Build Coastguard Worker
SetICUDefaultLocale(const std::string & locale_string)141*6777b538SAndroid Build Coastguard Worker void SetICUDefaultLocale(const std::string& locale_string) {
142*6777b538SAndroid Build Coastguard Worker #if BUILDFLAG(IS_IOS)
143*6777b538SAndroid Build Coastguard Worker static base::debug::CrashKeyString* crash_key_locale =
144*6777b538SAndroid Build Coastguard Worker base::debug::AllocateCrashKeyString("icu_locale_input",
145*6777b538SAndroid Build Coastguard Worker base::debug::CrashKeySize::Size256);
146*6777b538SAndroid Build Coastguard Worker base::debug::SetCrashKeyString(crash_key_locale, locale_string);
147*6777b538SAndroid Build Coastguard Worker #endif
148*6777b538SAndroid Build Coastguard Worker icu::Locale locale(ICULocaleName(locale_string).c_str());
149*6777b538SAndroid Build Coastguard Worker UErrorCode error_code = U_ZERO_ERROR;
150*6777b538SAndroid Build Coastguard Worker const char* lang = locale.getLanguage();
151*6777b538SAndroid Build Coastguard Worker if (lang != nullptr && *lang != '\0') {
152*6777b538SAndroid Build Coastguard Worker icu::Locale::setDefault(locale, error_code);
153*6777b538SAndroid Build Coastguard Worker } else {
154*6777b538SAndroid Build Coastguard Worker LOG(ERROR) << "Failed to set the ICU default locale to " << locale_string
155*6777b538SAndroid Build Coastguard Worker << ". Falling back to en-US.";
156*6777b538SAndroid Build Coastguard Worker icu::Locale::setDefault(icu::Locale::getUS(), error_code);
157*6777b538SAndroid Build Coastguard Worker }
158*6777b538SAndroid Build Coastguard Worker g_icu_text_direction = UNKNOWN_DIRECTION;
159*6777b538SAndroid Build Coastguard Worker }
160*6777b538SAndroid Build Coastguard Worker
IsRTL()161*6777b538SAndroid Build Coastguard Worker bool IsRTL() {
162*6777b538SAndroid Build Coastguard Worker return ICUIsRTL();
163*6777b538SAndroid Build Coastguard Worker }
164*6777b538SAndroid Build Coastguard Worker
SetRTLForTesting(bool rtl)165*6777b538SAndroid Build Coastguard Worker void SetRTLForTesting(bool rtl) {
166*6777b538SAndroid Build Coastguard Worker SetICUDefaultLocale(rtl ? "he" : "en");
167*6777b538SAndroid Build Coastguard Worker DCHECK_EQ(rtl, IsRTL());
168*6777b538SAndroid Build Coastguard Worker }
169*6777b538SAndroid Build Coastguard Worker
ICUIsRTL()170*6777b538SAndroid Build Coastguard Worker bool ICUIsRTL() {
171*6777b538SAndroid Build Coastguard Worker if (g_icu_text_direction == UNKNOWN_DIRECTION) {
172*6777b538SAndroid Build Coastguard Worker const icu::Locale& locale = icu::Locale::getDefault();
173*6777b538SAndroid Build Coastguard Worker g_icu_text_direction = GetTextDirectionForLocaleInStartUp(locale.getName());
174*6777b538SAndroid Build Coastguard Worker }
175*6777b538SAndroid Build Coastguard Worker return g_icu_text_direction == RIGHT_TO_LEFT;
176*6777b538SAndroid Build Coastguard Worker }
177*6777b538SAndroid Build Coastguard Worker
GetForcedTextDirection()178*6777b538SAndroid Build Coastguard Worker TextDirection GetForcedTextDirection() {
179*6777b538SAndroid Build Coastguard Worker // On iOS, check for RTL forcing.
180*6777b538SAndroid Build Coastguard Worker #if BUILDFLAG(IS_IOS)
181*6777b538SAndroid Build Coastguard Worker if (base::ios::IsInForcedRTL())
182*6777b538SAndroid Build Coastguard Worker return base::i18n::RIGHT_TO_LEFT;
183*6777b538SAndroid Build Coastguard Worker #endif
184*6777b538SAndroid Build Coastguard Worker
185*6777b538SAndroid Build Coastguard Worker base::CommandLine* command_line = base::CommandLine::ForCurrentProcess();
186*6777b538SAndroid Build Coastguard Worker if (command_line->HasSwitch(switches::kForceUIDirection)) {
187*6777b538SAndroid Build Coastguard Worker std::string force_flag =
188*6777b538SAndroid Build Coastguard Worker command_line->GetSwitchValueASCII(switches::kForceUIDirection);
189*6777b538SAndroid Build Coastguard Worker
190*6777b538SAndroid Build Coastguard Worker if (force_flag == switches::kForceDirectionLTR)
191*6777b538SAndroid Build Coastguard Worker return base::i18n::LEFT_TO_RIGHT;
192*6777b538SAndroid Build Coastguard Worker
193*6777b538SAndroid Build Coastguard Worker if (force_flag == switches::kForceDirectionRTL)
194*6777b538SAndroid Build Coastguard Worker return base::i18n::RIGHT_TO_LEFT;
195*6777b538SAndroid Build Coastguard Worker }
196*6777b538SAndroid Build Coastguard Worker
197*6777b538SAndroid Build Coastguard Worker return base::i18n::UNKNOWN_DIRECTION;
198*6777b538SAndroid Build Coastguard Worker }
199*6777b538SAndroid Build Coastguard Worker
GetTextDirectionForLocaleInStartUp(const char * locale_name)200*6777b538SAndroid Build Coastguard Worker TextDirection GetTextDirectionForLocaleInStartUp(const char* locale_name) {
201*6777b538SAndroid Build Coastguard Worker // Check for direction forcing.
202*6777b538SAndroid Build Coastguard Worker TextDirection forced_direction = GetForcedTextDirection();
203*6777b538SAndroid Build Coastguard Worker if (forced_direction != UNKNOWN_DIRECTION)
204*6777b538SAndroid Build Coastguard Worker return forced_direction;
205*6777b538SAndroid Build Coastguard Worker
206*6777b538SAndroid Build Coastguard Worker // This list needs to be updated in alphabetical order if we add more RTL
207*6777b538SAndroid Build Coastguard Worker // locales.
208*6777b538SAndroid Build Coastguard Worker static const char kRTLLanguageCodes[][3] = {"ar", "fa", "he", "iw", "ur"};
209*6777b538SAndroid Build Coastguard Worker std::vector<std::string_view> locale_split =
210*6777b538SAndroid Build Coastguard Worker SplitStringPiece(locale_name, "-_", KEEP_WHITESPACE, SPLIT_WANT_ALL);
211*6777b538SAndroid Build Coastguard Worker std::string_view language_code = locale_split[0];
212*6777b538SAndroid Build Coastguard Worker if (std::binary_search(kRTLLanguageCodes,
213*6777b538SAndroid Build Coastguard Worker kRTLLanguageCodes + std::size(kRTLLanguageCodes),
214*6777b538SAndroid Build Coastguard Worker language_code))
215*6777b538SAndroid Build Coastguard Worker return RIGHT_TO_LEFT;
216*6777b538SAndroid Build Coastguard Worker return LEFT_TO_RIGHT;
217*6777b538SAndroid Build Coastguard Worker }
218*6777b538SAndroid Build Coastguard Worker
GetTextDirectionForLocale(const char * locale_name)219*6777b538SAndroid Build Coastguard Worker TextDirection GetTextDirectionForLocale(const char* locale_name) {
220*6777b538SAndroid Build Coastguard Worker // Check for direction forcing.
221*6777b538SAndroid Build Coastguard Worker TextDirection forced_direction = GetForcedTextDirection();
222*6777b538SAndroid Build Coastguard Worker if (forced_direction != UNKNOWN_DIRECTION)
223*6777b538SAndroid Build Coastguard Worker return forced_direction;
224*6777b538SAndroid Build Coastguard Worker
225*6777b538SAndroid Build Coastguard Worker UErrorCode status = U_ZERO_ERROR;
226*6777b538SAndroid Build Coastguard Worker ULayoutType layout_dir = uloc_getCharacterOrientation(locale_name, &status);
227*6777b538SAndroid Build Coastguard Worker DCHECK(U_SUCCESS(status));
228*6777b538SAndroid Build Coastguard Worker // Treat anything other than RTL as LTR.
229*6777b538SAndroid Build Coastguard Worker return (layout_dir != ULOC_LAYOUT_RTL) ? LEFT_TO_RIGHT : RIGHT_TO_LEFT;
230*6777b538SAndroid Build Coastguard Worker }
231*6777b538SAndroid Build Coastguard Worker
GetFirstStrongCharacterDirection(const std::u16string & text)232*6777b538SAndroid Build Coastguard Worker TextDirection GetFirstStrongCharacterDirection(const std::u16string& text) {
233*6777b538SAndroid Build Coastguard Worker const char16_t* string = text.c_str();
234*6777b538SAndroid Build Coastguard Worker size_t length = text.length();
235*6777b538SAndroid Build Coastguard Worker size_t position = 0;
236*6777b538SAndroid Build Coastguard Worker while (position < length) {
237*6777b538SAndroid Build Coastguard Worker UChar32 character;
238*6777b538SAndroid Build Coastguard Worker size_t next_position = position;
239*6777b538SAndroid Build Coastguard Worker U16_NEXT(string, next_position, length, character);
240*6777b538SAndroid Build Coastguard Worker TextDirection direction = GetCharacterDirection(character);
241*6777b538SAndroid Build Coastguard Worker if (direction != UNKNOWN_DIRECTION)
242*6777b538SAndroid Build Coastguard Worker return direction;
243*6777b538SAndroid Build Coastguard Worker position = next_position;
244*6777b538SAndroid Build Coastguard Worker }
245*6777b538SAndroid Build Coastguard Worker return LEFT_TO_RIGHT;
246*6777b538SAndroid Build Coastguard Worker }
247*6777b538SAndroid Build Coastguard Worker
GetLastStrongCharacterDirection(const std::u16string & text)248*6777b538SAndroid Build Coastguard Worker TextDirection GetLastStrongCharacterDirection(const std::u16string& text) {
249*6777b538SAndroid Build Coastguard Worker const char16_t* string = text.c_str();
250*6777b538SAndroid Build Coastguard Worker size_t position = text.length();
251*6777b538SAndroid Build Coastguard Worker while (position > 0) {
252*6777b538SAndroid Build Coastguard Worker UChar32 character;
253*6777b538SAndroid Build Coastguard Worker size_t prev_position = position;
254*6777b538SAndroid Build Coastguard Worker U16_PREV(string, 0, prev_position, character);
255*6777b538SAndroid Build Coastguard Worker TextDirection direction = GetCharacterDirection(character);
256*6777b538SAndroid Build Coastguard Worker if (direction != UNKNOWN_DIRECTION)
257*6777b538SAndroid Build Coastguard Worker return direction;
258*6777b538SAndroid Build Coastguard Worker position = prev_position;
259*6777b538SAndroid Build Coastguard Worker }
260*6777b538SAndroid Build Coastguard Worker return LEFT_TO_RIGHT;
261*6777b538SAndroid Build Coastguard Worker }
262*6777b538SAndroid Build Coastguard Worker
GetStringDirection(const std::u16string & text)263*6777b538SAndroid Build Coastguard Worker TextDirection GetStringDirection(const std::u16string& text) {
264*6777b538SAndroid Build Coastguard Worker const char16_t* string = text.c_str();
265*6777b538SAndroid Build Coastguard Worker size_t length = text.length();
266*6777b538SAndroid Build Coastguard Worker size_t position = 0;
267*6777b538SAndroid Build Coastguard Worker
268*6777b538SAndroid Build Coastguard Worker TextDirection result(UNKNOWN_DIRECTION);
269*6777b538SAndroid Build Coastguard Worker while (position < length) {
270*6777b538SAndroid Build Coastguard Worker UChar32 character;
271*6777b538SAndroid Build Coastguard Worker size_t next_position = position;
272*6777b538SAndroid Build Coastguard Worker U16_NEXT(string, next_position, length, character);
273*6777b538SAndroid Build Coastguard Worker TextDirection direction = GetCharacterDirection(character);
274*6777b538SAndroid Build Coastguard Worker if (direction != UNKNOWN_DIRECTION) {
275*6777b538SAndroid Build Coastguard Worker if (result != UNKNOWN_DIRECTION && result != direction)
276*6777b538SAndroid Build Coastguard Worker return UNKNOWN_DIRECTION;
277*6777b538SAndroid Build Coastguard Worker result = direction;
278*6777b538SAndroid Build Coastguard Worker }
279*6777b538SAndroid Build Coastguard Worker position = next_position;
280*6777b538SAndroid Build Coastguard Worker }
281*6777b538SAndroid Build Coastguard Worker
282*6777b538SAndroid Build Coastguard Worker // Handle the case of a string not containing any strong directionality
283*6777b538SAndroid Build Coastguard Worker // characters defaulting to LEFT_TO_RIGHT.
284*6777b538SAndroid Build Coastguard Worker if (result == UNKNOWN_DIRECTION)
285*6777b538SAndroid Build Coastguard Worker return LEFT_TO_RIGHT;
286*6777b538SAndroid Build Coastguard Worker
287*6777b538SAndroid Build Coastguard Worker return result;
288*6777b538SAndroid Build Coastguard Worker }
289*6777b538SAndroid Build Coastguard Worker
290*6777b538SAndroid Build Coastguard Worker #if BUILDFLAG(IS_WIN)
AdjustStringForLocaleDirection(std::u16string * text)291*6777b538SAndroid Build Coastguard Worker bool AdjustStringForLocaleDirection(std::u16string* text) {
292*6777b538SAndroid Build Coastguard Worker if (!IsRTL() || text->empty())
293*6777b538SAndroid Build Coastguard Worker return false;
294*6777b538SAndroid Build Coastguard Worker
295*6777b538SAndroid Build Coastguard Worker // Marking the string as LTR if the locale is RTL and the string does not
296*6777b538SAndroid Build Coastguard Worker // contain strong RTL characters. Otherwise, mark the string as RTL.
297*6777b538SAndroid Build Coastguard Worker bool has_rtl_chars = StringContainsStrongRTLChars(*text);
298*6777b538SAndroid Build Coastguard Worker if (!has_rtl_chars)
299*6777b538SAndroid Build Coastguard Worker WrapStringWithLTRFormatting(text);
300*6777b538SAndroid Build Coastguard Worker else
301*6777b538SAndroid Build Coastguard Worker WrapStringWithRTLFormatting(text);
302*6777b538SAndroid Build Coastguard Worker
303*6777b538SAndroid Build Coastguard Worker return true;
304*6777b538SAndroid Build Coastguard Worker }
305*6777b538SAndroid Build Coastguard Worker
UnadjustStringForLocaleDirection(std::u16string * text)306*6777b538SAndroid Build Coastguard Worker bool UnadjustStringForLocaleDirection(std::u16string* text) {
307*6777b538SAndroid Build Coastguard Worker if (!IsRTL() || text->empty())
308*6777b538SAndroid Build Coastguard Worker return false;
309*6777b538SAndroid Build Coastguard Worker
310*6777b538SAndroid Build Coastguard Worker *text = StripWrappingBidiControlCharacters(*text);
311*6777b538SAndroid Build Coastguard Worker return true;
312*6777b538SAndroid Build Coastguard Worker }
313*6777b538SAndroid Build Coastguard Worker #else
AdjustStringForLocaleDirection(std::u16string * text)314*6777b538SAndroid Build Coastguard Worker bool AdjustStringForLocaleDirection(std::u16string* text) {
315*6777b538SAndroid Build Coastguard Worker // On OS X & GTK the directionality of a label is determined by the first
316*6777b538SAndroid Build Coastguard Worker // strongly directional character.
317*6777b538SAndroid Build Coastguard Worker // However, we want to make sure that in an LTR-language-UI all strings are
318*6777b538SAndroid Build Coastguard Worker // left aligned and vice versa.
319*6777b538SAndroid Build Coastguard Worker // A problem can arise if we display a string which starts with user input.
320*6777b538SAndroid Build Coastguard Worker // User input may be of the opposite directionality to the UI. So the whole
321*6777b538SAndroid Build Coastguard Worker // string will be displayed in the opposite directionality, e.g. if we want to
322*6777b538SAndroid Build Coastguard Worker // display in an LTR UI [such as US English]:
323*6777b538SAndroid Build Coastguard Worker //
324*6777b538SAndroid Build Coastguard Worker // EMAN_NOISNETXE is now installed.
325*6777b538SAndroid Build Coastguard Worker //
326*6777b538SAndroid Build Coastguard Worker // Since EXTENSION_NAME begins with a strong RTL char, the label's
327*6777b538SAndroid Build Coastguard Worker // directionality will be set to RTL and the string will be displayed visually
328*6777b538SAndroid Build Coastguard Worker // as:
329*6777b538SAndroid Build Coastguard Worker //
330*6777b538SAndroid Build Coastguard Worker // .is now installed EMAN_NOISNETXE
331*6777b538SAndroid Build Coastguard Worker //
332*6777b538SAndroid Build Coastguard Worker // In order to solve this issue, we prepend an LRM to the string. An LRM is a
333*6777b538SAndroid Build Coastguard Worker // strongly directional LTR char.
334*6777b538SAndroid Build Coastguard Worker // We also append an LRM at the end, which ensures that we're in an LTR
335*6777b538SAndroid Build Coastguard Worker // context.
336*6777b538SAndroid Build Coastguard Worker
337*6777b538SAndroid Build Coastguard Worker // Unlike Windows, Linux and OS X can correctly display RTL glyphs out of the
338*6777b538SAndroid Build Coastguard Worker // box so there is no issue with displaying zero-width bidi control characters
339*6777b538SAndroid Build Coastguard Worker // on any system. Thus no need for the !IsRTL() check here.
340*6777b538SAndroid Build Coastguard Worker if (text->empty())
341*6777b538SAndroid Build Coastguard Worker return false;
342*6777b538SAndroid Build Coastguard Worker
343*6777b538SAndroid Build Coastguard Worker bool ui_direction_is_rtl = IsRTL();
344*6777b538SAndroid Build Coastguard Worker
345*6777b538SAndroid Build Coastguard Worker bool has_rtl_chars = StringContainsStrongRTLChars(*text);
346*6777b538SAndroid Build Coastguard Worker if (!ui_direction_is_rtl && has_rtl_chars) {
347*6777b538SAndroid Build Coastguard Worker WrapStringWithRTLFormatting(text);
348*6777b538SAndroid Build Coastguard Worker text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
349*6777b538SAndroid Build Coastguard Worker kLeftToRightMark);
350*6777b538SAndroid Build Coastguard Worker text->push_back(kLeftToRightMark);
351*6777b538SAndroid Build Coastguard Worker } else if (ui_direction_is_rtl && has_rtl_chars) {
352*6777b538SAndroid Build Coastguard Worker WrapStringWithRTLFormatting(text);
353*6777b538SAndroid Build Coastguard Worker text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
354*6777b538SAndroid Build Coastguard Worker kRightToLeftMark);
355*6777b538SAndroid Build Coastguard Worker text->push_back(kRightToLeftMark);
356*6777b538SAndroid Build Coastguard Worker } else if (ui_direction_is_rtl) {
357*6777b538SAndroid Build Coastguard Worker WrapStringWithLTRFormatting(text);
358*6777b538SAndroid Build Coastguard Worker text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
359*6777b538SAndroid Build Coastguard Worker kRightToLeftMark);
360*6777b538SAndroid Build Coastguard Worker text->push_back(kRightToLeftMark);
361*6777b538SAndroid Build Coastguard Worker } else {
362*6777b538SAndroid Build Coastguard Worker return false;
363*6777b538SAndroid Build Coastguard Worker }
364*6777b538SAndroid Build Coastguard Worker
365*6777b538SAndroid Build Coastguard Worker return true;
366*6777b538SAndroid Build Coastguard Worker }
367*6777b538SAndroid Build Coastguard Worker
UnadjustStringForLocaleDirection(std::u16string * text)368*6777b538SAndroid Build Coastguard Worker bool UnadjustStringForLocaleDirection(std::u16string* text) {
369*6777b538SAndroid Build Coastguard Worker if (text->empty())
370*6777b538SAndroid Build Coastguard Worker return false;
371*6777b538SAndroid Build Coastguard Worker
372*6777b538SAndroid Build Coastguard Worker size_t begin_index = 0;
373*6777b538SAndroid Build Coastguard Worker char16_t begin = text->at(begin_index);
374*6777b538SAndroid Build Coastguard Worker if (begin == kLeftToRightMark ||
375*6777b538SAndroid Build Coastguard Worker begin == kRightToLeftMark) {
376*6777b538SAndroid Build Coastguard Worker ++begin_index;
377*6777b538SAndroid Build Coastguard Worker }
378*6777b538SAndroid Build Coastguard Worker
379*6777b538SAndroid Build Coastguard Worker size_t end_index = text->length() - 1;
380*6777b538SAndroid Build Coastguard Worker char16_t end = text->at(end_index);
381*6777b538SAndroid Build Coastguard Worker if (end == kLeftToRightMark ||
382*6777b538SAndroid Build Coastguard Worker end == kRightToLeftMark) {
383*6777b538SAndroid Build Coastguard Worker --end_index;
384*6777b538SAndroid Build Coastguard Worker }
385*6777b538SAndroid Build Coastguard Worker
386*6777b538SAndroid Build Coastguard Worker std::u16string unmarked_text =
387*6777b538SAndroid Build Coastguard Worker text->substr(begin_index, end_index - begin_index + 1);
388*6777b538SAndroid Build Coastguard Worker *text = StripWrappingBidiControlCharacters(unmarked_text);
389*6777b538SAndroid Build Coastguard Worker return true;
390*6777b538SAndroid Build Coastguard Worker }
391*6777b538SAndroid Build Coastguard Worker
392*6777b538SAndroid Build Coastguard Worker #endif // !BUILDFLAG(IS_WIN)
393*6777b538SAndroid Build Coastguard Worker
EnsureTerminatedDirectionalFormatting(std::u16string * text)394*6777b538SAndroid Build Coastguard Worker void EnsureTerminatedDirectionalFormatting(std::u16string* text) {
395*6777b538SAndroid Build Coastguard Worker int count = 0;
396*6777b538SAndroid Build Coastguard Worker for (auto c : *text) {
397*6777b538SAndroid Build Coastguard Worker if (c == kLeftToRightEmbeddingMark || c == kRightToLeftEmbeddingMark ||
398*6777b538SAndroid Build Coastguard Worker c == kLeftToRightOverride || c == kRightToLeftOverride) {
399*6777b538SAndroid Build Coastguard Worker ++count;
400*6777b538SAndroid Build Coastguard Worker } else if (c == kPopDirectionalFormatting && count > 0) {
401*6777b538SAndroid Build Coastguard Worker --count;
402*6777b538SAndroid Build Coastguard Worker }
403*6777b538SAndroid Build Coastguard Worker }
404*6777b538SAndroid Build Coastguard Worker for (int j = 0; j < count; j++)
405*6777b538SAndroid Build Coastguard Worker text->push_back(kPopDirectionalFormatting);
406*6777b538SAndroid Build Coastguard Worker }
407*6777b538SAndroid Build Coastguard Worker
SanitizeUserSuppliedString(std::u16string * text)408*6777b538SAndroid Build Coastguard Worker void SanitizeUserSuppliedString(std::u16string* text) {
409*6777b538SAndroid Build Coastguard Worker EnsureTerminatedDirectionalFormatting(text);
410*6777b538SAndroid Build Coastguard Worker AdjustStringForLocaleDirection(text);
411*6777b538SAndroid Build Coastguard Worker }
412*6777b538SAndroid Build Coastguard Worker
StringContainsStrongRTLChars(const std::u16string & text)413*6777b538SAndroid Build Coastguard Worker bool StringContainsStrongRTLChars(const std::u16string& text) {
414*6777b538SAndroid Build Coastguard Worker const char16_t* string = text.c_str();
415*6777b538SAndroid Build Coastguard Worker size_t length = text.length();
416*6777b538SAndroid Build Coastguard Worker size_t position = 0;
417*6777b538SAndroid Build Coastguard Worker while (position < length) {
418*6777b538SAndroid Build Coastguard Worker UChar32 character;
419*6777b538SAndroid Build Coastguard Worker size_t next_position = position;
420*6777b538SAndroid Build Coastguard Worker U16_NEXT(string, next_position, length, character);
421*6777b538SAndroid Build Coastguard Worker
422*6777b538SAndroid Build Coastguard Worker // Now that we have the character, we use ICU in order to query for the
423*6777b538SAndroid Build Coastguard Worker // appropriate Unicode BiDi character type.
424*6777b538SAndroid Build Coastguard Worker int32_t property = u_getIntPropertyValue(character, UCHAR_BIDI_CLASS);
425*6777b538SAndroid Build Coastguard Worker if ((property == U_RIGHT_TO_LEFT) || (property == U_RIGHT_TO_LEFT_ARABIC))
426*6777b538SAndroid Build Coastguard Worker return true;
427*6777b538SAndroid Build Coastguard Worker
428*6777b538SAndroid Build Coastguard Worker position = next_position;
429*6777b538SAndroid Build Coastguard Worker }
430*6777b538SAndroid Build Coastguard Worker
431*6777b538SAndroid Build Coastguard Worker return false;
432*6777b538SAndroid Build Coastguard Worker }
433*6777b538SAndroid Build Coastguard Worker
WrapStringWithLTRFormatting(std::u16string * text)434*6777b538SAndroid Build Coastguard Worker void WrapStringWithLTRFormatting(std::u16string* text) {
435*6777b538SAndroid Build Coastguard Worker if (text->empty())
436*6777b538SAndroid Build Coastguard Worker return;
437*6777b538SAndroid Build Coastguard Worker
438*6777b538SAndroid Build Coastguard Worker // Inserting an LRE (Left-To-Right Embedding) mark as the first character.
439*6777b538SAndroid Build Coastguard Worker text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
440*6777b538SAndroid Build Coastguard Worker kLeftToRightEmbeddingMark);
441*6777b538SAndroid Build Coastguard Worker
442*6777b538SAndroid Build Coastguard Worker // Inserting a PDF (Pop Directional Formatting) mark as the last character.
443*6777b538SAndroid Build Coastguard Worker text->push_back(kPopDirectionalFormatting);
444*6777b538SAndroid Build Coastguard Worker }
445*6777b538SAndroid Build Coastguard Worker
WrapStringWithRTLFormatting(std::u16string * text)446*6777b538SAndroid Build Coastguard Worker void WrapStringWithRTLFormatting(std::u16string* text) {
447*6777b538SAndroid Build Coastguard Worker if (text->empty())
448*6777b538SAndroid Build Coastguard Worker return;
449*6777b538SAndroid Build Coastguard Worker
450*6777b538SAndroid Build Coastguard Worker // Inserting an RLE (Right-To-Left Embedding) mark as the first character.
451*6777b538SAndroid Build Coastguard Worker text->insert(static_cast<size_t>(0), static_cast<size_t>(1),
452*6777b538SAndroid Build Coastguard Worker kRightToLeftEmbeddingMark);
453*6777b538SAndroid Build Coastguard Worker
454*6777b538SAndroid Build Coastguard Worker // Inserting a PDF (Pop Directional Formatting) mark as the last character.
455*6777b538SAndroid Build Coastguard Worker text->push_back(kPopDirectionalFormatting);
456*6777b538SAndroid Build Coastguard Worker }
457*6777b538SAndroid Build Coastguard Worker
WrapPathWithLTRFormatting(const FilePath & path,std::u16string * rtl_safe_path)458*6777b538SAndroid Build Coastguard Worker void WrapPathWithLTRFormatting(const FilePath& path,
459*6777b538SAndroid Build Coastguard Worker std::u16string* rtl_safe_path) {
460*6777b538SAndroid Build Coastguard Worker // Wrap the overall path with LRE-PDF pair which essentialy marks the
461*6777b538SAndroid Build Coastguard Worker // string as a Left-To-Right string.
462*6777b538SAndroid Build Coastguard Worker // Inserting an LRE (Left-To-Right Embedding) mark as the first character.
463*6777b538SAndroid Build Coastguard Worker rtl_safe_path->push_back(kLeftToRightEmbeddingMark);
464*6777b538SAndroid Build Coastguard Worker #if BUILDFLAG(IS_APPLE)
465*6777b538SAndroid Build Coastguard Worker rtl_safe_path->append(UTF8ToUTF16(path.value()));
466*6777b538SAndroid Build Coastguard Worker #elif BUILDFLAG(IS_WIN)
467*6777b538SAndroid Build Coastguard Worker rtl_safe_path->append(AsString16(path.value()));
468*6777b538SAndroid Build Coastguard Worker #else // BUILDFLAG(IS_POSIX) && !BUILDFLAG(IS_APPLE)
469*6777b538SAndroid Build Coastguard Worker std::wstring wide_path = base::SysNativeMBToWide(path.value());
470*6777b538SAndroid Build Coastguard Worker rtl_safe_path->append(WideToUTF16(wide_path));
471*6777b538SAndroid Build Coastguard Worker #endif
472*6777b538SAndroid Build Coastguard Worker // Inserting a PDF (Pop Directional Formatting) mark as the last character.
473*6777b538SAndroid Build Coastguard Worker rtl_safe_path->push_back(kPopDirectionalFormatting);
474*6777b538SAndroid Build Coastguard Worker }
475*6777b538SAndroid Build Coastguard Worker
GetDisplayStringInLTRDirectionality(const std::u16string & text)476*6777b538SAndroid Build Coastguard Worker std::u16string GetDisplayStringInLTRDirectionality(const std::u16string& text) {
477*6777b538SAndroid Build Coastguard Worker // Always wrap the string in RTL UI (it may be appended to RTL string).
478*6777b538SAndroid Build Coastguard Worker // Also wrap strings with an RTL first strong character direction in LTR UI.
479*6777b538SAndroid Build Coastguard Worker if (IsRTL() || GetFirstStrongCharacterDirection(text) == RIGHT_TO_LEFT) {
480*6777b538SAndroid Build Coastguard Worker std::u16string text_mutable(text);
481*6777b538SAndroid Build Coastguard Worker WrapStringWithLTRFormatting(&text_mutable);
482*6777b538SAndroid Build Coastguard Worker return text_mutable;
483*6777b538SAndroid Build Coastguard Worker }
484*6777b538SAndroid Build Coastguard Worker return text;
485*6777b538SAndroid Build Coastguard Worker }
486*6777b538SAndroid Build Coastguard Worker
StripWrappingBidiControlCharacters(const std::u16string & text)487*6777b538SAndroid Build Coastguard Worker std::u16string StripWrappingBidiControlCharacters(const std::u16string& text) {
488*6777b538SAndroid Build Coastguard Worker if (text.empty())
489*6777b538SAndroid Build Coastguard Worker return text;
490*6777b538SAndroid Build Coastguard Worker size_t begin_index = 0;
491*6777b538SAndroid Build Coastguard Worker char16_t begin = text[begin_index];
492*6777b538SAndroid Build Coastguard Worker if (begin == kLeftToRightEmbeddingMark ||
493*6777b538SAndroid Build Coastguard Worker begin == kRightToLeftEmbeddingMark ||
494*6777b538SAndroid Build Coastguard Worker begin == kLeftToRightOverride ||
495*6777b538SAndroid Build Coastguard Worker begin == kRightToLeftOverride)
496*6777b538SAndroid Build Coastguard Worker ++begin_index;
497*6777b538SAndroid Build Coastguard Worker size_t end_index = text.length() - 1;
498*6777b538SAndroid Build Coastguard Worker if (text[end_index] == kPopDirectionalFormatting)
499*6777b538SAndroid Build Coastguard Worker --end_index;
500*6777b538SAndroid Build Coastguard Worker return text.substr(begin_index, end_index - begin_index + 1);
501*6777b538SAndroid Build Coastguard Worker }
502*6777b538SAndroid Build Coastguard Worker
503*6777b538SAndroid Build Coastguard Worker } // namespace i18n
504*6777b538SAndroid Build Coastguard Worker } // namespace base
505