1*6777b538SAndroid Build Coastguard Worker // Copyright 2011 The Chromium Authors 2*6777b538SAndroid Build Coastguard Worker // Use of this source code is governed by a BSD-style license that can be 3*6777b538SAndroid Build Coastguard Worker // found in the LICENSE file. 4*6777b538SAndroid Build Coastguard Worker 5*6777b538SAndroid Build Coastguard Worker #ifndef BASE_I18N_CASE_CONVERSION_H_ 6*6777b538SAndroid Build Coastguard Worker #define BASE_I18N_CASE_CONVERSION_H_ 7*6777b538SAndroid Build Coastguard Worker 8*6777b538SAndroid Build Coastguard Worker #include <string> 9*6777b538SAndroid Build Coastguard Worker #include <string_view> 10*6777b538SAndroid Build Coastguard Worker 11*6777b538SAndroid Build Coastguard Worker #include "base/i18n/base_i18n_export.h" 12*6777b538SAndroid Build Coastguard Worker 13*6777b538SAndroid Build Coastguard Worker namespace base { 14*6777b538SAndroid Build Coastguard Worker namespace i18n { 15*6777b538SAndroid Build Coastguard Worker 16*6777b538SAndroid Build Coastguard Worker // UNICODE CASE-HANDLING ADVICE 17*6777b538SAndroid Build Coastguard Worker // 18*6777b538SAndroid Build Coastguard Worker // In English it's always safe to convert to upper-case or lower-case text 19*6777b538SAndroid Build Coastguard Worker // and get a good answer. But some languages have rules specific to those 20*6777b538SAndroid Build Coastguard Worker // locales. One example is the Turkish I: 21*6777b538SAndroid Build Coastguard Worker // http://www.i18nguy.com/unicode/turkish-i18n.html 22*6777b538SAndroid Build Coastguard Worker // 23*6777b538SAndroid Build Coastguard Worker // ToLower/ToUpper use the current ICU locale which will take into account 24*6777b538SAndroid Build Coastguard Worker // the user language preference. Use this when dealing with user typing. 25*6777b538SAndroid Build Coastguard Worker // 26*6777b538SAndroid Build Coastguard Worker // FoldCase canonicalizes to a standardized form independent of the current 27*6777b538SAndroid Build Coastguard Worker // locale. Use this when comparing general Unicode strings that don't 28*6777b538SAndroid Build Coastguard Worker // necessarily belong in the user's current locale (like commands, protocol 29*6777b538SAndroid Build Coastguard Worker // names, other strings from the web) for case-insensitive equality. 30*6777b538SAndroid Build Coastguard Worker // 31*6777b538SAndroid Build Coastguard Worker // Note that case conversions will change the length of the string in some 32*6777b538SAndroid Build Coastguard Worker // not-uncommon cases. Never assume that the output is the same length as 33*6777b538SAndroid Build Coastguard Worker // the input. 34*6777b538SAndroid Build Coastguard Worker 35*6777b538SAndroid Build Coastguard Worker // Returns the lower case equivalent of string. Uses ICU's current locale. 36*6777b538SAndroid Build Coastguard Worker BASE_I18N_EXPORT std::u16string ToLower(std::u16string_view string); 37*6777b538SAndroid Build Coastguard Worker 38*6777b538SAndroid Build Coastguard Worker // Returns the upper case equivalent of string. Uses ICU's current locale. 39*6777b538SAndroid Build Coastguard Worker BASE_I18N_EXPORT std::u16string ToUpper(std::u16string_view string); 40*6777b538SAndroid Build Coastguard Worker 41*6777b538SAndroid Build Coastguard Worker // Convert the given string to a canonical case, independent of the current 42*6777b538SAndroid Build Coastguard Worker // locale. For ASCII the canonical form is lower case. 43*6777b538SAndroid Build Coastguard Worker // See http://unicode.org/faq/casemap_charprop.html#2 44*6777b538SAndroid Build Coastguard Worker BASE_I18N_EXPORT std::u16string FoldCase(std::u16string_view string); 45*6777b538SAndroid Build Coastguard Worker 46*6777b538SAndroid Build Coastguard Worker } // namespace i18n 47*6777b538SAndroid Build Coastguard Worker } // namespace base 48*6777b538SAndroid Build Coastguard Worker 49*6777b538SAndroid Build Coastguard Worker #endif // BASE_I18N_CASE_CONVERSION_H_ 50