xref: /aosp_15_r20/external/abseil-cpp/absl/strings/internal/utf8.h (revision 9356374a3709195abf420251b3e825997ff56c0f)
1*9356374aSAndroid Build Coastguard Worker // Copyright 2017 The Abseil Authors.
2*9356374aSAndroid Build Coastguard Worker //
3*9356374aSAndroid Build Coastguard Worker // Licensed under the Apache License, Version 2.0 (the "License");
4*9356374aSAndroid Build Coastguard Worker // you may not use this file except in compliance with the License.
5*9356374aSAndroid Build Coastguard Worker // You may obtain a copy of the License at
6*9356374aSAndroid Build Coastguard Worker //
7*9356374aSAndroid Build Coastguard Worker //      https://www.apache.org/licenses/LICENSE-2.0
8*9356374aSAndroid Build Coastguard Worker //
9*9356374aSAndroid Build Coastguard Worker // Unless required by applicable law or agreed to in writing, software
10*9356374aSAndroid Build Coastguard Worker // distributed under the License is distributed on an "AS IS" BASIS,
11*9356374aSAndroid Build Coastguard Worker // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12*9356374aSAndroid Build Coastguard Worker // See the License for the specific language governing permissions and
13*9356374aSAndroid Build Coastguard Worker // limitations under the License.
14*9356374aSAndroid Build Coastguard Worker //
15*9356374aSAndroid Build Coastguard Worker // UTF8 utilities, implemented to reduce dependencies.
16*9356374aSAndroid Build Coastguard Worker 
17*9356374aSAndroid Build Coastguard Worker #ifndef ABSL_STRINGS_INTERNAL_UTF8_H_
18*9356374aSAndroid Build Coastguard Worker #define ABSL_STRINGS_INTERNAL_UTF8_H_
19*9356374aSAndroid Build Coastguard Worker 
20*9356374aSAndroid Build Coastguard Worker #include <cstddef>
21*9356374aSAndroid Build Coastguard Worker #include <cstdint>
22*9356374aSAndroid Build Coastguard Worker 
23*9356374aSAndroid Build Coastguard Worker #include "absl/base/config.h"
24*9356374aSAndroid Build Coastguard Worker 
25*9356374aSAndroid Build Coastguard Worker namespace absl {
26*9356374aSAndroid Build Coastguard Worker ABSL_NAMESPACE_BEGIN
27*9356374aSAndroid Build Coastguard Worker namespace strings_internal {
28*9356374aSAndroid Build Coastguard Worker 
29*9356374aSAndroid Build Coastguard Worker // For Unicode code points 0 through 0x10FFFF, EncodeUTF8Char writes
30*9356374aSAndroid Build Coastguard Worker // out the UTF-8 encoding into buffer, and returns the number of chars
31*9356374aSAndroid Build Coastguard Worker // it wrote.
32*9356374aSAndroid Build Coastguard Worker //
33*9356374aSAndroid Build Coastguard Worker // As described in https://tools.ietf.org/html/rfc3629#section-3 , the encodings
34*9356374aSAndroid Build Coastguard Worker // are:
35*9356374aSAndroid Build Coastguard Worker //    00 -     7F : 0xxxxxxx
36*9356374aSAndroid Build Coastguard Worker //    80 -    7FF : 110xxxxx 10xxxxxx
37*9356374aSAndroid Build Coastguard Worker //   800 -   FFFF : 1110xxxx 10xxxxxx 10xxxxxx
38*9356374aSAndroid Build Coastguard Worker // 10000 - 10FFFF : 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
39*9356374aSAndroid Build Coastguard Worker //
40*9356374aSAndroid Build Coastguard Worker // Values greater than 0x10FFFF are not supported: for such input the function
41*9356374aSAndroid Build Coastguard Worker // may or may not write characters into buffer, but it never writes more than
42*9356374aSAndroid Build Coastguard Worker // kMaxEncodedUTF8Size bytes, regardless of the value of utf8_char.
// Upper bound, in bytes, on what EncodeUTF8Char writes for a single code point;
// it matches the longest (four-byte) encoding in the table above.
43*9356374aSAndroid Build Coastguard Worker enum { kMaxEncodedUTF8Size = 4 };
// Encodes utf8_char as UTF-8 into buffer and returns the number of chars
// written. Only declared here; the definition is not part of this header.
// NOTE(review): buffer presumably must have room for kMaxEncodedUTF8Size
// chars -- confirm against the implementation.
44*9356374aSAndroid Build Coastguard Worker size_t EncodeUTF8Char(char *buffer, char32_t utf8_char);
45*9356374aSAndroid Build Coastguard Worker 
46*9356374aSAndroid Build Coastguard Worker }  // namespace strings_internal
47*9356374aSAndroid Build Coastguard Worker ABSL_NAMESPACE_END
48*9356374aSAndroid Build Coastguard Worker }  // namespace absl
49*9356374aSAndroid Build Coastguard Worker 
50*9356374aSAndroid Build Coastguard Worker #endif  // ABSL_STRINGS_INTERNAL_UTF8_H_
51