xref: /aosp_15_r20/art/runtime/native/java_lang_StringFactory.cc (revision 795d594fd825385562da6b089ea9b2033f3abf5a)
1*795d594fSAndroid Build Coastguard Worker /*
2*795d594fSAndroid Build Coastguard Worker  * Copyright (C) 2008 The Android Open Source Project
3*795d594fSAndroid Build Coastguard Worker  *
4*795d594fSAndroid Build Coastguard Worker  * Licensed under the Apache License, Version 2.0 (the "License");
5*795d594fSAndroid Build Coastguard Worker  * you may not use this file except in compliance with the License.
6*795d594fSAndroid Build Coastguard Worker  * You may obtain a copy of the License at
7*795d594fSAndroid Build Coastguard Worker  *
8*795d594fSAndroid Build Coastguard Worker  *      http://www.apache.org/licenses/LICENSE-2.0
9*795d594fSAndroid Build Coastguard Worker  *
10*795d594fSAndroid Build Coastguard Worker  * Unless required by applicable law or agreed to in writing, software
11*795d594fSAndroid Build Coastguard Worker  * distributed under the License is distributed on an "AS IS" BASIS,
12*795d594fSAndroid Build Coastguard Worker  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*795d594fSAndroid Build Coastguard Worker  * See the License for the specific language governing permissions and
14*795d594fSAndroid Build Coastguard Worker  * limitations under the License.
15*795d594fSAndroid Build Coastguard Worker  */
16*795d594fSAndroid Build Coastguard Worker 
17*795d594fSAndroid Build Coastguard Worker #include "java_lang_StringFactory.h"
18*795d594fSAndroid Build Coastguard Worker 
19*795d594fSAndroid Build Coastguard Worker #include "common_throws.h"
20*795d594fSAndroid Build Coastguard Worker #include "handle_scope-inl.h"
21*795d594fSAndroid Build Coastguard Worker #include "jni/jni_internal.h"
22*795d594fSAndroid Build Coastguard Worker #include "mirror/object-inl.h"
23*795d594fSAndroid Build Coastguard Worker #include "mirror/string-alloc-inl.h"
24*795d594fSAndroid Build Coastguard Worker #include "native_util.h"
25*795d594fSAndroid Build Coastguard Worker #include "nativehelper/jni_macros.h"
26*795d594fSAndroid Build Coastguard Worker #include "nativehelper/scoped_local_ref.h"
27*795d594fSAndroid Build Coastguard Worker #include "nativehelper/scoped_primitive_array.h"
28*795d594fSAndroid Build Coastguard Worker #include "scoped_fast_native_object_access-inl.h"
29*795d594fSAndroid Build Coastguard Worker #include "scoped_thread_state_change-inl.h"
30*795d594fSAndroid Build Coastguard Worker 
31*795d594fSAndroid Build Coastguard Worker namespace art HIDDEN {
32*795d594fSAndroid Build Coastguard Worker 
StringFactory_newStringFromBytes(JNIEnv * env,jclass,jbyteArray java_data,jint high,jint offset,jint byte_count)33*795d594fSAndroid Build Coastguard Worker static jstring StringFactory_newStringFromBytes(JNIEnv* env, jclass, jbyteArray java_data,
34*795d594fSAndroid Build Coastguard Worker                                                 jint high, jint offset, jint byte_count) {
35*795d594fSAndroid Build Coastguard Worker   ScopedFastNativeObjectAccess soa(env);
36*795d594fSAndroid Build Coastguard Worker   if (UNLIKELY(java_data == nullptr)) {
37*795d594fSAndroid Build Coastguard Worker     ThrowNullPointerException("data == null");
38*795d594fSAndroid Build Coastguard Worker     return nullptr;
39*795d594fSAndroid Build Coastguard Worker   }
40*795d594fSAndroid Build Coastguard Worker   StackHandleScope<1> hs(soa.Self());
41*795d594fSAndroid Build Coastguard Worker   Handle<mirror::ByteArray> byte_array(hs.NewHandle(soa.Decode<mirror::ByteArray>(java_data)));
42*795d594fSAndroid Build Coastguard Worker   int32_t data_size = byte_array->GetLength();
43*795d594fSAndroid Build Coastguard Worker   if ((offset | byte_count) < 0 || byte_count > data_size - offset) {
44*795d594fSAndroid Build Coastguard Worker     soa.Self()->ThrowNewExceptionF("Ljava/lang/StringIndexOutOfBoundsException;",
45*795d594fSAndroid Build Coastguard Worker                                    "length=%d; regionStart=%d; regionLength=%d", data_size,
46*795d594fSAndroid Build Coastguard Worker                                    offset, byte_count);
47*795d594fSAndroid Build Coastguard Worker     return nullptr;
48*795d594fSAndroid Build Coastguard Worker   }
49*795d594fSAndroid Build Coastguard Worker   gc::AllocatorType allocator_type = Runtime::Current()->GetHeap()->GetCurrentAllocator();
50*795d594fSAndroid Build Coastguard Worker   ObjPtr<mirror::String> result = mirror::String::AllocFromByteArray(soa.Self(),
51*795d594fSAndroid Build Coastguard Worker                                                                      byte_count,
52*795d594fSAndroid Build Coastguard Worker                                                                      byte_array,
53*795d594fSAndroid Build Coastguard Worker                                                                      offset,
54*795d594fSAndroid Build Coastguard Worker                                                                      high,
55*795d594fSAndroid Build Coastguard Worker                                                                      allocator_type);
56*795d594fSAndroid Build Coastguard Worker   return soa.AddLocalReference<jstring>(result);
57*795d594fSAndroid Build Coastguard Worker }
58*795d594fSAndroid Build Coastguard Worker 
StringFactory_newStringFromUtf16Bytes(JNIEnv * env,jclass,jbyteArray java_data,jint offset,jint char_count)59*795d594fSAndroid Build Coastguard Worker static jstring StringFactory_newStringFromUtf16Bytes(
60*795d594fSAndroid Build Coastguard Worker     JNIEnv* env, jclass, jbyteArray java_data, jint offset, jint char_count) {
61*795d594fSAndroid Build Coastguard Worker   ScopedFastNativeObjectAccess soa(env);
62*795d594fSAndroid Build Coastguard Worker   if (UNLIKELY(java_data == nullptr)) {
63*795d594fSAndroid Build Coastguard Worker     ThrowNullPointerException("data == null");
64*795d594fSAndroid Build Coastguard Worker     return nullptr;
65*795d594fSAndroid Build Coastguard Worker   }
66*795d594fSAndroid Build Coastguard Worker   StackHandleScope<1> hs(soa.Self());
67*795d594fSAndroid Build Coastguard Worker   Handle<mirror::ByteArray> byte_array(hs.NewHandle(soa.Decode<mirror::ByteArray>(java_data)));
68*795d594fSAndroid Build Coastguard Worker   int32_t data_size = byte_array->GetLength();
69*795d594fSAndroid Build Coastguard Worker   DCHECK_GE(data_size, 0);
70*795d594fSAndroid Build Coastguard Worker   if (offset < 0 ||
71*795d594fSAndroid Build Coastguard Worker       offset > data_size ||
72*795d594fSAndroid Build Coastguard Worker       static_cast<uint32_t>(char_count) > (static_cast<uint32_t>(data_size - offset) >> 1)) {
73*795d594fSAndroid Build Coastguard Worker     soa.Self()->ThrowNewExceptionF("Ljava/lang/StringIndexOutOfBoundsException;",
74*795d594fSAndroid Build Coastguard Worker                                    "length=%d; regionStart=%d; bytePairLength=%d",
75*795d594fSAndroid Build Coastguard Worker                                    data_size,
76*795d594fSAndroid Build Coastguard Worker                                    offset,
77*795d594fSAndroid Build Coastguard Worker                                    char_count);
78*795d594fSAndroid Build Coastguard Worker     return nullptr;
79*795d594fSAndroid Build Coastguard Worker   }
80*795d594fSAndroid Build Coastguard Worker   gc::AllocatorType allocator_type = Runtime::Current()->GetHeap()->GetCurrentAllocator();
81*795d594fSAndroid Build Coastguard Worker   ObjPtr<mirror::String> result = mirror::String::AllocFromUtf16ByteArray(soa.Self(),
82*795d594fSAndroid Build Coastguard Worker                                                                           char_count,
83*795d594fSAndroid Build Coastguard Worker                                                                           byte_array,
84*795d594fSAndroid Build Coastguard Worker                                                                           offset,
85*795d594fSAndroid Build Coastguard Worker                                                                           allocator_type);
86*795d594fSAndroid Build Coastguard Worker   return soa.AddLocalReference<jstring>(result);
87*795d594fSAndroid Build Coastguard Worker }
88*795d594fSAndroid Build Coastguard Worker 
89*795d594fSAndroid Build Coastguard Worker // The char array passed as `java_data` must not be a null reference.
StringFactory_newStringFromChars(JNIEnv * env,jclass,jint offset,jint char_count,jcharArray java_data)90*795d594fSAndroid Build Coastguard Worker static jstring StringFactory_newStringFromChars(JNIEnv* env, jclass, jint offset,
91*795d594fSAndroid Build Coastguard Worker                                                 jint char_count, jcharArray java_data) {
92*795d594fSAndroid Build Coastguard Worker   DCHECK(java_data != nullptr);
93*795d594fSAndroid Build Coastguard Worker   ScopedFastNativeObjectAccess soa(env);
94*795d594fSAndroid Build Coastguard Worker   StackHandleScope<1> hs(soa.Self());
95*795d594fSAndroid Build Coastguard Worker   Handle<mirror::CharArray> char_array(hs.NewHandle(soa.Decode<mirror::CharArray>(java_data)));
96*795d594fSAndroid Build Coastguard Worker   gc::AllocatorType allocator_type = Runtime::Current()->GetHeap()->GetCurrentAllocator();
97*795d594fSAndroid Build Coastguard Worker   ObjPtr<mirror::String> result = mirror::String::AllocFromCharArray(soa.Self(),
98*795d594fSAndroid Build Coastguard Worker                                                                      char_count,
99*795d594fSAndroid Build Coastguard Worker                                                                      char_array,
100*795d594fSAndroid Build Coastguard Worker                                                                      offset,
101*795d594fSAndroid Build Coastguard Worker                                                                      allocator_type);
102*795d594fSAndroid Build Coastguard Worker   return soa.AddLocalReference<jstring>(result);
103*795d594fSAndroid Build Coastguard Worker }
104*795d594fSAndroid Build Coastguard Worker 
StringFactory_newStringFromString(JNIEnv * env,jclass,jstring to_copy)105*795d594fSAndroid Build Coastguard Worker static jstring StringFactory_newStringFromString(JNIEnv* env, jclass, jstring to_copy) {
106*795d594fSAndroid Build Coastguard Worker   ScopedFastNativeObjectAccess soa(env);
107*795d594fSAndroid Build Coastguard Worker   if (UNLIKELY(to_copy == nullptr)) {
108*795d594fSAndroid Build Coastguard Worker     ThrowNullPointerException("toCopy == null");
109*795d594fSAndroid Build Coastguard Worker     return nullptr;
110*795d594fSAndroid Build Coastguard Worker   }
111*795d594fSAndroid Build Coastguard Worker   StackHandleScope<1> hs(soa.Self());
112*795d594fSAndroid Build Coastguard Worker   Handle<mirror::String> string(hs.NewHandle(soa.Decode<mirror::String>(to_copy)));
113*795d594fSAndroid Build Coastguard Worker   gc::AllocatorType allocator_type = Runtime::Current()->GetHeap()->GetCurrentAllocator();
114*795d594fSAndroid Build Coastguard Worker   ObjPtr<mirror::String> result = mirror::String::AllocFromString(soa.Self(),
115*795d594fSAndroid Build Coastguard Worker                                                                   string->GetLength(),
116*795d594fSAndroid Build Coastguard Worker                                                                   string,
117*795d594fSAndroid Build Coastguard Worker                                                                   /*offset=*/ 0,
118*795d594fSAndroid Build Coastguard Worker                                                                   allocator_type);
119*795d594fSAndroid Build Coastguard Worker   return soa.AddLocalReference<jstring>(result);
120*795d594fSAndroid Build Coastguard Worker }
121*795d594fSAndroid Build Coastguard Worker 
StringFactory_newStringFromUtf8Bytes(JNIEnv * env,jclass,jbyteArray java_data,jint offset,jint byte_count)122*795d594fSAndroid Build Coastguard Worker static jstring StringFactory_newStringFromUtf8Bytes(JNIEnv* env, jclass, jbyteArray java_data,
123*795d594fSAndroid Build Coastguard Worker                                                     jint offset, jint byte_count) {
124*795d594fSAndroid Build Coastguard Worker   // Local Define in here
125*795d594fSAndroid Build Coastguard Worker   static const jchar kReplacementChar = 0xfffd;
126*795d594fSAndroid Build Coastguard Worker   static const int kDefaultBufferSize = 256;
127*795d594fSAndroid Build Coastguard Worker   static const int kTableUtf8Needed[] = {
128*795d594fSAndroid Build Coastguard Worker     //      0  1  2  3  4  5  6  7  8  9  a  b  c  d  e  f
129*795d594fSAndroid Build Coastguard Worker     0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,  // 0xc0 - 0xcf
130*795d594fSAndroid Build Coastguard Worker     1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,  // 0xd0 - 0xdf
131*795d594fSAndroid Build Coastguard Worker     2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,  // 0xe0 - 0xef
132*795d594fSAndroid Build Coastguard Worker     3, 3, 3, 3, 3, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,  // 0xf0 - 0xff
133*795d594fSAndroid Build Coastguard Worker   };
134*795d594fSAndroid Build Coastguard Worker 
135*795d594fSAndroid Build Coastguard Worker   ScopedFastNativeObjectAccess soa(env);
136*795d594fSAndroid Build Coastguard Worker   if (UNLIKELY(java_data == nullptr)) {
137*795d594fSAndroid Build Coastguard Worker     ThrowNullPointerException("data == null");
138*795d594fSAndroid Build Coastguard Worker     return nullptr;
139*795d594fSAndroid Build Coastguard Worker   }
140*795d594fSAndroid Build Coastguard Worker 
141*795d594fSAndroid Build Coastguard Worker   StackHandleScope<1> hs(soa.Self());
142*795d594fSAndroid Build Coastguard Worker   Handle<mirror::ByteArray> byte_array(hs.NewHandle(soa.Decode<mirror::ByteArray>(java_data)));
143*795d594fSAndroid Build Coastguard Worker   int32_t data_size = byte_array->GetLength();
144*795d594fSAndroid Build Coastguard Worker   if ((offset | byte_count) < 0 || byte_count > data_size - offset) {
145*795d594fSAndroid Build Coastguard Worker     soa.Self()->ThrowNewExceptionF("Ljava/lang/StringIndexOutOfBoundsException;",
146*795d594fSAndroid Build Coastguard Worker         "length=%d; regionStart=%d; regionLength=%d", data_size,
147*795d594fSAndroid Build Coastguard Worker         offset, byte_count);
148*795d594fSAndroid Build Coastguard Worker     return nullptr;
149*795d594fSAndroid Build Coastguard Worker   }
150*795d594fSAndroid Build Coastguard Worker 
151*795d594fSAndroid Build Coastguard Worker   /*
152*795d594fSAndroid Build Coastguard Worker    * This code converts a UTF-8 byte sequence to a Java String (UTF-16).
153*795d594fSAndroid Build Coastguard Worker    * It implements the W3C recommended UTF-8 decoder.
154*795d594fSAndroid Build Coastguard Worker    * https://www.w3.org/TR/encoding/#utf-8-decoder
155*795d594fSAndroid Build Coastguard Worker    *
156*795d594fSAndroid Build Coastguard Worker    * Unicode 3.2 Well-Formed UTF-8 Byte Sequences
157*795d594fSAndroid Build Coastguard Worker    * Code Points        First  Second Third Fourth
158*795d594fSAndroid Build Coastguard Worker    * U+0000..U+007F     00..7F
159*795d594fSAndroid Build Coastguard Worker    * U+0080..U+07FF     C2..DF 80..BF
160*795d594fSAndroid Build Coastguard Worker    * U+0800..U+0FFF     E0     A0..BF 80..BF
161*795d594fSAndroid Build Coastguard Worker    * U+1000..U+CFFF     E1..EC 80..BF 80..BF
162*795d594fSAndroid Build Coastguard Worker    * U+D000..U+D7FF     ED     80..9F 80..BF
163*795d594fSAndroid Build Coastguard Worker    * U+E000..U+FFFF     EE..EF 80..BF 80..BF
164*795d594fSAndroid Build Coastguard Worker    * U+10000..U+3FFFF   F0     90..BF 80..BF 80..BF
165*795d594fSAndroid Build Coastguard Worker    * U+40000..U+FFFFF   F1..F3 80..BF 80..BF 80..BF
166*795d594fSAndroid Build Coastguard Worker    * U+100000..U+10FFFF F4     80..8F 80..BF 80..BF
167*795d594fSAndroid Build Coastguard Worker    *
168*795d594fSAndroid Build Coastguard Worker    * Please refer to Unicode as the authority.
169*795d594fSAndroid Build Coastguard Worker    * p.126 Table 3-7 in http://www.unicode.org/versions/Unicode10.0.0/ch03.pdf
170*795d594fSAndroid Build Coastguard Worker    *
171*795d594fSAndroid Build Coastguard Worker    * Handling Malformed Input
172*795d594fSAndroid Build Coastguard Worker    * The maximal subpart should be replaced by a single U+FFFD. Maximal subpart is
173*795d594fSAndroid Build Coastguard Worker    * the longest code unit subsequence starting at an unconvertible offset that is either
174*795d594fSAndroid Build Coastguard Worker    * 1) the initial subsequence of a well-formed code unit sequence, or
175*795d594fSAndroid Build Coastguard Worker    * 2) a subsequence of length one:
176*795d594fSAndroid Build Coastguard Worker    * One U+FFFD should be emitted for every sequence of bytes that is an incomplete prefix
177*795d594fSAndroid Build Coastguard Worker    * of a valid sequence, and with the conversion to restart after the incomplete sequence.
178*795d594fSAndroid Build Coastguard Worker    *
179*795d594fSAndroid Build Coastguard Worker    * For example, in byte sequence "41 C0 AF 41 F4 80 80 41", the maximal subparts are
180*795d594fSAndroid Build Coastguard Worker    * "C0", "AF", and "F4 80 80". "F4 80 80" can be the initial subsequence of "F4 80 80 80",
181*795d594fSAndroid Build Coastguard Worker    * but "C0" can't be the initial subsequence of any well-formed code unit sequence.
182*795d594fSAndroid Build Coastguard Worker    * Thus, the output should be "A\ufffd\ufffdA\ufffdA".
183*795d594fSAndroid Build Coastguard Worker    *
184*795d594fSAndroid Build Coastguard Worker    * Please refer to section "Best Practices for Using U+FFFD." in
185*795d594fSAndroid Build Coastguard Worker    * http://www.unicode.org/versions/Unicode10.0.0/ch03.pdf
186*795d594fSAndroid Build Coastguard Worker    */
187*795d594fSAndroid Build Coastguard Worker 
188*795d594fSAndroid Build Coastguard Worker   // Initial value
189*795d594fSAndroid Build Coastguard Worker   jchar stack_buffer[kDefaultBufferSize];
190*795d594fSAndroid Build Coastguard Worker   std::unique_ptr<jchar[]> allocated_buffer;
191*795d594fSAndroid Build Coastguard Worker   jchar* v;
192*795d594fSAndroid Build Coastguard Worker   if (byte_count <= kDefaultBufferSize) {
193*795d594fSAndroid Build Coastguard Worker     v = stack_buffer;
194*795d594fSAndroid Build Coastguard Worker   } else {
195*795d594fSAndroid Build Coastguard Worker     allocated_buffer.reset(new jchar[byte_count]);
196*795d594fSAndroid Build Coastguard Worker     v = allocated_buffer.get();
197*795d594fSAndroid Build Coastguard Worker   }
198*795d594fSAndroid Build Coastguard Worker 
199*795d594fSAndroid Build Coastguard Worker   jbyte* d = byte_array->GetData();
200*795d594fSAndroid Build Coastguard Worker   DCHECK(d != nullptr);
201*795d594fSAndroid Build Coastguard Worker 
202*795d594fSAndroid Build Coastguard Worker   int idx = offset;
203*795d594fSAndroid Build Coastguard Worker   int last = offset + byte_count;
204*795d594fSAndroid Build Coastguard Worker   int s = 0;
205*795d594fSAndroid Build Coastguard Worker 
206*795d594fSAndroid Build Coastguard Worker   int code_point = 0;
207*795d594fSAndroid Build Coastguard Worker   int utf8_bytes_seen = 0;
208*795d594fSAndroid Build Coastguard Worker   int utf8_bytes_needed = 0;
209*795d594fSAndroid Build Coastguard Worker   int lower_bound = 0x80;
210*795d594fSAndroid Build Coastguard Worker   int upper_bound = 0xbf;
211*795d594fSAndroid Build Coastguard Worker   while (idx < last) {
212*795d594fSAndroid Build Coastguard Worker     int b = d[idx++] & 0xff;
213*795d594fSAndroid Build Coastguard Worker     if (utf8_bytes_needed == 0) {
214*795d594fSAndroid Build Coastguard Worker       if ((b & 0x80) == 0) {  // ASCII char. 0xxxxxxx
215*795d594fSAndroid Build Coastguard Worker         v[s++] = (jchar) b;
216*795d594fSAndroid Build Coastguard Worker         continue;
217*795d594fSAndroid Build Coastguard Worker       }
218*795d594fSAndroid Build Coastguard Worker 
219*795d594fSAndroid Build Coastguard Worker       if ((b & 0x40) == 0) {  // 10xxxxxx is illegal as first byte
220*795d594fSAndroid Build Coastguard Worker         v[s++] = kReplacementChar;
221*795d594fSAndroid Build Coastguard Worker         continue;
222*795d594fSAndroid Build Coastguard Worker       }
223*795d594fSAndroid Build Coastguard Worker 
224*795d594fSAndroid Build Coastguard Worker       // 11xxxxxx
225*795d594fSAndroid Build Coastguard Worker       int tableLookupIndex = b & 0x3f;
226*795d594fSAndroid Build Coastguard Worker       utf8_bytes_needed = kTableUtf8Needed[tableLookupIndex];
227*795d594fSAndroid Build Coastguard Worker       if (utf8_bytes_needed == 0) {
228*795d594fSAndroid Build Coastguard Worker         v[s++] = kReplacementChar;
229*795d594fSAndroid Build Coastguard Worker         continue;
230*795d594fSAndroid Build Coastguard Worker       }
231*795d594fSAndroid Build Coastguard Worker 
232*795d594fSAndroid Build Coastguard Worker       // utf8_bytes_needed
233*795d594fSAndroid Build Coastguard Worker       // 1: b & 0x1f
234*795d594fSAndroid Build Coastguard Worker       // 2: b & 0x0f
235*795d594fSAndroid Build Coastguard Worker       // 3: b & 0x07
236*795d594fSAndroid Build Coastguard Worker       code_point = b & (0x3f >> utf8_bytes_needed);
237*795d594fSAndroid Build Coastguard Worker       if (b == 0xe0) {
238*795d594fSAndroid Build Coastguard Worker         lower_bound = 0xa0;
239*795d594fSAndroid Build Coastguard Worker       } else if (b == 0xed) {
240*795d594fSAndroid Build Coastguard Worker         upper_bound = 0x9f;
241*795d594fSAndroid Build Coastguard Worker       } else if (b == 0xf0) {
242*795d594fSAndroid Build Coastguard Worker         lower_bound = 0x90;
243*795d594fSAndroid Build Coastguard Worker       } else if (b == 0xf4) {
244*795d594fSAndroid Build Coastguard Worker         upper_bound = 0x8f;
245*795d594fSAndroid Build Coastguard Worker       }
246*795d594fSAndroid Build Coastguard Worker     } else {
247*795d594fSAndroid Build Coastguard Worker       if (b < lower_bound || b > upper_bound) {
248*795d594fSAndroid Build Coastguard Worker         // The bytes seen are ill-formed. Substitute them with U+FFFD
249*795d594fSAndroid Build Coastguard Worker         v[s++] = kReplacementChar;
250*795d594fSAndroid Build Coastguard Worker         code_point = 0;
251*795d594fSAndroid Build Coastguard Worker         utf8_bytes_needed = 0;
252*795d594fSAndroid Build Coastguard Worker         utf8_bytes_seen = 0;
253*795d594fSAndroid Build Coastguard Worker         lower_bound = 0x80;
254*795d594fSAndroid Build Coastguard Worker         upper_bound = 0xbf;
255*795d594fSAndroid Build Coastguard Worker         /*
256*795d594fSAndroid Build Coastguard Worker          * According to the Unicode Standard,
257*795d594fSAndroid Build Coastguard Worker          * "a UTF-8 conversion process is required to never consume well-formed
258*795d594fSAndroid Build Coastguard Worker          * subsequences as part of its error handling for ill-formed subsequences"
259*795d594fSAndroid Build Coastguard Worker          * The current byte could be part of well-formed subsequences. Reduce the
260*795d594fSAndroid Build Coastguard Worker          * index by 1 to parse it in next loop.
261*795d594fSAndroid Build Coastguard Worker          */
262*795d594fSAndroid Build Coastguard Worker         idx--;
263*795d594fSAndroid Build Coastguard Worker         continue;
264*795d594fSAndroid Build Coastguard Worker       }
265*795d594fSAndroid Build Coastguard Worker 
266*795d594fSAndroid Build Coastguard Worker       lower_bound = 0x80;
267*795d594fSAndroid Build Coastguard Worker       upper_bound = 0xbf;
268*795d594fSAndroid Build Coastguard Worker       code_point = (code_point << 6) | (b & 0x3f);
269*795d594fSAndroid Build Coastguard Worker       utf8_bytes_seen++;
270*795d594fSAndroid Build Coastguard Worker       if (utf8_bytes_needed != utf8_bytes_seen) {
271*795d594fSAndroid Build Coastguard Worker         continue;
272*795d594fSAndroid Build Coastguard Worker       }
273*795d594fSAndroid Build Coastguard Worker 
274*795d594fSAndroid Build Coastguard Worker       // Encode chars from U+10000 up as surrogate pairs
275*795d594fSAndroid Build Coastguard Worker       if (code_point < 0x10000) {
276*795d594fSAndroid Build Coastguard Worker         v[s++] = (jchar) code_point;
277*795d594fSAndroid Build Coastguard Worker       } else {
278*795d594fSAndroid Build Coastguard Worker         v[s++] = (jchar) ((code_point >> 10) + 0xd7c0);
279*795d594fSAndroid Build Coastguard Worker         v[s++] = (jchar) ((code_point & 0x3ff) + 0xdc00);
280*795d594fSAndroid Build Coastguard Worker       }
281*795d594fSAndroid Build Coastguard Worker 
282*795d594fSAndroid Build Coastguard Worker       utf8_bytes_seen = 0;
283*795d594fSAndroid Build Coastguard Worker       utf8_bytes_needed = 0;
284*795d594fSAndroid Build Coastguard Worker       code_point = 0;
285*795d594fSAndroid Build Coastguard Worker     }
286*795d594fSAndroid Build Coastguard Worker   }
287*795d594fSAndroid Build Coastguard Worker 
288*795d594fSAndroid Build Coastguard Worker   // The bytes seen are ill-formed. Substitute them by U+FFFD
289*795d594fSAndroid Build Coastguard Worker   if (utf8_bytes_needed != 0) {
290*795d594fSAndroid Build Coastguard Worker     v[s++] = kReplacementChar;
291*795d594fSAndroid Build Coastguard Worker   }
292*795d594fSAndroid Build Coastguard Worker 
293*795d594fSAndroid Build Coastguard Worker   ObjPtr<mirror::String> result = mirror::String::AllocFromUtf16(soa.Self(), s, v);
294*795d594fSAndroid Build Coastguard Worker   return soa.AddLocalReference<jstring>(result);
295*795d594fSAndroid Build Coastguard Worker }
296*795d594fSAndroid Build Coastguard Worker 
// Native method table for java.lang.StringFactory. Each entry names a Java method and its
// JNI type signature; the parameter order in every signature matches the corresponding
// StringFactory_<method> function defined above (e.g. "([BIII)" = byte[], int, int, int and
// "(II[C)" = int, int, char[]).
// NOTE(review): FAST_NATIVE_METHOD is defined outside this file; presumably it binds each
// entry to the StringFactory_<method> function of the same name — confirm against the macro.
static JNINativeMethod gMethods[] = {
  FAST_NATIVE_METHOD(StringFactory, newStringFromBytes, "([BIII)Ljava/lang/String;"),
  FAST_NATIVE_METHOD(StringFactory, newStringFromChars, "(II[C)Ljava/lang/String;"),
  FAST_NATIVE_METHOD(StringFactory, newStringFromString, "(Ljava/lang/String;)Ljava/lang/String;"),
  FAST_NATIVE_METHOD(StringFactory, newStringFromUtf8Bytes, "([BII)Ljava/lang/String;"),
  FAST_NATIVE_METHOD(StringFactory, newStringFromUtf16Bytes, "([BII)Ljava/lang/String;"),
};
304*795d594fSAndroid Build Coastguard Worker 
// Registers the native methods of the Java class "java/lang/StringFactory".
// NOTE(review): REGISTER_NATIVE_METHODS is defined outside this file; presumably it uses
// `env` and the file-local `gMethods` table implicitly — confirm against the macro.
void register_java_lang_StringFactory(JNIEnv* env) {
  REGISTER_NATIVE_METHODS("java/lang/StringFactory");
}
308*795d594fSAndroid Build Coastguard Worker 
309*795d594fSAndroid Build Coastguard Worker }  // namespace art
310