xref: /aosp_15_r20/external/grpc-grpc/third_party/upb/upb/message/promote.c (revision cc02d7e222339f7a4f6ba5f422e6413f4bd931f2)
1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2023 Google LLC.  All rights reserved.
3 //
4 // Use of this source code is governed by a BSD-style
5 // license that can be found in the LICENSE file or at
6 // https://developers.google.com/open-source/licenses/bsd
7 
8 #include "upb/message/promote.h"
9 
10 #include <stdbool.h>
11 #include <stdint.h>
12 #include <string.h>
13 
14 #include "upb/base/descriptor_constants.h"
15 #include "upb/mem/arena.h"
16 #include "upb/message/accessors.h"
17 #include "upb/message/array.h"
18 #include "upb/message/internal/array.h"
19 #include "upb/message/internal/extension.h"
20 #include "upb/message/internal/message.h"
21 #include "upb/message/internal/tagged_ptr.h"
22 #include "upb/message/map.h"
23 #include "upb/message/message.h"
24 #include "upb/message/tagged_ptr.h"
25 #include "upb/mini_table/extension.h"
26 #include "upb/mini_table/field.h"
27 #include "upb/mini_table/message.h"
28 #include "upb/mini_table/sub.h"
29 #include "upb/wire/decode.h"
30 #include "upb/wire/eps_copy_input_stream.h"
31 #include "upb/wire/reader.h"
32 
33 // Must be last.
34 #include "upb/port/def.inc"
35 
36 // Parses unknown data by merging into existing base_message or creating a
37 // new message usingg mini_table.
upb_MiniTable_ParseUnknownMessage(const char * unknown_data,size_t unknown_size,const upb_MiniTable * mini_table,upb_Message * base_message,int decode_options,upb_Arena * arena)38 static upb_UnknownToMessageRet upb_MiniTable_ParseUnknownMessage(
39     const char* unknown_data, size_t unknown_size,
40     const upb_MiniTable* mini_table, upb_Message* base_message,
41     int decode_options, upb_Arena* arena) {
42   upb_UnknownToMessageRet ret;
43   ret.message =
44       base_message ? base_message : _upb_Message_New(mini_table, arena);
45   if (!ret.message) {
46     ret.status = kUpb_UnknownToMessage_OutOfMemory;
47     return ret;
48   }
49   // Decode sub message using unknown field contents.
50   const char* data = unknown_data;
51   uint32_t tag;
52   uint64_t message_len = 0;
53   data = upb_WireReader_ReadTag(data, &tag);
54   data = upb_WireReader_ReadVarint(data, &message_len);
55   upb_DecodeStatus status = upb_Decode(data, message_len, ret.message,
56                                        mini_table, NULL, decode_options, arena);
57   if (status == kUpb_DecodeStatus_OutOfMemory) {
58     ret.status = kUpb_UnknownToMessage_OutOfMemory;
59   } else if (status == kUpb_DecodeStatus_Ok) {
60     ret.status = kUpb_UnknownToMessage_Ok;
61   } else {
62     ret.status = kUpb_UnknownToMessage_ParseError;
63   }
64   return ret;
65 }
66 
upb_Message_GetOrPromoteExtension(upb_Message * msg,const upb_MiniTableExtension * ext_table,int decode_options,upb_Arena * arena,upb_MessageValue * value)67 upb_GetExtension_Status upb_Message_GetOrPromoteExtension(
68     upb_Message* msg, const upb_MiniTableExtension* ext_table,
69     int decode_options, upb_Arena* arena, upb_MessageValue* value) {
70   UPB_ASSERT(upb_MiniTableExtension_CType(ext_table) == kUpb_CType_Message);
71   const upb_Extension* extension =
72       UPB_PRIVATE(_upb_Message_Getext)(msg, ext_table);
73   if (extension) {
74     memcpy(value, &extension->data, sizeof(upb_MessageValue));
75     return kUpb_GetExtension_Ok;
76   }
77 
78   // Check unknown fields, if available promote.
79   int field_number = upb_MiniTableExtension_Number(ext_table);
80   upb_FindUnknownRet result = upb_Message_FindUnknown(msg, field_number, 0);
81   if (result.status != kUpb_FindUnknown_Ok) {
82     return kUpb_GetExtension_NotPresent;
83   }
84   size_t len;
85   size_t ofs = result.ptr - upb_Message_GetUnknown(msg, &len);
86   // Decode and promote from unknown.
87   const upb_MiniTable* extension_table =
88       upb_MiniTableExtension_GetSubMessage(ext_table);
89   upb_UnknownToMessageRet parse_result = upb_MiniTable_ParseUnknownMessage(
90       result.ptr, result.len, extension_table,
91       /* base_message= */ NULL, decode_options, arena);
92   switch (parse_result.status) {
93     case kUpb_UnknownToMessage_OutOfMemory:
94       return kUpb_GetExtension_OutOfMemory;
95     case kUpb_UnknownToMessage_ParseError:
96       return kUpb_GetExtension_ParseError;
97     case kUpb_UnknownToMessage_NotFound:
98       return kUpb_GetExtension_NotPresent;
99     case kUpb_UnknownToMessage_Ok:
100       break;
101   }
102   upb_Message* extension_msg = parse_result.message;
103   // Add to extensions.
104   upb_Extension* ext =
105       UPB_PRIVATE(_upb_Message_GetOrCreateExtension)(msg, ext_table, arena);
106   if (!ext) {
107     return kUpb_GetExtension_OutOfMemory;
108   }
109   ext->data.ptr = extension_msg;
110   value->msg_val = extension_msg;
111   const char* delete_ptr = upb_Message_GetUnknown(msg, &len) + ofs;
112   upb_Message_DeleteUnknown(msg, delete_ptr, result.len);
113   return kUpb_GetExtension_Ok;
114 }
115 
upb_FindUnknownRet_ParseError(void)116 static upb_FindUnknownRet upb_FindUnknownRet_ParseError(void) {
117   return (upb_FindUnknownRet){.status = kUpb_FindUnknown_ParseError};
118 }
119 
upb_Message_FindUnknown(const upb_Message * msg,uint32_t field_number,int depth_limit)120 upb_FindUnknownRet upb_Message_FindUnknown(const upb_Message* msg,
121                                            uint32_t field_number,
122                                            int depth_limit) {
123   depth_limit = depth_limit ? depth_limit : 100;
124 
125   size_t size;
126   upb_FindUnknownRet ret;
127 
128   const char* ptr = upb_Message_GetUnknown(msg, &size);
129   upb_EpsCopyInputStream stream;
130   upb_EpsCopyInputStream_Init(&stream, &ptr, size, true);
131 
132   while (!upb_EpsCopyInputStream_IsDone(&stream, &ptr)) {
133     uint32_t tag;
134     const char* unknown_begin = ptr;
135     ptr = upb_WireReader_ReadTag(ptr, &tag);
136     if (!ptr) return upb_FindUnknownRet_ParseError();
137     if (field_number == upb_WireReader_GetFieldNumber(tag)) {
138       ret.status = kUpb_FindUnknown_Ok;
139       ret.ptr = upb_EpsCopyInputStream_GetAliasedPtr(&stream, unknown_begin);
140       ptr = _upb_WireReader_SkipValue(ptr, tag, depth_limit, &stream);
141       // Because we know that the input is a flat buffer, it is safe to perform
142       // pointer arithmetic on aliased pointers.
143       ret.len = upb_EpsCopyInputStream_GetAliasedPtr(&stream, ptr) - ret.ptr;
144       return ret;
145     }
146 
147     ptr = _upb_WireReader_SkipValue(ptr, tag, depth_limit, &stream);
148     if (!ptr) return upb_FindUnknownRet_ParseError();
149   }
150   ret.status = kUpb_FindUnknown_NotPresent;
151   ret.ptr = NULL;
152   ret.len = 0;
153   return ret;
154 }
155 
upb_Message_PromoteOne(upb_TaggedMessagePtr * tagged,const upb_MiniTable * mini_table,int decode_options,upb_Arena * arena)156 static upb_DecodeStatus upb_Message_PromoteOne(upb_TaggedMessagePtr* tagged,
157                                                const upb_MiniTable* mini_table,
158                                                int decode_options,
159                                                upb_Arena* arena) {
160   upb_Message* empty =
161       UPB_PRIVATE(_upb_TaggedMessagePtr_GetEmptyMessage)(*tagged);
162   size_t unknown_size;
163   const char* unknown_data = upb_Message_GetUnknown(empty, &unknown_size);
164   upb_Message* promoted = upb_Message_New(mini_table, arena);
165   if (!promoted) return kUpb_DecodeStatus_OutOfMemory;
166   upb_DecodeStatus status = upb_Decode(unknown_data, unknown_size, promoted,
167                                        mini_table, NULL, decode_options, arena);
168   if (status == kUpb_DecodeStatus_Ok) {
169     *tagged = UPB_PRIVATE(_upb_TaggedMessagePtr_Pack)(promoted, false);
170   }
171   return status;
172 }
173 
upb_Message_PromoteMessage(upb_Message * parent,const upb_MiniTable * mini_table,const upb_MiniTableField * field,int decode_options,upb_Arena * arena,upb_Message ** promoted)174 upb_DecodeStatus upb_Message_PromoteMessage(upb_Message* parent,
175                                             const upb_MiniTable* mini_table,
176                                             const upb_MiniTableField* field,
177                                             int decode_options,
178                                             upb_Arena* arena,
179                                             upb_Message** promoted) {
180   const upb_MiniTable* sub_table =
181       upb_MiniTable_GetSubMessageTable(mini_table, field);
182   UPB_ASSERT(sub_table);
183   upb_TaggedMessagePtr tagged =
184       upb_Message_GetTaggedMessagePtr(parent, field, NULL);
185   upb_DecodeStatus ret =
186       upb_Message_PromoteOne(&tagged, sub_table, decode_options, arena);
187   if (ret == kUpb_DecodeStatus_Ok) {
188     *promoted = upb_TaggedMessagePtr_GetNonEmptyMessage(tagged);
189     upb_Message_SetMessage(parent, mini_table, field, *promoted);
190   }
191   return ret;
192 }
193 
upb_Array_PromoteMessages(upb_Array * arr,const upb_MiniTable * mini_table,int decode_options,upb_Arena * arena)194 upb_DecodeStatus upb_Array_PromoteMessages(upb_Array* arr,
195                                            const upb_MiniTable* mini_table,
196                                            int decode_options,
197                                            upb_Arena* arena) {
198   void** data = upb_Array_MutableDataPtr(arr);
199   size_t size = arr->UPB_PRIVATE(size);
200   for (size_t i = 0; i < size; i++) {
201     upb_TaggedMessagePtr tagged;
202     memcpy(&tagged, &data[i], sizeof(tagged));
203     if (!upb_TaggedMessagePtr_IsEmpty(tagged)) continue;
204     upb_DecodeStatus status =
205         upb_Message_PromoteOne(&tagged, mini_table, decode_options, arena);
206     if (status != kUpb_DecodeStatus_Ok) return status;
207     memcpy(&data[i], &tagged, sizeof(tagged));
208   }
209   return kUpb_DecodeStatus_Ok;
210 }
211 
upb_Map_PromoteMessages(upb_Map * map,const upb_MiniTable * mini_table,int decode_options,upb_Arena * arena)212 upb_DecodeStatus upb_Map_PromoteMessages(upb_Map* map,
213                                          const upb_MiniTable* mini_table,
214                                          int decode_options, upb_Arena* arena) {
215   size_t iter = kUpb_Map_Begin;
216   upb_MessageValue key, val;
217   while (upb_Map_Next(map, &key, &val, &iter)) {
218     if (!upb_TaggedMessagePtr_IsEmpty(val.tagged_msg_val)) continue;
219     upb_DecodeStatus status = upb_Message_PromoteOne(
220         &val.tagged_msg_val, mini_table, decode_options, arena);
221     if (status != kUpb_DecodeStatus_Ok) return status;
222     upb_Map_SetEntryValue(map, iter, val);
223   }
224   return kUpb_DecodeStatus_Ok;
225 }
226 
227 ////////////////////////////////////////////////////////////////////////////////
228 // OLD promotion functions, will be removed!
229 ////////////////////////////////////////////////////////////////////////////////
230 
231 // Warning: See TODO
upb_MiniTable_PromoteUnknownToMessage(upb_Message * msg,const upb_MiniTable * mini_table,const upb_MiniTableField * field,const upb_MiniTable * sub_mini_table,int decode_options,upb_Arena * arena)232 upb_UnknownToMessageRet upb_MiniTable_PromoteUnknownToMessage(
233     upb_Message* msg, const upb_MiniTable* mini_table,
234     const upb_MiniTableField* field, const upb_MiniTable* sub_mini_table,
235     int decode_options, upb_Arena* arena) {
236   upb_FindUnknownRet unknown;
237   // We need to loop and merge unknowns that have matching tag field->number.
238   upb_Message* message = NULL;
239   // Callers should check that message is not set first before calling
240   // PromotoUnknownToMessage.
241   UPB_ASSERT(upb_MiniTable_GetSubMessageTable(mini_table, field) ==
242              sub_mini_table);
243   bool is_oneof = upb_MiniTableField_IsInOneof(field);
244   if (!is_oneof || UPB_PRIVATE(_upb_Message_GetOneofCase)(msg, field) ==
245                        upb_MiniTableField_Number(field)) {
246     UPB_ASSERT(upb_Message_GetMessage(msg, field, NULL) == NULL);
247   }
248   upb_UnknownToMessageRet ret;
249   ret.status = kUpb_UnknownToMessage_Ok;
250   do {
251     unknown =
252         upb_Message_FindUnknown(msg, upb_MiniTableField_Number(field),
253                                 upb_DecodeOptions_GetMaxDepth(decode_options));
254     switch (unknown.status) {
255       case kUpb_FindUnknown_Ok: {
256         const char* unknown_data = unknown.ptr;
257         size_t unknown_size = unknown.len;
258         ret = upb_MiniTable_ParseUnknownMessage(unknown_data, unknown_size,
259                                                 sub_mini_table, message,
260                                                 decode_options, arena);
261         if (ret.status == kUpb_UnknownToMessage_Ok) {
262           message = ret.message;
263           upb_Message_DeleteUnknown(msg, unknown_data, unknown_size);
264         }
265       } break;
266       case kUpb_FindUnknown_ParseError:
267         ret.status = kUpb_UnknownToMessage_ParseError;
268         break;
269       case kUpb_FindUnknown_NotPresent:
270         // If we parsed at least one unknown, we are done.
271         ret.status =
272             message ? kUpb_UnknownToMessage_Ok : kUpb_UnknownToMessage_NotFound;
273         break;
274     }
275   } while (unknown.status == kUpb_FindUnknown_Ok);
276   if (message) {
277     if (is_oneof) {
278       UPB_PRIVATE(_upb_Message_SetOneofCase)(msg, field);
279     }
280     upb_Message_SetMessage(msg, mini_table, field, message);
281     ret.message = message;
282   }
283   return ret;
284 }
285 
286 // Moves repeated messages in unknowns to a upb_Array.
287 //
288 // Since the repeated field is not a scalar type we don't check for
289 // kUpb_LabelFlags_IsPacked.
290 // TODO: Optimize. Instead of converting messages one at a time,
291 // scan all unknown data once and compact.
upb_MiniTable_PromoteUnknownToMessageArray(upb_Message * msg,const upb_MiniTableField * field,const upb_MiniTable * mini_table,int decode_options,upb_Arena * arena)292 upb_UnknownToMessage_Status upb_MiniTable_PromoteUnknownToMessageArray(
293     upb_Message* msg, const upb_MiniTableField* field,
294     const upb_MiniTable* mini_table, int decode_options, upb_Arena* arena) {
295   upb_Array* repeated_messages = upb_Message_GetMutableArray(msg, field);
296   // Find all unknowns with given field number and parse.
297   upb_FindUnknownRet unknown;
298   do {
299     unknown =
300         upb_Message_FindUnknown(msg, upb_MiniTableField_Number(field),
301                                 upb_DecodeOptions_GetMaxDepth(decode_options));
302     if (unknown.status == kUpb_FindUnknown_Ok) {
303       upb_UnknownToMessageRet ret = upb_MiniTable_ParseUnknownMessage(
304           unknown.ptr, unknown.len, mini_table,
305           /* base_message= */ NULL, decode_options, arena);
306       if (ret.status == kUpb_UnknownToMessage_Ok) {
307         upb_MessageValue value;
308         value.msg_val = ret.message;
309         // Allocate array on demand before append.
310         if (!repeated_messages) {
311           upb_Message_ResizeArrayUninitialized(msg, field, 0, arena);
312           repeated_messages = upb_Message_GetMutableArray(msg, field);
313         }
314         if (!upb_Array_Append(repeated_messages, value, arena)) {
315           return kUpb_UnknownToMessage_OutOfMemory;
316         }
317         upb_Message_DeleteUnknown(msg, unknown.ptr, unknown.len);
318       } else {
319         return ret.status;
320       }
321     }
322   } while (unknown.status == kUpb_FindUnknown_Ok);
323   return kUpb_UnknownToMessage_Ok;
324 }
325 
326 // Moves repeated messages in unknowns to a upb_Map.
upb_MiniTable_PromoteUnknownToMap(upb_Message * msg,const upb_MiniTable * mini_table,const upb_MiniTableField * field,int decode_options,upb_Arena * arena)327 upb_UnknownToMessage_Status upb_MiniTable_PromoteUnknownToMap(
328     upb_Message* msg, const upb_MiniTable* mini_table,
329     const upb_MiniTableField* field, int decode_options, upb_Arena* arena) {
330   // TODO: use a variant of upb_MiniTable_GetSubMessageTable() here.
331   const upb_MiniTable* map_entry_mini_table = upb_MiniTableSub_Message(
332       mini_table->UPB_PRIVATE(subs)[field->UPB_PRIVATE(submsg_index)]);
333   UPB_ASSERT(map_entry_mini_table);
334   UPB_ASSERT(map_entry_mini_table);
335   UPB_ASSERT(map_entry_mini_table->UPB_PRIVATE(field_count) == 2);
336   UPB_ASSERT(upb_MiniTableField_IsMap(field));
337   // Find all unknowns with given field number and parse.
338   upb_FindUnknownRet unknown;
339   while (1) {
340     unknown =
341         upb_Message_FindUnknown(msg, upb_MiniTableField_Number(field),
342                                 upb_DecodeOptions_GetMaxDepth(decode_options));
343     if (unknown.status != kUpb_FindUnknown_Ok) break;
344     upb_UnknownToMessageRet ret = upb_MiniTable_ParseUnknownMessage(
345         unknown.ptr, unknown.len, map_entry_mini_table,
346         /* base_message= */ NULL, decode_options, arena);
347     if (ret.status != kUpb_UnknownToMessage_Ok) return ret.status;
348     // Allocate map on demand before append.
349     upb_Map* map = upb_Message_GetOrCreateMutableMap(msg, map_entry_mini_table,
350                                                      field, arena);
351     upb_Message* map_entry_message = ret.message;
352     bool insert_success = upb_Message_SetMapEntry(map, mini_table, field,
353                                                   map_entry_message, arena);
354     if (!insert_success) return kUpb_UnknownToMessage_OutOfMemory;
355     upb_Message_DeleteUnknown(msg, unknown.ptr, unknown.len);
356   }
357   return kUpb_UnknownToMessage_Ok;
358 }
359