| // Protocol Buffers - Google's data interchange format |
| // Copyright 2023 Google LLC. All rights reserved. |
| // |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file or at |
| // https://developers.google.com/open-source/licenses/bsd |
| |
| // We encode backwards, to avoid pre-computing lengths (one-pass encode). |
| |
| #include "upb/wire/encode.h" |
| |
| #include <setjmp.h> |
| #include <stdbool.h> |
| #include <stdint.h> |
| #include <stdlib.h> |
| #include <string.h> |
| |
| #include "upb/base/descriptor_constants.h" |
| #include "upb/base/internal/endian.h" |
| #include "upb/base/string_view.h" |
| #include "upb/hash/common.h" |
| #include "upb/hash/int_table.h" |
| #include "upb/hash/str_table.h" |
| #include "upb/mem/arena.h" |
| #include "upb/message/array.h" |
| #include "upb/message/internal/accessors.h" |
| #include "upb/message/internal/array.h" |
| #include "upb/message/internal/extension.h" |
| #include "upb/message/internal/map.h" |
| #include "upb/message/internal/map_entry.h" |
| #include "upb/message/internal/map_sorter.h" |
| #include "upb/message/internal/message.h" |
| #include "upb/message/internal/tagged_ptr.h" |
| #include "upb/message/map.h" |
| #include "upb/message/message.h" |
| #include "upb/message/tagged_ptr.h" |
| #include "upb/mini_table/extension.h" |
| #include "upb/mini_table/field.h" |
| #include "upb/mini_table/internal/field.h" |
| #include "upb/mini_table/internal/message.h" |
| #include "upb/mini_table/internal/sub.h" |
| #include "upb/mini_table/message.h" |
| #include "upb/wire/internal/constants.h" |
| #include "upb/wire/types.h" |
| #include "upb/wire/writer.h" |
| |
| // Must be last. |
| #include "upb/port/def.inc" |
| |
| // Returns the MiniTable corresponding to a given MiniTableField |
| // from an array of MiniTableSubs. |
| static const upb_MiniTable* _upb_Encoder_GetSubMiniTable( |
| const upb_MiniTableSubInternal* subs, const upb_MiniTableField* field) { |
| return *subs[field->UPB_PRIVATE(submsg_index)].UPB_PRIVATE(submsg); |
| } |
| |
| static uint32_t encode_zz32(int32_t n) { |
| return ((uint32_t)n << 1) ^ (n >> 31); |
| } |
| static uint64_t encode_zz64(int64_t n) { |
| return ((uint64_t)n << 1) ^ (n >> 63); |
| } |
| |
| typedef struct { |
| upb_EncodeStatus status; |
| jmp_buf err; |
| upb_Arena* arena; |
| // These should only be used for arithmetic and reallocation to allow full |
| // aliasing analysis on the ptr argument. |
| const char UPB_NODEREF *buf, *limit; |
| int options; |
| int depth; |
| _upb_mapsorter sorter; |
| } upb_encstate; |
| |
| static size_t upb_roundup_pow2(size_t bytes) { |
| size_t ret = 128; |
| while (ret < bytes) { |
| ret *= 2; |
| } |
| return ret; |
| } |
| |
| UPB_NORETURN static void encode_err(upb_encstate* e, upb_EncodeStatus s) { |
| UPB_ASSERT(s != kUpb_EncodeStatus_Ok); |
| e->status = s; |
| UPB_LONGJMP(e->err, 1); |
| } |
| |
| UPB_NOINLINE |
| static char* encode_growbuffer(char* ptr, upb_encstate* e, size_t bytes) { |
| size_t old_size = e->limit - e->buf; |
| size_t needed_size = bytes + (e->limit - ptr); |
| size_t new_size = upb_roundup_pow2(needed_size); |
| char* new_buf = |
| upb_Arena_Realloc(e->arena, (void*)e->buf, old_size, new_size); |
| |
| if (!new_buf) encode_err(e, kUpb_EncodeStatus_OutOfMemory); |
| |
| // We want previous data at the end, realloc() put it at the beginning. |
| // TODO: This is somewhat inefficient since we are copying twice. |
| // Maybe create a realloc() that copies to the end of the new buffer? |
| if (old_size > 0) { |
| memmove(new_buf + new_size - old_size, new_buf, old_size); |
| } |
| |
| e->buf = new_buf; |
| e->limit = new_buf + new_size; |
| return new_buf + new_size - needed_size; |
| } |
| |
| /* Call to ensure that at least `bytes` bytes are available for writing at |
| * ptr. */ |
| UPB_FORCEINLINE |
| char* encode_reserve(char* ptr, upb_encstate* e, size_t bytes) { |
| if ((size_t)(ptr - e->buf) < bytes) { |
| return encode_growbuffer(ptr, e, bytes); |
| } |
| |
| return ptr - bytes; |
| } |
| |
| /* Writes the given bytes to the buffer, handling reserve/advance. */ |
| static char* encode_bytes(char* ptr, upb_encstate* e, const void* data, |
| size_t len) { |
| if (len == 0) return ptr; /* memcpy() with zero size is UB */ |
| ptr = encode_reserve(ptr, e, len); |
| memcpy(ptr, data, len); |
| return ptr; |
| } |
| |
| static char* encode_fixed64(char* ptr, upb_encstate* e, uint64_t val) { |
| val = upb_BigEndian64(val); |
| return encode_bytes(ptr, e, &val, sizeof(uint64_t)); |
| } |
| |
| static char* encode_fixed32(char* ptr, upb_encstate* e, uint32_t val) { |
| val = upb_BigEndian32(val); |
| return encode_bytes(ptr, e, &val, sizeof(uint32_t)); |
| } |
| |
| #define UPB_PB_VARINT_MAX_LEN 10 |
| |
| // Need gnu extended inline asm; msan can't instrument stores in inline assembly |
| #if defined(__aarch64__) && (defined(__GNUC__) || defined(__clang__)) && \ |
| !UPB_HAS_FEATURE(memory_sanitizer) |
| #define UPB_ARM64_ASM |
| #endif |
| |
| #ifdef UPB_ARM64_ASM |
| UPB_NOINLINE static char* encode_longvarint_arm64(char* ptr, upb_encstate* e, |
| uint64_t val) { |
| ptr = encode_reserve(ptr, e, UPB_PB_VARINT_MAX_LEN); |
| uint64_t clz; |
| __asm__("clz %[cnt], %[val]\n" : [cnt] "=r"(clz) : [val] "r"(val)); |
| |
| uint32_t skip = |
| UPB_PRIVATE(upb_WireWriter_VarintUnusedSizeFromLeadingZeros64)(clz); |
| |
| ptr += skip; |
| uint64_t addr, mask; |
| __asm__ volatile( |
| "adr %[addr], 0f\n" |
| // Each arm64 instruction encodes to 4 bytes, and it takes two |
| // intructions to process each byte of output, so we branch ahead by |
| // (4 + 4) * skip to avoid the remaining bytes. |
| "add %[addr], %[addr], %[cnt], lsl #3\n" |
| "mov %w[mask], #0x80\n" |
| "br %[addr]\n" |
| "0:\n" |
| // We don't need addr any more, but we've got the register for our whole |
| // assembly block so we'll use it as scratch to store the shift+masked |
| // values before storing them. |
| // The following stores are unsigned offset stores: |
| // strb Wt, [Xn, #imm] |
| "orr %[addr], %[mask], %[val], lsr #56\n" |
| "strb %w[addr], [%[ptr], #8]\n" |
| "orr %[addr], %[mask], %[val], lsr #49\n" |
| "strb %w[addr], [%[ptr], #7]\n" |
| "orr %[addr], %[mask], %[val], lsr #42\n" |
| "strb %w[addr], [%[ptr], #6]\n" |
| "orr %[addr], %[mask], %[val], lsr #35\n" |
| "strb %w[addr], [%[ptr], #5]\n" |
| "orr %[addr], %[mask], %[val], lsr #28\n" |
| "strb %w[addr], [%[ptr], #4]\n" |
| "orr %w[addr], %w[mask], %w[val], lsr #21\n" |
| "strb %w[addr], [%[ptr], #3]\n" |
| "orr %w[addr], %w[mask], %w[val], lsr #14\n" |
| "strb %w[addr], [%[ptr], #2]\n" |
| "orr %w[addr], %w[mask], %w[val], lsr #7\n" |
| "strb %w[addr], [%[ptr], #1]\n" |
| "orr %w[addr], %w[val], #0x80\n" |
| "strb %w[addr], [%[ptr]]\n" |
| : [addr] "=&r"(addr), [mask] "=&r"(mask) |
| : [val] "r"(val), [ptr] "r"(ptr), [cnt] "r"((uint64_t)skip) |
| : "memory"); |
| // Encode the final byte after the continuation bytes. |
| uint32_t continuations = UPB_PB_VARINT_MAX_LEN - 1 - skip; |
| ptr[continuations] = val >> (7 * continuations); |
| return ptr; |
| } |
| #else |
| UPB_NOINLINE |
| static char* encode_longvarint(char* ptr, upb_encstate* e, uint64_t val) { |
| ptr = encode_reserve(ptr, e, UPB_PB_VARINT_MAX_LEN); |
| size_t len = 0; |
| do { |
| uint8_t byte = val & 0x7fU; |
| val >>= 7; |
| if (val) byte |= 0x80U; |
| ptr[len++] = byte; |
| } while (val); |
| char* start = ptr + UPB_PB_VARINT_MAX_LEN - len; |
| memmove(start, ptr, len); |
| return start; |
| } |
| #endif |
| |
| UPB_FORCEINLINE |
| char* encode_varint(char* ptr, upb_encstate* e, uint64_t val) { |
| if (val < 128 && ptr != e->buf) { |
| --ptr; |
| *ptr = val; |
| return ptr; |
| } else { |
| #ifdef UPB_ARM64_ASM |
| return encode_longvarint_arm64(ptr, e, val); |
| #else |
| return encode_longvarint(ptr, e, val); |
| #endif |
| } |
| } |
| |
| static char* encode_double(char* ptr, upb_encstate* e, double d) { |
| uint64_t u64; |
| UPB_ASSERT(sizeof(double) == sizeof(uint64_t)); |
| memcpy(&u64, &d, sizeof(uint64_t)); |
| return encode_fixed64(ptr, e, u64); |
| } |
| |
| static char* encode_float(char* ptr, upb_encstate* e, float d) { |
| uint32_t u32; |
| UPB_ASSERT(sizeof(float) == sizeof(uint32_t)); |
| memcpy(&u32, &d, sizeof(uint32_t)); |
| return encode_fixed32(ptr, e, u32); |
| } |
| |
| static char* encode_tag(char* ptr, upb_encstate* e, uint32_t field_number, |
| uint8_t wire_type) { |
| return encode_varint(ptr, e, (field_number << 3) | wire_type); |
| } |
| |
| static char* encode_fixedarray(char* ptr, upb_encstate* e, const upb_Array* arr, |
| size_t elem_size, uint32_t tag) { |
| size_t bytes = upb_Array_Size(arr) * elem_size; |
| const char* data = upb_Array_DataPtr(arr); |
| const char* arr_ptr = data + bytes - elem_size; |
| |
| if (tag || !upb_IsLittleEndian()) { |
| while (true) { |
| if (elem_size == 4) { |
| uint32_t val; |
| memcpy(&val, arr_ptr, sizeof(val)); |
| val = upb_BigEndian32(val); |
| ptr = encode_bytes(ptr, e, &val, elem_size); |
| } else { |
| UPB_ASSERT(elem_size == 8); |
| uint64_t val; |
| memcpy(&val, arr_ptr, sizeof(val)); |
| val = upb_BigEndian64(val); |
| ptr = encode_bytes(ptr, e, &val, elem_size); |
| } |
| |
| if (tag) { |
| ptr = encode_varint(ptr, e, tag); |
| } |
| if (arr_ptr == data) break; |
| arr_ptr -= elem_size; |
| } |
| return ptr; |
| } else { |
| return encode_bytes(ptr, e, data, bytes); |
| } |
| } |
| |
| static char* encode_message(char* ptr, upb_encstate* e, const upb_Message* msg, |
| const upb_MiniTable* m, size_t* size); |
| |
| static char* encode_TaggedMessagePtr(char* ptr, upb_encstate* e, |
| upb_TaggedMessagePtr tagged, |
| const upb_MiniTable* m, size_t* size) { |
| if (upb_TaggedMessagePtr_IsEmpty(tagged)) { |
| m = UPB_PRIVATE(_upb_MiniTable_Empty)(); |
| } |
| return encode_message( |
| ptr, e, UPB_PRIVATE(_upb_TaggedMessagePtr_GetMessage)(tagged), m, size); |
| } |
| |
| static char* encode_scalar(char* ptr, upb_encstate* e, const void* _field_mem, |
| const upb_MiniTableSubInternal* subs, |
| const upb_MiniTableField* f) { |
| const char* field_mem = _field_mem; |
| int wire_type; |
| |
| #define CASE(ctype, type, wtype, encodeval) \ |
| { \ |
| ctype val = *(ctype*)field_mem; \ |
| ptr = encode_##type(ptr, e, encodeval); \ |
| wire_type = wtype; \ |
| break; \ |
| } |
| |
| switch (f->UPB_PRIVATE(descriptortype)) { |
| case kUpb_FieldType_Double: |
| CASE(double, double, kUpb_WireType_64Bit, val); |
| case kUpb_FieldType_Float: |
| CASE(float, float, kUpb_WireType_32Bit, val); |
| case kUpb_FieldType_Int64: |
| case kUpb_FieldType_UInt64: |
| CASE(uint64_t, varint, kUpb_WireType_Varint, val); |
| case kUpb_FieldType_UInt32: |
| CASE(uint32_t, varint, kUpb_WireType_Varint, val); |
| case kUpb_FieldType_Int32: |
| case kUpb_FieldType_Enum: |
| CASE(int32_t, varint, kUpb_WireType_Varint, (int64_t)val); |
| case kUpb_FieldType_SFixed64: |
| case kUpb_FieldType_Fixed64: |
| CASE(uint64_t, fixed64, kUpb_WireType_64Bit, val); |
| case kUpb_FieldType_Fixed32: |
| case kUpb_FieldType_SFixed32: |
| CASE(uint32_t, fixed32, kUpb_WireType_32Bit, val); |
| case kUpb_FieldType_Bool: |
| CASE(bool, varint, kUpb_WireType_Varint, val); |
| case kUpb_FieldType_SInt32: |
| CASE(int32_t, varint, kUpb_WireType_Varint, encode_zz32(val)); |
| case kUpb_FieldType_SInt64: |
| CASE(int64_t, varint, kUpb_WireType_Varint, encode_zz64(val)); |
| case kUpb_FieldType_String: |
| case kUpb_FieldType_Bytes: { |
| upb_StringView view = *(upb_StringView*)field_mem; |
| ptr = encode_bytes(ptr, e, view.data, view.size); |
| ptr = encode_varint(ptr, e, view.size); |
| wire_type = kUpb_WireType_Delimited; |
| break; |
| } |
| case kUpb_FieldType_Group: { |
| size_t size; |
| upb_TaggedMessagePtr submsg = *(upb_TaggedMessagePtr*)field_mem; |
| const upb_MiniTable* subm = _upb_Encoder_GetSubMiniTable(subs, f); |
| if (submsg == 0) { |
| return ptr; |
| } |
| if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded); |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_EndGroup); |
| ptr = encode_TaggedMessagePtr(ptr, e, submsg, subm, &size); |
| wire_type = kUpb_WireType_StartGroup; |
| e->depth++; |
| break; |
| } |
| case kUpb_FieldType_Message: { |
| size_t size; |
| upb_TaggedMessagePtr submsg = *(upb_TaggedMessagePtr*)field_mem; |
| const upb_MiniTable* subm = _upb_Encoder_GetSubMiniTable(subs, f); |
| if (submsg == 0) { |
| return ptr; |
| } |
| if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded); |
| ptr = encode_TaggedMessagePtr(ptr, e, submsg, subm, &size); |
| ptr = encode_varint(ptr, e, size); |
| wire_type = kUpb_WireType_Delimited; |
| e->depth++; |
| break; |
| } |
| default: |
| UPB_UNREACHABLE(); |
| } |
| #undef CASE |
| |
| return encode_tag(ptr, e, upb_MiniTableField_Number(f), wire_type); |
| } |
| |
| static char* encode_array(char* ptr, upb_encstate* e, const upb_Message* msg, |
| const upb_MiniTableSubInternal* subs, |
| const upb_MiniTableField* f) { |
| const upb_Array* arr = *UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), upb_Array*); |
| bool packed = upb_MiniTableField_IsPacked(f); |
| size_t pre_len = e->limit - ptr; |
| |
| if (arr == NULL || upb_Array_Size(arr) == 0) { |
| return ptr; |
| } |
| |
| #define VARINT_CASE(ctype, encode) \ |
| { \ |
| const ctype* start = upb_Array_DataPtr(arr); \ |
| const ctype* arr_ptr = start + upb_Array_Size(arr); \ |
| uint32_t tag = \ |
| packed ? 0 : (f->UPB_PRIVATE(number) << 3) | kUpb_WireType_Varint; \ |
| do { \ |
| arr_ptr--; \ |
| ptr = encode_varint(ptr, e, encode); \ |
| if (tag) { \ |
| ptr = encode_varint(ptr, e, tag); \ |
| } \ |
| } while (arr_ptr != start); \ |
| } \ |
| break; |
| |
| #define TAG(wire_type) (packed ? 0 : (f->UPB_PRIVATE(number) << 3 | wire_type)) |
| |
| switch (f->UPB_PRIVATE(descriptortype)) { |
| case kUpb_FieldType_Double: |
| ptr = encode_fixedarray(ptr, e, arr, sizeof(double), |
| TAG(kUpb_WireType_64Bit)); |
| break; |
| case kUpb_FieldType_Float: |
| ptr = encode_fixedarray(ptr, e, arr, sizeof(float), |
| TAG(kUpb_WireType_32Bit)); |
| break; |
| case kUpb_FieldType_SFixed64: |
| case kUpb_FieldType_Fixed64: |
| ptr = encode_fixedarray(ptr, e, arr, sizeof(uint64_t), |
| TAG(kUpb_WireType_64Bit)); |
| break; |
| case kUpb_FieldType_Fixed32: |
| case kUpb_FieldType_SFixed32: |
| ptr = encode_fixedarray(ptr, e, arr, sizeof(uint32_t), |
| TAG(kUpb_WireType_32Bit)); |
| break; |
| case kUpb_FieldType_Int64: |
| case kUpb_FieldType_UInt64: |
| VARINT_CASE(uint64_t, *arr_ptr); |
| case kUpb_FieldType_UInt32: |
| VARINT_CASE(uint32_t, *arr_ptr); |
| case kUpb_FieldType_Int32: |
| case kUpb_FieldType_Enum: |
| VARINT_CASE(int32_t, (int64_t)*arr_ptr); |
| case kUpb_FieldType_Bool: |
| VARINT_CASE(bool, *arr_ptr); |
| case kUpb_FieldType_SInt32: |
| VARINT_CASE(int32_t, encode_zz32(*arr_ptr)); |
| case kUpb_FieldType_SInt64: |
| VARINT_CASE(int64_t, encode_zz64(*arr_ptr)); |
| case kUpb_FieldType_String: |
| case kUpb_FieldType_Bytes: { |
| const upb_StringView* start = upb_Array_DataPtr(arr); |
| const upb_StringView* str_ptr = start + upb_Array_Size(arr); |
| do { |
| str_ptr--; |
| ptr = encode_bytes(ptr, e, str_ptr->data, str_ptr->size); |
| ptr = encode_varint(ptr, e, str_ptr->size); |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_Delimited); |
| } while (str_ptr != start); |
| return ptr; |
| } |
| case kUpb_FieldType_Group: { |
| const upb_TaggedMessagePtr* start = upb_Array_DataPtr(arr); |
| const upb_TaggedMessagePtr* arr_ptr = start + upb_Array_Size(arr); |
| const upb_MiniTable* subm = _upb_Encoder_GetSubMiniTable(subs, f); |
| if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded); |
| do { |
| size_t size; |
| arr_ptr--; |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_EndGroup); |
| ptr = encode_TaggedMessagePtr(ptr, e, *arr_ptr, subm, &size); |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_StartGroup); |
| } while (arr_ptr != start); |
| e->depth++; |
| return ptr; |
| } |
| case kUpb_FieldType_Message: { |
| const upb_TaggedMessagePtr* start = upb_Array_DataPtr(arr); |
| const upb_TaggedMessagePtr* arr_ptr = start + upb_Array_Size(arr); |
| const upb_MiniTable* subm = _upb_Encoder_GetSubMiniTable(subs, f); |
| if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded); |
| do { |
| size_t size; |
| arr_ptr--; |
| ptr = encode_TaggedMessagePtr(ptr, e, *arr_ptr, subm, &size); |
| ptr = encode_varint(ptr, e, size); |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_Delimited); |
| } while (arr_ptr != start); |
| e->depth++; |
| return ptr; |
| } |
| } |
| #undef VARINT_CASE |
| |
| if (packed) { |
| ptr = encode_varint(ptr, e, e->limit - ptr - pre_len); |
| ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f), |
| kUpb_WireType_Delimited); |
| } |
| return ptr; |
| } |
| |
| static char* encode_mapentry(char* ptr, upb_encstate* e, uint32_t number, |
| const upb_MiniTable* layout, |
| const upb_MapEntry* ent) { |
| const upb_MiniTableField* key_field = upb_MiniTable_MapKey(layout); |
| const upb_MiniTableField* val_field = upb_MiniTable_MapValue(layout); |
| size_t pre_len = e->limit - ptr; |
| size_t size; |
| ptr = encode_scalar(ptr, e, &ent->v, layout->UPB_PRIVATE(subs), val_field); |
| ptr = encode_scalar(ptr, e, &ent->k, layout->UPB_PRIVATE(subs), key_field); |
| size = (e->limit - ptr) - pre_len; |
| ptr = encode_varint(ptr, e, size); |
| ptr = encode_tag(ptr, e, number, kUpb_WireType_Delimited); |
| return ptr; |
| } |
| |
| static char* encode_map(char* ptr, upb_encstate* e, const upb_Message* msg, |
| const upb_MiniTableSubInternal* subs, |
| const upb_MiniTableField* f) { |
| const upb_Map* map = *UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), const upb_Map*); |
| const upb_MiniTable* layout = _upb_Encoder_GetSubMiniTable(subs, f); |
| UPB_ASSERT(upb_MiniTable_FieldCount(layout) == 2); |
| |
| if (!map || !upb_Map_Size(map)) return ptr; |
| |
| if (e->options & kUpb_EncodeOption_Deterministic) { |
| if (!map->UPB_PRIVATE(is_strtable)) { |
| // For inttable, first encode the array part, then sort the table entries. |
| intptr_t iter = UPB_INTTABLE_BEGIN; |
| while ((size_t)++iter < map->t.inttable.array_size) { |
| upb_value value = map->t.inttable.array[iter]; |
| if (upb_inttable_arrhas(&map->t.inttable, iter)) { |
| upb_MapEntry ent; |
| memcpy(&ent.k, &iter, sizeof(iter)); |
| _upb_map_fromvalue(value, &ent.v, map->val_size); |
| ptr = encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, |
| &ent); |
| } |
| } |
| } |
| _upb_sortedmap sorted; |
| _upb_mapsorter_pushmap( |
| &e->sorter, layout->UPB_PRIVATE(fields)[0].UPB_PRIVATE(descriptortype), |
| map, &sorted); |
| upb_MapEntry ent; |
| while (_upb_sortedmap_next(&e->sorter, map, &sorted, &ent)) { |
| ptr = encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent); |
| } |
| _upb_mapsorter_popmap(&e->sorter, &sorted); |
| } else { |
| upb_value val; |
| if (map->UPB_PRIVATE(is_strtable)) { |
| intptr_t iter = UPB_STRTABLE_BEGIN; |
| upb_StringView strkey; |
| while (upb_strtable_next2(&map->t.strtable, &strkey, &val, &iter)) { |
| upb_MapEntry ent; |
| _upb_map_fromkey(strkey, &ent.k, map->key_size); |
| _upb_map_fromvalue(val, &ent.v, map->val_size); |
| ptr = |
| encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent); |
| } |
| } else { |
| intptr_t iter = UPB_INTTABLE_BEGIN; |
| uintptr_t intkey = 0; |
| while (upb_inttable_next(&map->t.inttable, &intkey, &val, &iter)) { |
| upb_MapEntry ent; |
| memcpy(&ent.k, &intkey, map->key_size); |
| _upb_map_fromvalue(val, &ent.v, map->val_size); |
| ptr = |
| encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent); |
| } |
| } |
| } |
| return ptr; |
| } |
| |
| static bool encode_shouldencode(const upb_Message* msg, |
| const upb_MiniTableField* f) { |
| if (f->presence == 0) { |
| // Proto3 presence or map/array. |
| const void* mem = UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), void); |
| switch (UPB_PRIVATE(_upb_MiniTableField_GetRep)(f)) { |
| case kUpb_FieldRep_1Byte: { |
| char ch; |
| memcpy(&ch, mem, 1); |
| return ch != 0; |
| } |
| case kUpb_FieldRep_4Byte: { |
| uint32_t u32; |
| memcpy(&u32, mem, 4); |
| return u32 != 0; |
| } |
| case kUpb_FieldRep_8Byte: { |
| uint64_t u64; |
| memcpy(&u64, mem, 8); |
| return u64 != 0; |
| } |
| case kUpb_FieldRep_StringView: { |
| const upb_StringView* str = (const upb_StringView*)mem; |
| return str->size != 0; |
| } |
| default: |
| UPB_UNREACHABLE(); |
| } |
| } else if (UPB_PRIVATE(_upb_MiniTableField_HasHasbit)(f)) { |
| // Proto2 presence: hasbit. |
| return UPB_PRIVATE(_upb_Message_GetHasbit)(msg, f); |
| } else { |
| // Field is in a oneof. |
| return UPB_PRIVATE(_upb_Message_GetOneofCase)(msg, f) == |
| upb_MiniTableField_Number(f); |
| } |
| } |
| |
| static char* encode_field(char* ptr, upb_encstate* e, const upb_Message* msg, |
| const upb_MiniTableSubInternal* subs, |
| const upb_MiniTableField* field) { |
| switch (UPB_PRIVATE(_upb_MiniTableField_Mode)(field)) { |
| case kUpb_FieldMode_Array: |
| return encode_array(ptr, e, msg, subs, field); |
| case kUpb_FieldMode_Map: |
| return encode_map(ptr, e, msg, subs, field); |
| case kUpb_FieldMode_Scalar: |
| return encode_scalar(ptr, e, |
| UPB_PTR_AT(msg, field->UPB_PRIVATE(offset), void), |
| subs, field); |
| default: |
| UPB_UNREACHABLE(); |
| } |
| } |
| |
| static char* encode_msgset_item(char* ptr, upb_encstate* e, |
| const upb_MiniTableExtension* ext, |
| const upb_MessageValue ext_val) { |
| size_t size; |
| ptr = encode_tag(ptr, e, kUpb_MsgSet_Item, kUpb_WireType_EndGroup); |
| ptr = encode_message(ptr, e, ext_val.msg_val, |
| upb_MiniTableExtension_GetSubMessage(ext), &size); |
| ptr = encode_varint(ptr, e, size); |
| ptr = encode_tag(ptr, e, kUpb_MsgSet_Message, kUpb_WireType_Delimited); |
| ptr = encode_varint(ptr, e, upb_MiniTableExtension_Number(ext)); |
| ptr = encode_tag(ptr, e, kUpb_MsgSet_TypeId, kUpb_WireType_Varint); |
| ptr = encode_tag(ptr, e, kUpb_MsgSet_Item, kUpb_WireType_StartGroup); |
| return ptr; |
| } |
| |
| static char* encode_ext(char* ptr, upb_encstate* e, |
| const upb_MiniTableExtension* ext, |
| upb_MessageValue ext_val, bool is_message_set) { |
| if (UPB_UNLIKELY(is_message_set)) { |
| ptr = encode_msgset_item(ptr, e, ext, ext_val); |
| } else { |
| upb_MiniTableSubInternal sub; |
| if (upb_MiniTableField_IsSubMessage(&ext->UPB_PRIVATE(field))) { |
| sub.UPB_PRIVATE(submsg) = &ext->UPB_PRIVATE(sub).UPB_PRIVATE(submsg); |
| } else { |
| sub.UPB_PRIVATE(subenum) = ext->UPB_PRIVATE(sub).UPB_PRIVATE(subenum); |
| } |
| ptr = encode_field(ptr, e, &ext_val.UPB_PRIVATE(ext_msg_val), &sub, |
| &ext->UPB_PRIVATE(field)); |
| } |
| return ptr; |
| } |
| |
| static char* encode_exts(char* ptr, upb_encstate* e, const upb_MiniTable* m, |
| const upb_Message* msg) { |
| if (m->UPB_PRIVATE(ext) == kUpb_ExtMode_NonExtendable) return ptr; |
| |
| upb_Message_Internal* in = UPB_PRIVATE(_upb_Message_GetInternal)(msg); |
| if (!in) return ptr; |
| |
| /* Encode all extensions together. Unlike C++, we do not attempt to keep |
| * these in field number order relative to normal fields or even to each |
| * other. */ |
| uintptr_t iter = kUpb_Message_ExtensionBegin; |
| const upb_MiniTableExtension* ext; |
| upb_MessageValue ext_val; |
| if (!UPB_PRIVATE(_upb_Message_NextExtensionReverse)(msg, &ext, &ext_val, |
| &iter)) { |
| // Message has no extensions. |
| return ptr; |
| } |
| |
| if (e->options & kUpb_EncodeOption_Deterministic) { |
| _upb_sortedmap sorted; |
| if (!_upb_mapsorter_pushexts(&e->sorter, in, &sorted)) { |
| // TODO: b/378744096 - handle alloc failure |
| } |
| const upb_Extension* ext; |
| while (_upb_sortedmap_nextext(&e->sorter, &sorted, &ext)) { |
| ptr = encode_ext(ptr, e, ext->ext, ext->data, |
| m->UPB_PRIVATE(ext) == kUpb_ExtMode_IsMessageSet); |
| } |
| _upb_mapsorter_popmap(&e->sorter, &sorted); |
| } else { |
| do { |
| ptr = encode_ext(ptr, e, ext, ext_val, |
| m->UPB_PRIVATE(ext) == kUpb_ExtMode_IsMessageSet); |
| } while (UPB_PRIVATE(_upb_Message_NextExtensionReverse)(msg, &ext, &ext_val, |
| &iter)); |
| } |
| return ptr; |
| } |
| |
| static char* encode_message(char* ptr, upb_encstate* e, const upb_Message* msg, |
| const upb_MiniTable* m, size_t* size) { |
| size_t pre_len = e->limit - ptr; |
| |
| if (e->options & kUpb_EncodeOption_CheckRequired) { |
| if (m->UPB_PRIVATE(required_count)) { |
| if (!UPB_PRIVATE(_upb_Message_IsInitializedShallow)(msg, m)) { |
| encode_err(e, kUpb_EncodeStatus_MissingRequired); |
| } |
| } |
| } |
| |
| if ((e->options & kUpb_EncodeOption_SkipUnknown) == 0) { |
| size_t unknown_size = 0; |
| uintptr_t iter = kUpb_Message_UnknownBegin; |
| upb_StringView unknown; |
| // Need to write in reverse order, but iteration is in-order; scan to |
| // reserve capacity up front, then write in-order |
| while (upb_Message_NextUnknown(msg, &unknown, &iter)) { |
| unknown_size += unknown.size; |
| } |
| if (unknown_size != 0) { |
| ptr = encode_reserve(ptr, e, unknown_size); |
| char* tmp_ptr = ptr; |
| iter = kUpb_Message_UnknownBegin; |
| while (upb_Message_NextUnknown(msg, &unknown, &iter)) { |
| memcpy(tmp_ptr, unknown.data, unknown.size); |
| tmp_ptr += unknown.size; |
| } |
| } |
| } |
| |
| ptr = encode_exts(ptr, e, m, msg); |
| |
| if (upb_MiniTable_FieldCount(m)) { |
| const upb_MiniTableField* f = |
| &m->UPB_PRIVATE(fields)[m->UPB_PRIVATE(field_count)]; |
| const upb_MiniTableField* first = &m->UPB_PRIVATE(fields)[0]; |
| while (f != first) { |
| f--; |
| if (encode_shouldencode(msg, f)) { |
| ptr = encode_field(ptr, e, msg, m->UPB_PRIVATE(subs), f); |
| } |
| } |
| } |
| |
| *size = (e->limit - ptr) - pre_len; |
| return ptr; |
| } |
| |
| static upb_EncodeStatus upb_Encoder_Encode(char* ptr, |
| upb_encstate* const encoder, |
| const upb_Message* const msg, |
| const upb_MiniTable* const l, |
| char** const buf, size_t* const size, |
| bool prepend_len) { |
| // Unfortunately we must continue to perform hackery here because there are |
| // code paths which blindly copy the returned pointer without bothering to |
| // check for errors until much later (b/235839510). So we still set *buf to |
| // NULL on error and we still set it to non-NULL on a successful empty result. |
| if (UPB_SETJMP(encoder->err) == 0) { |
| size_t encoded_msg_size; |
| ptr = encode_message(ptr, encoder, msg, l, &encoded_msg_size); |
| if (prepend_len) { |
| ptr = encode_varint(ptr, encoder, encoded_msg_size); |
| } |
| *size = encoder->limit - ptr; |
| if (*size == 0) { |
| static char ch; |
| *buf = &ch; |
| } else { |
| UPB_ASSERT(ptr); |
| *buf = ptr; |
| } |
| } else { |
| UPB_ASSERT(encoder->status != kUpb_EncodeStatus_Ok); |
| *buf = NULL; |
| *size = 0; |
| } |
| |
| _upb_mapsorter_destroy(&encoder->sorter); |
| return encoder->status; |
| } |
| |
| static uint16_t upb_EncodeOptions_GetMaxDepth(uint32_t options) { |
| return options >> 16; |
| } |
| |
| uint16_t upb_EncodeOptions_GetEffectiveMaxDepth(uint32_t options) { |
| uint16_t max_depth = upb_EncodeOptions_GetMaxDepth(options); |
| return max_depth ? max_depth : kUpb_WireFormat_DefaultDepthLimit; |
| } |
| |
| static upb_EncodeStatus _upb_Encode(const upb_Message* msg, |
| const upb_MiniTable* l, int options, |
| upb_Arena* arena, char** buf, size_t* size, |
| bool prepend_len) { |
| upb_encstate e; |
| |
| e.status = kUpb_EncodeStatus_Ok; |
| e.arena = arena; |
| e.buf = NULL; |
| e.limit = NULL; |
| e.depth = upb_EncodeOptions_GetEffectiveMaxDepth(options); |
| e.options = options; |
| _upb_mapsorter_init(&e.sorter); |
| |
| return upb_Encoder_Encode(NULL, &e, msg, l, buf, size, prepend_len); |
| } |
| |
| upb_EncodeStatus upb_Encode(const upb_Message* msg, const upb_MiniTable* l, |
| int options, upb_Arena* arena, char** buf, |
| size_t* size) { |
| return _upb_Encode(msg, l, options, arena, buf, size, false); |
| } |
| |
| upb_EncodeStatus upb_EncodeLengthPrefixed(const upb_Message* msg, |
| const upb_MiniTable* l, int options, |
| upb_Arena* arena, char** buf, |
| size_t* size) { |
| return _upb_Encode(msg, l, options, arena, buf, size, true); |
| } |
| |
| const char* upb_EncodeStatus_String(upb_EncodeStatus status) { |
| switch (status) { |
| case kUpb_EncodeStatus_Ok: |
| return "Ok"; |
| case kUpb_EncodeStatus_MissingRequired: |
| return "Missing required field"; |
| case kUpb_EncodeStatus_MaxDepthExceeded: |
| return "Max depth exceeded"; |
| case kUpb_EncodeStatus_OutOfMemory: |
| return "Arena alloc failed"; |
| default: |
| return "Unknown encode status"; |
| } |
| } |