blob: 3b67547f520de53a01a9dac0d8f39f74544364cd [file]
// Protocol Buffers - Google's data interchange format
// Copyright 2023 Google LLC. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd
// We encode backwards, to avoid pre-computing lengths (one-pass encode).
#include "upb/wire/internal/encoder.h"
#include <setjmp.h>
#include <stddef.h>
#include <stdint.h>
#include <string.h>
#include "upb/base/descriptor_constants.h"
#include "upb/base/internal/endian.h"
#include "upb/base/string_view.h"
#include "upb/hash/common.h"
#include "upb/hash/int_table.h"
#include "upb/hash/str_table.h"
#include "upb/mem/arena.h"
#include "upb/message/array.h"
#include "upb/message/internal/accessors.h"
#include "upb/message/internal/extension.h"
#include "upb/message/internal/map.h"
#include "upb/message/internal/map_entry.h"
#include "upb/message/internal/map_sorter.h"
#include "upb/message/internal/message.h"
#include "upb/message/map.h"
#include "upb/message/message.h"
#include "upb/mini_table/extension.h"
#include "upb/mini_table/field.h"
#include "upb/mini_table/internal/field.h"
#include "upb/mini_table/internal/message.h"
#include "upb/mini_table/message.h"
#include "upb/port/def.inc"
#include "upb/wire/encode.h"
#include "upb/wire/internal/back_alloc.h"
#include "upb/wire/internal/constants.h"
#include "upb/wire/types.h"
#include "upb/wire/writer.h"
// Must be last.
#include "upb/port/def.inc"
UPB_NOINLINE bool _upb_Encoder_AddMapEntryUnknown(
upb_Message* msg, const upb_MiniTableField* field, upb_Message* ent_msg,
const upb_MiniTable* entry, upb_Arena* arena) {
char* buf;
size_t size;
upb_EncodeStatus status =
_upb_Encode(ent_msg, entry, 0, arena, &buf, &size, false);
if (status != kUpb_EncodeStatus_Ok) {
return false;
}
char delim_buf[2 * kUpb_Encoder_EncodeVarint32MaxSize];
char* delim_end = delim_buf;
uint32_t tag =
((uint32_t)field->UPB_PRIVATE(number) << 3) | kUpb_WireType_Delimited;
delim_end = upb_Encoder_EncodeVarint32(tag, delim_end);
delim_end = upb_Encoder_EncodeVarint32(size, delim_end);
upb_StringView unknown[] = {
{delim_buf, delim_end - delim_buf},
{buf, size},
};
return UPB_PRIVATE(_upb_Message_AddUnknownV)(msg, arena, unknown, 2);
}
static uint32_t encode_zz32(int32_t n) {
return ((uint32_t)n << 1) ^ (n >> 31);
}
static uint64_t encode_zz64(int64_t n) {
return ((uint64_t)n << 1) ^ (n >> 63);
}
UPB_NORETURN static void encode_err(upb_encstate* e, upb_EncodeStatus s) {
UPB_ASSERT(s != kUpb_EncodeStatus_Ok);
e->status = s;
UPB_LONGJMP(*e->err, 1);
}
UPB_NOINLINE static char* encode_growbuffer(char* ptr, upb_encstate* e,
size_t bytes) {
ptr = upb_BackAlloc_Grow(&e->alloc, ptr, bytes);
if (ptr == NULL) {
encode_err(e, kUpb_EncodeStatus_OutOfMemory);
}
return ptr;
}
// Call to ensure that at least `bytes` bytes are available for writing at
// ptr.
UPB_FORCEINLINE
char* encode_reserve(char* ptr, upb_encstate* e, size_t bytes) {
if (upb_BackAlloc_HasBytes(&e->alloc, ptr, bytes)) {
return ptr - bytes;
}
return encode_growbuffer(ptr, e, bytes);
}
static char* encode_bytes_unchecked(char* ptr, upb_encstate* e,
const void* data, size_t len) {
if (len == 0) return ptr; /* memcpy() with zero size is UB */
ptr -= len;
memcpy(ptr, data, len);
return ptr;
}
/* Writes the given bytes to the buffer, handling reserve/advance. */
static char* encode_bytes(char* ptr, upb_encstate* e, const void* data,
size_t len) {
if (len == 0) return ptr; /* memcpy() with zero size is UB */
ptr = encode_reserve(ptr, e, len);
memcpy(ptr, data, len);
return ptr;
}
static char* encode_fixed64_unchecked(char* ptr, upb_encstate* e,
uint64_t val) {
val = upb_BigEndian64(val);
return encode_bytes_unchecked(ptr, e, &val, sizeof(uint64_t));
}
static char* encode_fixed32_unchecked(char* ptr, upb_encstate* e,
uint32_t val) {
val = upb_BigEndian32(val);
return encode_bytes_unchecked(ptr, e, &val, sizeof(uint32_t));
}
#define UPB_PB_VARINT_MAX_LEN 10
#define UPB_PB_VARINT32_MAX_LEN 5
#if UPB_ARM64_ASM
// Each arm64 instruction encodes to 4 bytes, and it takes two intructions
// to process each byte of output, so we branch ahead by (4 + 4) * skip to
// avoid the remaining bytes. When BTI is on, we need to use specific
// "landing pad" instructions, so we pad those with nop to make it a power
// of 2, skipping 16 bytes at each stage instead of 8. This carries some
// overhead especially on in-order cores so they're not included unless
// building with branch protection.
#if UPB_ARM64_BTI_DEFAULT
// BTI is used with jc targets here because we don't control which register will
// be used for addr; if it's x16 or x17 a `br` is treated like a call.
#define UPB_BTI_JC "bti jc\n"
#define UPB_BTI_NOP "nop\n"
#define UPB_BTI_SHIFT_IMM "4\n"
#else
#define UPB_BTI_JC
#define UPB_BTI_NOP
#define UPB_BTI_SHIFT_IMM "3\n"
#endif
UPB_NOINLINE static char* encode_longvarint(char* ptr, upb_encstate* e,
uint64_t val) {
ptr = encode_reserve(ptr, e, UPB_PB_VARINT_MAX_LEN);
uint64_t clz;
__asm__("clz %[cnt], %[val]\n" : [cnt] "=r"(clz) : [val] "r"(val));
uint32_t skip =
UPB_PRIVATE(upb_WireWriter_VarintUnusedSizeFromLeadingZeros64)(clz);
ptr += skip;
uint64_t addr, mask;
__asm__ volatile(
// Formatter keeps merging short lines
// clang-format off
"adr %[addr], 0f\n"
"add %[addr], %[addr], %[cnt], lsl #" UPB_BTI_SHIFT_IMM
"mov %w[mask], #0x80\n"
"br %[addr]\n"
// Work around llvm/llvm-project#47432, where alignment directives inside
// functions crash the compiler when generating SEH info on windows.
#ifndef __SEH__
".p2align " UPB_BTI_SHIFT_IMM
#endif
"0:\n"
// We don't need addr any more, but we've got the register for our whole
// assembly block so we'll use it as scratch to store the shift+masked
// values before storing them.
// The following stores are unsigned offset stores:
// strb Wt, [Xn, #imm]
UPB_BTI_JC
"orr %[addr], %[mask], %[val], lsr #56\n"
"strb %w[addr], [%[ptr], #8]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %[addr], %[mask], %[val], lsr #49\n"
"strb %w[addr], [%[ptr], #7]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %[addr], %[mask], %[val], lsr #42\n"
"strb %w[addr], [%[ptr], #6]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %[addr], %[mask], %[val], lsr #35\n"
"strb %w[addr], [%[ptr], #5]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %[addr], %[mask], %[val], lsr #28\n"
"strb %w[addr], [%[ptr], #4]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %w[addr], %w[mask], %w[val], lsr #21\n"
"strb %w[addr], [%[ptr], #3]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %w[addr], %w[mask], %w[val], lsr #14\n"
"strb %w[addr], [%[ptr], #2]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %w[addr], %w[mask], %w[val], lsr #7\n"
"strb %w[addr], [%[ptr], #1]\n"
UPB_BTI_NOP
UPB_BTI_JC
"orr %w[addr], %w[val], #0x80\n"
"strb %w[addr], [%[ptr]]\n"
UPB_BTI_NOP
UPB_BTI_JC
// clang-format on
: [addr] "=&r"(addr), [mask] "=&r"(mask)
: [val] "r"(val), [ptr] "r"(ptr), [cnt] "r"((uint64_t)skip)
: "memory");
uint32_t continuations = UPB_PB_VARINT_MAX_LEN - 1 - skip;
// msan can't instrument stores in inline assembly
UPB_PRIVATE(upb_Xsan_MarkInitialized)(ptr, continuations);
// Encode the final byte after the continuation bytes.
ptr[continuations] = val >> (7 * continuations);
return ptr;
}
#undef UPB_BTI_JC
#undef UPB_BTI_NOP
#undef UPB_BTI_SHIFT_IMM
#else
UPB_NOINLINE
static char* encode_longvarint(char* ptr, upb_encstate* e, uint64_t val) {
ptr = encode_reserve(ptr, e, UPB_PB_VARINT_MAX_LEN);
size_t len = 0;
do {
uint8_t byte = val & 0x7fU;
val >>= 7;
if (val) byte |= 0x80U;
ptr[len++] = byte;
} while (val);
char* start = ptr + UPB_PB_VARINT_MAX_LEN - len;
memmove(start, ptr, len);
return start;
}
#endif
UPB_FORCEINLINE
char* encode_varint_unchecked(char* ptr, upb_encstate* e, uint64_t val) {
if (val < 128) {
--ptr;
*ptr = val;
return ptr;
} else {
return encode_longvarint(ptr, e, val);
}
}
UPB_FORCEINLINE
char* encode_varint(char* ptr, upb_encstate* e, uint64_t val) {
if (val < 128 && upb_BackAlloc_HasBytes(&e->alloc, ptr, 1)) {
--ptr;
*ptr = val;
return ptr;
} else {
return encode_longvarint(ptr, e, val);
}
}
UPB_NOINLINE
char* encode_longlength(char* ptr, upb_encstate* e, uint64_t val) {
if (val > INT32_MAX) {
encode_err(e, kUpb_EncodeStatus_MaxSizeExceeded);
}
return encode_longvarint(ptr, e, val);
}
UPB_FORCEINLINE
char* encode_length(char* ptr, upb_encstate* e, uint64_t val) {
if (val < 128 && upb_BackAlloc_HasBytes(&e->alloc, ptr, 1)) {
--ptr;
*ptr = val;
return ptr;
} else {
return encode_longlength(ptr, e, val);
}
}
UPB_FORCEINLINE
char* encode_length_unchecked(char* ptr, upb_encstate* e, uint64_t val) {
if (val < 128) {
--ptr;
*ptr = val;
return ptr;
} else {
return encode_longlength(ptr, e, val);
}
}
static char* encode_double_unchecked(char* ptr, upb_encstate* e, double d) {
uint64_t u64;
UPB_STATIC_ASSERT(sizeof(double) == sizeof(uint64_t), "bad double size");
memcpy(&u64, &d, sizeof(uint64_t));
return encode_fixed64_unchecked(ptr, e, u64);
}
static char* encode_float_unchecked(char* ptr, upb_encstate* e, float d) {
uint32_t u32;
UPB_STATIC_ASSERT(sizeof(float) == sizeof(uint32_t), "bad float size");
memcpy(&u32, &d, sizeof(uint32_t));
return encode_fixed32_unchecked(ptr, e, u32);
}
static char* encode_tag_unchecked(char* ptr, upb_encstate* e,
uint32_t field_number, uint8_t wire_type) {
return encode_varint_unchecked(ptr, e, (field_number << 3) | wire_type);
}
static char* encode_tag(char* ptr, upb_encstate* e, uint32_t field_number,
uint8_t wire_type) {
return encode_varint(ptr, e, (field_number << 3) | wire_type);
}
static char* encode_fixedarray(char* ptr, upb_encstate* e, const upb_Array* arr,
size_t elem_size, uint32_t tag) {
size_t bytes = upb_Array_Size(arr) * elem_size;
const char* data = upb_Array_DataPtr(arr);
const char* arr_ptr = data + bytes - elem_size;
if (tag || !upb_IsLittleEndian()) {
while (true) {
if (elem_size == 4) {
uint32_t val;
memcpy(&val, arr_ptr, sizeof(val));
val = upb_BigEndian32(val);
ptr = encode_bytes(ptr, e, &val, elem_size);
} else {
UPB_ASSERT(elem_size == 8);
uint64_t val;
memcpy(&val, arr_ptr, sizeof(val));
val = upb_BigEndian64(val);
ptr = encode_bytes(ptr, e, &val, elem_size);
}
if (tag) {
ptr = encode_varint(ptr, e, tag);
}
if (arr_ptr == data) break;
arr_ptr -= elem_size;
}
return ptr;
} else {
return encode_bytes(ptr, e, data, bytes);
}
}
static char* encode_scalar(char* ptr, upb_encstate* e, const void* field_mem,
const upb_MiniTableField* f) {
// Max size is tag + 10 bytes for max varint or 8 for largest fixed size
#define CASE(ctype, type, wtype, encodeval) \
{ \
const size_t bytes = UPB_PB_VARINT32_MAX_LEN + UPB_PB_VARINT_MAX_LEN; \
ptr = encode_reserve(ptr, e, bytes); \
ptr += bytes; \
const ctype val = *(const ctype*)field_mem; \
ptr = encode_##type##_unchecked(ptr, e, encodeval); \
return encode_tag_unchecked(ptr, e, upb_MiniTableField_Number(f), wtype); \
}
switch (f->UPB_PRIVATE(descriptortype)) {
case kUpb_FieldType_Double:
CASE(double, double, kUpb_WireType_64Bit, val);
case kUpb_FieldType_Float:
CASE(float, float, kUpb_WireType_32Bit, val);
case kUpb_FieldType_Int64:
case kUpb_FieldType_UInt64:
CASE(uint64_t, varint, kUpb_WireType_Varint, val);
case kUpb_FieldType_UInt32:
CASE(uint32_t, varint, kUpb_WireType_Varint, val);
case kUpb_FieldType_Int32:
case kUpb_FieldType_Enum:
CASE(int32_t, varint, kUpb_WireType_Varint, (int64_t)val);
case kUpb_FieldType_SFixed64:
case kUpb_FieldType_Fixed64:
CASE(uint64_t, fixed64, kUpb_WireType_64Bit, val);
case kUpb_FieldType_Fixed32:
case kUpb_FieldType_SFixed32:
CASE(uint32_t, fixed32, kUpb_WireType_32Bit, val);
case kUpb_FieldType_Bool:
CASE(bool, varint, kUpb_WireType_Varint, val);
case kUpb_FieldType_SInt32:
CASE(int32_t, varint, kUpb_WireType_Varint, encode_zz32(val));
case kUpb_FieldType_SInt64:
CASE(int64_t, varint, kUpb_WireType_Varint, encode_zz64(val));
case kUpb_FieldType_String:
case kUpb_FieldType_Bytes: {
upb_StringView view = *(upb_StringView*)field_mem;
const size_t max_size =
UPB_PB_VARINT32_MAX_LEN + UPB_PB_VARINT32_MAX_LEN + view.size;
ptr = encode_reserve(ptr, e, max_size);
ptr += max_size;
ptr = encode_bytes_unchecked(ptr, e, view.data, view.size);
ptr = encode_length_unchecked(ptr, e, view.size);
return encode_tag_unchecked(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_Delimited);
}
case kUpb_FieldType_Group: {
size_t size;
upb_Message* submsg = *(upb_Message**)field_mem;
const upb_MiniTable* subm = upb_MiniTable_GetSubMessageTable(f);
if (submsg == 0) {
return ptr;
}
if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded);
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_EndGroup);
ptr = encode_message(ptr, e, submsg, subm, &size);
e->depth++;
return encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_StartGroup);
}
case kUpb_FieldType_Message: {
size_t size;
upb_Message* submsg = *(upb_Message**)field_mem;
const upb_MiniTable* subm = upb_MiniTable_GetSubMessageTable(f);
if (submsg == 0) {
return ptr;
}
if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded);
ptr = encode_message(ptr, e, submsg, subm, &size);
e->depth++;
size_t max_size = UPB_PB_VARINT32_MAX_LEN + UPB_PB_VARINT32_MAX_LEN;
ptr = encode_reserve(ptr, e, max_size);
ptr += max_size;
ptr = encode_length_unchecked(ptr, e, size);
return encode_tag_unchecked(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_Delimited);
}
default:
UPB_UNREACHABLE();
}
#undef CASE
}
static char* encode_array(char* ptr, upb_encstate* e, const upb_Message* msg,
const upb_MiniTableField* f) {
const upb_Array* arr = *UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), upb_Array*);
bool packed = upb_MiniTableField_IsPacked(f);
size_t pre_len = upb_BackAlloc_Size(&e->alloc, ptr);
if (arr == NULL || upb_Array_Size(arr) == 0) {
return ptr;
}
#define VARINT_CASE(ctype, encode) \
{ \
const ctype* start = upb_Array_DataPtr(arr); \
const ctype* arr_ptr = start + upb_Array_Size(arr); \
if (packed) { \
do { \
arr_ptr--; \
ptr = encode_varint(ptr, e, encode); \
} while (arr_ptr != start); \
} else { \
uint32_t number = upb_MiniTableField_Number(f); \
do { \
arr_ptr--; \
ptr = encode_varint(ptr, e, encode); \
ptr = encode_tag(ptr, e, number, kUpb_WireType_Varint); \
} while (arr_ptr != start); \
} \
} \
break;
#define TAG(wire_type) (packed ? 0 : (f->UPB_PRIVATE(number) << 3 | wire_type))
switch (f->UPB_PRIVATE(descriptortype)) {
case kUpb_FieldType_Double:
ptr = encode_fixedarray(ptr, e, arr, sizeof(double),
TAG(kUpb_WireType_64Bit));
break;
case kUpb_FieldType_Float:
ptr = encode_fixedarray(ptr, e, arr, sizeof(float),
TAG(kUpb_WireType_32Bit));
break;
case kUpb_FieldType_SFixed64:
case kUpb_FieldType_Fixed64:
ptr = encode_fixedarray(ptr, e, arr, sizeof(uint64_t),
TAG(kUpb_WireType_64Bit));
break;
case kUpb_FieldType_Fixed32:
case kUpb_FieldType_SFixed32:
ptr = encode_fixedarray(ptr, e, arr, sizeof(uint32_t),
TAG(kUpb_WireType_32Bit));
break;
case kUpb_FieldType_Int64:
case kUpb_FieldType_UInt64:
VARINT_CASE(uint64_t, *arr_ptr);
case kUpb_FieldType_UInt32:
VARINT_CASE(uint32_t, *arr_ptr);
case kUpb_FieldType_Int32:
case kUpb_FieldType_Enum:
VARINT_CASE(int32_t, (int64_t)*arr_ptr);
case kUpb_FieldType_Bool:
VARINT_CASE(bool, *arr_ptr);
case kUpb_FieldType_SInt32:
VARINT_CASE(int32_t, encode_zz32(*arr_ptr));
case kUpb_FieldType_SInt64:
VARINT_CASE(int64_t, encode_zz64(*arr_ptr));
case kUpb_FieldType_String:
case kUpb_FieldType_Bytes: {
const upb_StringView* start = upb_Array_DataPtr(arr);
const upb_StringView* str_ptr = start + upb_Array_Size(arr);
do {
str_ptr--;
ptr = encode_bytes(ptr, e, str_ptr->data, str_ptr->size);
ptr = encode_length(ptr, e, str_ptr->size);
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_Delimited);
} while (str_ptr != start);
return ptr;
}
case kUpb_FieldType_Group: {
const upb_Message* const* start = upb_Array_DataPtr(arr);
const upb_Message* const* arr_ptr = start + upb_Array_Size(arr);
const upb_MiniTable* subm = upb_MiniTable_GetSubMessageTable(f);
if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded);
do {
size_t size;
arr_ptr--;
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_EndGroup);
ptr = encode_message(ptr, e, *arr_ptr, subm, &size);
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_StartGroup);
} while (arr_ptr != start);
e->depth++;
return ptr;
}
case kUpb_FieldType_Message: {
const upb_Message* const* start = upb_Array_DataPtr(arr);
const upb_Message* const* arr_ptr = start + upb_Array_Size(arr);
const upb_MiniTable* subm = upb_MiniTable_GetSubMessageTable(f);
if (--e->depth == 0) encode_err(e, kUpb_EncodeStatus_MaxDepthExceeded);
do {
size_t size;
arr_ptr--;
ptr = encode_message(ptr, e, *arr_ptr, subm, &size);
ptr = encode_length(ptr, e, size);
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_Delimited);
} while (arr_ptr != start);
e->depth++;
return ptr;
}
}
#undef VARINT_CASE
if (packed) {
ptr = encode_length(ptr, e, upb_BackAlloc_Size(&e->alloc, ptr) - pre_len);
ptr = encode_tag(ptr, e, upb_MiniTableField_Number(f),
kUpb_WireType_Delimited);
}
return ptr;
}
static char* encode_mapentry(char* ptr, upb_encstate* e, uint32_t number,
const upb_MiniTable* layout,
const upb_MapEntry* ent) {
const upb_MiniTableField* key_field = upb_MiniTable_MapKey(layout);
const upb_MiniTableField* val_field = upb_MiniTable_MapValue(layout);
size_t pre_len = upb_BackAlloc_Size(&e->alloc, ptr);
size_t size;
ptr = encode_scalar(ptr, e, &ent->v, val_field);
ptr = encode_scalar(ptr, e, &ent->k, key_field);
size = upb_BackAlloc_Size(&e->alloc, ptr) - pre_len;
ptr = encode_length(ptr, e, size);
ptr = encode_tag(ptr, e, number, kUpb_WireType_Delimited);
return ptr;
}
static char* encode_map(char* ptr, upb_encstate* e, const upb_Message* msg,
const upb_MiniTableField* f) {
const upb_Map* map = *UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), const upb_Map*);
const upb_MiniTable* layout = upb_MiniTable_MapEntrySubMessage(f);
UPB_ASSERT(upb_MiniTable_FieldCount(layout) == 2);
if (!map || !upb_Map_Size(map)) return ptr;
if (e->options & kUpb_EncodeOption_Deterministic) {
_upb_sortedmap sorted;
_upb_mapsorter_pushmap(
&e->sorter, layout->UPB_PRIVATE(fields)[0].UPB_PRIVATE(descriptortype),
map, &sorted);
upb_MapEntry ent;
while (_upb_sortedmap_next(&e->sorter, map, &sorted, &ent)) {
ptr = encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent);
}
_upb_mapsorter_popmap(&e->sorter, &sorted);
} else {
upb_value val;
if (map->UPB_PRIVATE(is_strtable)) {
intptr_t iter = UPB_STRTABLE_BEGIN;
upb_StringView strkey;
while (upb_strtable_next2(&map->t.strtable, &strkey, &val, &iter)) {
upb_MapEntry ent;
_upb_map_fromkey(strkey, &ent.k, map->key_size);
_upb_map_fromvalue(val, &ent.v, map->val_size);
ptr =
encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent);
}
} else {
intptr_t iter = UPB_INTTABLE_BEGIN;
uintptr_t intkey = 0;
while (upb_inttable_next(&map->t.inttable, &intkey, &val, &iter)) {
upb_MapEntry ent;
memcpy(&ent.k, &intkey, map->key_size);
_upb_map_fromvalue(val, &ent.v, map->val_size);
ptr =
encode_mapentry(ptr, e, upb_MiniTableField_Number(f), layout, &ent);
}
}
}
return ptr;
}
static bool encode_shouldencode(const upb_Message* msg,
const upb_MiniTableField* f) {
if (f->presence == 0) {
// Proto3 presence or map/array.
const void* mem = UPB_PTR_AT(msg, f->UPB_PRIVATE(offset), void);
switch (UPB_PRIVATE(_upb_MiniTableField_GetRep)(f)) {
case kUpb_FieldRep_1Byte: {
char ch;
memcpy(&ch, mem, 1);
return ch != 0;
}
case kUpb_FieldRep_4Byte: {
uint32_t u32;
memcpy(&u32, mem, 4);
return u32 != 0;
}
case kUpb_FieldRep_8Byte: {
uint64_t u64;
memcpy(&u64, mem, 8);
return u64 != 0;
}
case kUpb_FieldRep_StringView: {
const upb_StringView* str = (const upb_StringView*)mem;
return str->size != 0;
}
default:
UPB_UNREACHABLE();
}
} else if (UPB_PRIVATE(_upb_MiniTableField_HasHasbit)(f)) {
// Proto2 presence: hasbit.
return UPB_PRIVATE(_upb_Message_GetHasbit)(msg, f);
} else {
// Field is in a oneof.
return UPB_PRIVATE(_upb_Message_GetOneofCase)(msg, f) ==
upb_MiniTableField_Number(f);
}
}
static char* encode_field(char* ptr, upb_encstate* e, const upb_Message* msg,
const upb_MiniTableField* field) {
switch (UPB_PRIVATE(_upb_MiniTableField_Mode)(field)) {
case kUpb_FieldMode_Array:
return encode_array(ptr, e, msg, field);
case kUpb_FieldMode_Map:
return encode_map(ptr, e, msg, field);
case kUpb_FieldMode_Scalar:
return encode_scalar(
ptr, e, UPB_PTR_AT(msg, field->UPB_PRIVATE(offset), void), field);
default:
UPB_UNREACHABLE();
}
}
static char* encode_msgset_item(char* ptr, upb_encstate* e,
const upb_MiniTableExtension* ext,
const upb_MessageValue ext_val) {
size_t size;
ptr = encode_tag(ptr, e, kUpb_MsgSet_Item, kUpb_WireType_EndGroup);
ptr = encode_message(ptr, e, ext_val.msg_val,
upb_MiniTableExtension_GetSubMessage(ext), &size);
ptr = encode_varint(ptr, e, size);
ptr = encode_tag(ptr, e, kUpb_MsgSet_Message, kUpb_WireType_Delimited);
ptr = encode_varint(ptr, e, upb_MiniTableExtension_Number(ext));
ptr = encode_tag(ptr, e, kUpb_MsgSet_TypeId, kUpb_WireType_Varint);
ptr = encode_tag(ptr, e, kUpb_MsgSet_Item, kUpb_WireType_StartGroup);
return ptr;
}
static char* encode_ext(char* ptr, upb_encstate* e,
const upb_MiniTableExtension* ext,
upb_MessageValue ext_val, bool is_message_set) {
if (UPB_UNLIKELY(is_message_set)) {
ptr = encode_msgset_item(ptr, e, ext, ext_val);
} else {
ptr = encode_field(ptr, e, &ext_val.UPB_PRIVATE(ext_msg_val),
&ext->UPB_PRIVATE(field));
}
return ptr;
}
static char* encode_exts(char* ptr, upb_encstate* e, const upb_MiniTable* m,
const upb_Message* msg) {
if (UPB_PRIVATE(_upb_MiniTable_ExtModeBase)(m) == kUpb_ExtMode_NonExtendable)
return ptr;
upb_Message_Internal* in = UPB_PRIVATE(_upb_Message_GetInternal)(msg);
if (!in) return ptr;
/* Encode all extensions together. Unlike C++, we do not attempt to keep
* these in field number order relative to normal fields or even to each
* other. */
uintptr_t iter = kUpb_Message_ExtensionBegin;
const upb_MiniTableExtension* ext;
upb_MessageValue ext_val;
if (!UPB_PRIVATE(_upb_Message_NextExtensionReverse)(msg, &ext, &ext_val,
&iter)) {
// Message has no extensions.
return ptr;
}
if (e->options & kUpb_EncodeOption_Deterministic) {
_upb_sortedmap sorted;
if (!_upb_mapsorter_pushexts(&e->sorter, in, &sorted)) {
// TODO: b/378744096 - handle alloc failure
}
const upb_Extension* ext;
while (_upb_sortedmap_nextext(&e->sorter, &sorted, &ext)) {
ptr = encode_ext(ptr, e, ext->ext, ext->data,
UPB_PRIVATE(_upb_MiniTable_ExtModeBase)(m) ==
kUpb_ExtMode_IsMessageSet);
}
_upb_mapsorter_popmap(&e->sorter, &sorted);
} else {
do {
ptr = encode_ext(ptr, e, ext, ext_val,
m->UPB_PRIVATE(ext) == kUpb_ExtMode_IsMessageSet);
} while (UPB_PRIVATE(_upb_Message_NextExtensionReverse)(msg, &ext, &ext_val,
&iter));
}
return ptr;
}
char* encode_message(char* ptr, upb_encstate* e, const upb_Message* msg,
const upb_MiniTable* m, size_t* size) {
size_t pre_len = upb_BackAlloc_Size(&e->alloc, ptr);
if (e->options & kUpb_EncodeOption_CheckRequired) {
if (m->UPB_PRIVATE(required_count)) {
if (!UPB_PRIVATE(_upb_Message_IsInitializedShallow)(msg, m)) {
encode_err(e, kUpb_EncodeStatus_MissingRequired);
}
}
}
if ((e->options & kUpb_EncodeOption_SkipUnknown) == 0) {
size_t unknown_size = 0;
uintptr_t iter = kUpb_Message_UnknownBegin;
upb_StringView unknown;
// Need to write in reverse order, but iteration is in-order; scan to
// reserve capacity up front, then write in-order
while (upb_Message_NextUnknown(msg, &unknown, &iter)) {
unknown_size += unknown.size;
}
if (unknown_size != 0) {
ptr = encode_reserve(ptr, e, unknown_size);
char* tmp_ptr = ptr;
iter = kUpb_Message_UnknownBegin;
while (upb_Message_NextUnknown(msg, &unknown, &iter)) {
memcpy(tmp_ptr, unknown.data, unknown.size);
tmp_ptr += unknown.size;
}
}
}
ptr = encode_exts(ptr, e, m, msg);
if (upb_MiniTable_FieldCount(m)) {
const upb_MiniTableField* f =
&m->UPB_PRIVATE(fields)[m->UPB_PRIVATE(field_count)];
const upb_MiniTableField* first = &m->UPB_PRIVATE(fields)[0];
while (f != first) {
f--;
if (encode_shouldencode(msg, f)) {
ptr = encode_field(ptr, e, msg, f);
}
}
}
*size = upb_BackAlloc_Size(&e->alloc, ptr) - pre_len;
return ptr;
}
static upb_EncodeStatus upb_Encoder_Encode(char* ptr,
upb_encstate* const encoder,
const upb_Message* const msg,
const upb_MiniTable* const l,
char** const buf, size_t* const size,
bool prepend_len) {
// Unfortunately we must continue to perform hackery here because there are
// code paths which blindly copy the returned pointer without bothering to
// check for errors until much later (b/235839510). So we still set *buf to
// NULL on error and we still set it to non-NULL on a successful empty result.
if (UPB_SETJMP(*encoder->err) == 0) {
size_t encoded_msg_size;
ptr = encode_message(ptr, encoder, msg, l, &encoded_msg_size);
if (prepend_len) {
ptr = encode_length(ptr, encoder, encoded_msg_size);
}
*size = upb_BackAlloc_Finish(&encoder->alloc, ptr);
*buf = ptr;
} else {
UPB_ASSERT(encoder->status != kUpb_EncodeStatus_Ok);
upb_BackAlloc_Abort(&encoder->alloc);
*buf = NULL;
*size = 0;
}
UPB_PRIVATE(_upb_encstate_destroy)(encoder);
return encoder->status;
}
upb_EncodeStatus _upb_Encode(const upb_Message* msg, const upb_MiniTable* l,
int options, upb_Arena* arena, char** buf,
size_t* size, bool prepend_len) {
upb_encstate e;
jmp_buf err;
e.status = kUpb_EncodeStatus_Ok;
e.err = &err;
char* ptr = upb_BackAlloc_Init(&e.alloc, arena);
e.depth = upb_EncodeOptions_GetEffectiveMaxDepth(options);
e.options = options;
_upb_mapsorter_init(&e.sorter);
return upb_Encoder_Encode(ptr, &e, msg, l, buf, size, prepend_len);
}
upb_EncodeStatus UPB_PRIVATE(_upb_Encode_Field)(upb_encstate* e,
const upb_Message* msg,
const upb_MiniTableField* field,
char** buf, size_t* size,
int options) {
e->options = options;
e->depth = upb_EncodeOptions_GetEffectiveMaxDepth(options);
char* ptr = *buf;
if (encode_shouldencode(msg, field)) {
ptr = encode_field(ptr, e, msg, field);
}
*size = upb_BackAlloc_Finish(&e->alloc, ptr);
*buf = ptr;
return e->status;
}
upb_EncodeStatus UPB_PRIVATE(_upb_Encode_Extension)(
upb_encstate* e, const upb_MiniTableExtension* ext,
upb_MessageValue ext_val, bool is_message_set, char** buf, size_t* size,
int options) {
e->options = options;
e->depth = upb_EncodeOptions_GetEffectiveMaxDepth(options);
char* ptr = *buf;
ptr = encode_ext(ptr, e, ext, ext_val, is_message_set);
*size = upb_BackAlloc_Finish(&e->alloc, ptr);
*buf = ptr;
return e->status;
}