#include "upb/msg.h" static bool is_power_of_two(size_t val) { return (val & (val - 1)) == 0; } /* Align up to the given power of 2. */ static size_t align_up(size_t val, size_t align) { UPB_ASSERT(is_power_of_two(align)); return (val + align - 1) & ~(align - 1); } static size_t div_round_up(size_t n, size_t d) { return (n + d - 1) / d; } bool upb_fieldtype_mapkeyok(upb_fieldtype_t type) { return type == UPB_TYPE_BOOL || type == UPB_TYPE_INT32 || type == UPB_TYPE_UINT32 || type == UPB_TYPE_INT64 || type == UPB_TYPE_UINT64 || type == UPB_TYPE_STRING; } void *upb_array_pack(const upb_array *arr, void *p, size_t *ofs, size_t size); void *upb_map_pack(const upb_map *map, void *p, size_t *ofs, size_t size); #define PTR_AT(msg, ofs, type) (type*)((char*)msg + ofs) #define VOIDPTR_AT(msg, ofs) PTR_AT(msg, ofs, void) #define ENCODE_MAX_NESTING 64 #define CHECK_TRUE(x) if (!(x)) { return false; } /** upb_msgval ****************************************************************/ #define upb_alignof(t) offsetof(struct { char c; t x; }, x) /* These functions will generate real memcpy() calls on ARM sadly, because * the compiler assumes they might not be aligned. */ static upb_msgval upb_msgval_read(const void *p, size_t ofs, uint8_t size) { upb_msgval val; p = (char*)p + ofs; memcpy(&val, p, size); return val; } static void upb_msgval_write(void *p, size_t ofs, upb_msgval val, uint8_t size) { p = (char*)p + ofs; memcpy(p, &val, size); } static size_t upb_msgval_sizeof(upb_fieldtype_t type) { switch (type) { case UPB_TYPE_DOUBLE: case UPB_TYPE_INT64: case UPB_TYPE_UINT64: return 8; case UPB_TYPE_ENUM: case UPB_TYPE_INT32: case UPB_TYPE_UINT32: case UPB_TYPE_FLOAT: return 4; case UPB_TYPE_BOOL: return 1; case UPB_TYPE_BYTES: case UPB_TYPE_MESSAGE: return sizeof(void*); case UPB_TYPE_STRING: return sizeof(char*) + sizeof(size_t); } UPB_UNREACHABLE(); } static uint8_t upb_msg_fieldsize(const upb_msglayout_fieldinit_v1 *field) { if (field->label == UPB_LABEL_REPEATED) { return sizeof(void*); } else { return upb_msgval_sizeof(field->type); } } static uint8_t upb_msg_fielddefsize(const upb_fielddef *f) { if (upb_fielddef_isseq(f)) { return sizeof(void*); } else { return upb_msgval_sizeof(upb_fielddef_type(f)); } } /* TODO(haberman): this is broken right now because upb_msgval can contain * a char* / size_t pair, which is too big for a upb_value. To fix this * we'll probably need to dynamically allocate a upb_msgval and store a * pointer to that in the tables for extensions/maps. */ static upb_value upb_toval(upb_msgval val) { upb_value ret; UPB_UNUSED(val); memset(&ret, 0, sizeof(upb_value)); /* XXX */ return ret; } static upb_msgval upb_msgval_fromval(upb_value val) { upb_msgval ret; UPB_UNUSED(val); memset(&ret, 0, sizeof(upb_msgval)); /* XXX */ return ret; } static upb_ctype_t upb_fieldtotabtype(upb_fieldtype_t type) { switch (type) { case UPB_TYPE_FLOAT: return UPB_CTYPE_FLOAT; case UPB_TYPE_DOUBLE: return UPB_CTYPE_DOUBLE; case UPB_TYPE_BOOL: return UPB_CTYPE_BOOL; case UPB_TYPE_BYTES: case UPB_TYPE_MESSAGE: case UPB_TYPE_STRING: return UPB_CTYPE_CONSTPTR; case UPB_TYPE_ENUM: case UPB_TYPE_INT32: return UPB_CTYPE_INT32; case UPB_TYPE_UINT32: return UPB_CTYPE_UINT32; case UPB_TYPE_INT64: return UPB_CTYPE_INT64; case UPB_TYPE_UINT64: return UPB_CTYPE_UINT64; default: UPB_ASSERT(false); return 0; } } static upb_msgval upb_msgval_fromdefault(const upb_fielddef *f) { switch (upb_fielddef_type(f)) { case UPB_TYPE_FLOAT: return upb_msgval_float(upb_fielddef_defaultfloat(f)); case UPB_TYPE_DOUBLE: return upb_msgval_double(upb_fielddef_defaultdouble(f)); case UPB_TYPE_BOOL: return upb_msgval_bool(upb_fielddef_defaultbool(f)); case UPB_TYPE_STRING: case UPB_TYPE_BYTES: { size_t len; const char *ptr = upb_fielddef_defaultstr(f, &len); return upb_msgval_str(ptr, len); } case UPB_TYPE_MESSAGE: return upb_msgval_msg(NULL); case UPB_TYPE_ENUM: case UPB_TYPE_INT32: return upb_msgval_int32(upb_fielddef_defaultint32(f)); case UPB_TYPE_UINT32: return upb_msgval_uint32(upb_fielddef_defaultuint32(f)); case UPB_TYPE_INT64: return upb_msgval_int64(upb_fielddef_defaultint64(f)); case UPB_TYPE_UINT64: return upb_msgval_uint64(upb_fielddef_defaultuint64(f)); default: UPB_ASSERT(false); return upb_msgval_msg(NULL); } } /** upb_msglayout *************************************************************/ struct upb_msglayout { struct upb_msglayout_msginit_v1 data; }; static void upb_msglayout_free(upb_msglayout *l) { upb_gfree(l->data.default_msg); upb_gfree(l); } static size_t upb_msglayout_place(upb_msglayout *l, size_t size) { size_t ret; l->data.size = align_up(l->data.size, size); l->data.align = align_up(l->data.align, size); ret = l->data.size; l->data.size += size; return ret; } static uint32_t upb_msglayout_offset(const upb_msglayout *l, const upb_fielddef *f) { return l->data.fields[upb_fielddef_index(f)].offset; } static uint32_t upb_msglayout_hasbit(const upb_msglayout *l, const upb_fielddef *f) { return l->data.fields[upb_fielddef_index(f)].hasbit; } static bool upb_msglayout_initdefault(upb_msglayout *l, const upb_msgdef *m) { upb_msg_field_iter it; if (upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2 && l->data.size) { /* Allocate default message and set default values in it. */ l->data.default_msg = upb_gmalloc(l->data.size); if (!l->data.default_msg) { return false; } memset(l->data.default_msg, 0, l->data.size); for (upb_msg_field_begin(&it, m); !upb_msg_field_done(&it); upb_msg_field_next(&it)) { const upb_fielddef* f = upb_msg_iter_field(&it); if (upb_fielddef_containingoneof(f)) { continue; } /* TODO(haberman): handle strings. */ if (!upb_fielddef_isstring(f) && !upb_fielddef_issubmsg(f) && !upb_fielddef_isseq(f)) { upb_msg_set(l->data.default_msg, upb_fielddef_index(f), upb_msgval_fromdefault(f), l); } } } return true; } static upb_msglayout *upb_msglayout_new(const upb_msgdef *m) { upb_msg_field_iter it; upb_msg_oneof_iter oit; upb_msglayout *l; size_t hasbit; size_t submsg_count = 0; const upb_msglayout_msginit_v1 **submsgs; upb_msglayout_fieldinit_v1 *fields; upb_msglayout_oneofinit_v1 *oneofs; for (upb_msg_field_begin(&it, m), hasbit = sizeof(void*) * 8; !upb_msg_field_done(&it); upb_msg_field_next(&it)) { const upb_fielddef* f = upb_msg_iter_field(&it); if (upb_fielddef_issubmsg(f)) { submsg_count++; } } l = upb_gmalloc(sizeof(*l)); if (!l) return NULL; memset(l, 0, sizeof(*l)); fields = upb_gmalloc(upb_msgdef_numfields(m) * sizeof(*fields)); submsgs = upb_gmalloc(submsg_count * sizeof(*submsgs)); oneofs = upb_gmalloc(upb_msgdef_numoneofs(m) * sizeof(*oneofs)); if ((!fields && upb_msgdef_numfields(m)) || (!submsgs && submsg_count) || (!oneofs && upb_msgdef_numoneofs(m))) { /* OOM. */ upb_gfree(l); upb_gfree(fields); upb_gfree(submsgs); upb_gfree(oneofs); return NULL; } l->data.field_count = upb_msgdef_numfields(m); l->data.oneof_count = upb_msgdef_numoneofs(m); l->data.fields = fields; l->data.submsgs = submsgs; l->data.oneofs = oneofs; l->data.is_proto2 = (upb_msgdef_syntax(m) == UPB_SYNTAX_PROTO2); /* Allocate data offsets in three stages: * * 1. hasbits. * 2. regular fields. * 3. oneof fields. * * OPT: There is a lot of room for optimization here to minimize the size. */ /* Allocate hasbits and set basic field attributes. */ for (upb_msg_field_begin(&it, m), hasbit = 0; !upb_msg_field_done(&it); upb_msg_field_next(&it)) { const upb_fielddef* f = upb_msg_iter_field(&it); upb_msglayout_fieldinit_v1 *field = &fields[upb_fielddef_index(f)]; field->number = upb_fielddef_number(f); field->type = upb_fielddef_type(f); field->label = upb_fielddef_label(f); if (upb_fielddef_containingoneof(f)) { field->oneof_index = upb_oneofdef_index(upb_fielddef_containingoneof(f)); } else { field->oneof_index = UPB_NOT_IN_ONEOF; } if (upb_fielddef_haspresence(f) && !upb_fielddef_containingoneof(f)) { field->hasbit = hasbit++; } } /* Account for space used by hasbits. */ l->data.size = div_round_up(hasbit, 8); l->data.align = 1; /* Allocate non-oneof fields. */ for (upb_msg_field_begin(&it, m); !upb_msg_field_done(&it); upb_msg_field_next(&it)) { const upb_fielddef* f = upb_msg_iter_field(&it); size_t field_size = upb_msg_fielddefsize(f); size_t index = upb_fielddef_index(f); if (upb_fielddef_containingoneof(f)) { /* Oneofs are handled separately below. */ continue; } fields[index].offset = upb_msglayout_place(l, field_size); } /* Allocate oneof fields. Each oneof field consists of a uint32 for the case * and space for the actual data. */ for (upb_msg_oneof_begin(&oit, m); !upb_msg_oneof_done(&oit); upb_msg_oneof_next(&oit)) { const upb_oneofdef* o = upb_msg_iter_oneof(&oit); upb_oneof_iter fit; size_t case_size = sizeof(uint32_t); /* Could potentially optimize this. */ upb_msglayout_oneofinit_v1 *oneof = &oneofs[upb_oneofdef_index(o)]; size_t field_size = 0; /* Calculate field size: the max of all field sizes. */ for (upb_oneof_begin(&fit, o); !upb_oneof_done(&fit); upb_oneof_next(&fit)) { const upb_fielddef* f = upb_oneof_iter_field(&fit); field_size = UPB_MAX(field_size, upb_msg_fielddefsize(f)); } /* Align and allocate case offset. */ oneof->case_offset = upb_msglayout_place(l, case_size); oneof->data_offset = upb_msglayout_place(l, field_size); } /* Size of the entire structure should be a multiple of its greatest * alignment. */ l->data.size = align_up(l->data.size, l->data.align); if (upb_msglayout_initdefault(l, m)) { return l; } else { upb_msglayout_free(l); return NULL; } } /** upb_msgfactory ************************************************************/ struct upb_msgfactory { const upb_symtab *symtab; /* We own a ref. */ upb_inttable layouts; upb_inttable mergehandlers; }; upb_msgfactory *upb_msgfactory_new(const upb_symtab *symtab) { upb_msgfactory *ret = upb_gmalloc(sizeof(*ret)); ret->symtab = symtab; upb_inttable_init(&ret->layouts, UPB_CTYPE_PTR); upb_inttable_init(&ret->mergehandlers, UPB_CTYPE_CONSTPTR); return ret; } void upb_msgfactory_free(upb_msgfactory *f) { upb_inttable_iter i; upb_inttable_begin(&i, &f->layouts); for(; !upb_inttable_done(&i); upb_inttable_next(&i)) { upb_msglayout *l = upb_value_getptr(upb_inttable_iter_value(&i)); upb_msglayout_free(l); } upb_inttable_begin(&i, &f->mergehandlers); for(; !upb_inttable_done(&i); upb_inttable_next(&i)) { const upb_handlers *h = upb_value_getconstptr(upb_inttable_iter_value(&i)); upb_handlers_unref(h, f); } upb_inttable_uninit(&f->layouts); upb_inttable_uninit(&f->mergehandlers); upb_gfree(f); } const upb_symtab *upb_msgfactory_symtab(const upb_msgfactory *f) { return f->symtab; } const upb_msglayout *upb_msgfactory_getlayout(upb_msgfactory *f, const upb_msgdef *m) { upb_value v; UPB_ASSERT(upb_symtab_lookupmsg(f->symtab, upb_msgdef_fullname(m)) == m); UPB_ASSERT(!upb_msgdef_mapentry(m)); if (upb_inttable_lookupptr(&f->layouts, m, &v)) { UPB_ASSERT(upb_value_getptr(v)); return upb_value_getptr(v); } else { upb_msgfactory *mutable_f = (void*)f; upb_msglayout *l = upb_msglayout_new(m); upb_inttable_insertptr(&mutable_f->layouts, m, upb_value_ptr(l)); UPB_ASSERT(l); return l; } } /* Our handlers that we don't expose externally. */ void *upb_msg_startstr(void *msg, const void *hd, size_t size_hint) { uint32_t ofs = (uintptr_t)hd; upb_alloc *alloc = upb_msg_alloc(msg); upb_msgval val; UPB_UNUSED(size_hint); val = upb_msgval_read(msg, ofs, upb_msgval_sizeof(UPB_TYPE_STRING)); upb_free(alloc, (void*)val.str.ptr); val.str.ptr = NULL; val.str.len = 0; upb_msgval_write(msg, ofs, val, upb_msgval_sizeof(UPB_TYPE_STRING)); return msg; } size_t upb_msg_str(void *msg, const void *hd, const char *ptr, size_t size, const upb_bufhandle *handle) { uint32_t ofs = (uintptr_t)hd; upb_alloc *alloc = upb_msg_alloc(msg); upb_msgval val; size_t newsize; UPB_UNUSED(handle); val = upb_msgval_read(msg, ofs, upb_msgval_sizeof(UPB_TYPE_STRING)); newsize = val.str.len + size; val.str.ptr = upb_realloc(alloc, (void*)val.str.ptr, val.str.len, newsize); if (!val.str.ptr) { return false; } memcpy((char*)val.str.ptr + val.str.len, ptr, size); val.str.len = newsize; upb_msgval_write(msg, ofs, val, upb_msgval_sizeof(UPB_TYPE_STRING)); return size; } static void callback(const void *closure, upb_handlers *h) { upb_msgfactory *factory = (upb_msgfactory*)closure; const upb_msgdef *md = upb_handlers_msgdef(h); const upb_msglayout* layout = upb_msgfactory_getlayout(factory, md); upb_msg_field_iter i; UPB_UNUSED(factory); for(upb_msg_field_begin(&i, md); !upb_msg_field_done(&i); upb_msg_field_next(&i)) { const upb_fielddef *f = upb_msg_iter_field(&i); size_t offset = upb_msglayout_offset(layout, f); upb_handlerattr attr = UPB_HANDLERATTR_INITIALIZER; upb_handlerattr_sethandlerdata(&attr, (void*)offset); if (upb_fielddef_isseq(f)) { } else if (upb_fielddef_isstring(f)) { upb_handlers_setstartstr(h, f, upb_msg_startstr, &attr); upb_handlers_setstring(h, f, upb_msg_str, &attr); } else { upb_msg_setscalarhandler( h, f, offset, upb_msglayout_hasbit(layout, f)); } } } const upb_handlers *upb_msgfactory_getmergehandlers(upb_msgfactory *f, const upb_msgdef *m) { upb_msgfactory *mutable_f = (void*)f; /* TODO(haberman): properly cache these. */ const upb_handlers *ret = upb_handlers_newfrozen(m, f, callback, f); upb_inttable_push(&mutable_f->mergehandlers, upb_value_constptr(ret)); return ret; } const upb_visitorplan *upb_msgfactory_getvisitorplan(upb_msgfactory *f, const upb_handlers *h) { const upb_msgdef *md = upb_handlers_msgdef(h); return (const upb_visitorplan*)upb_msgfactory_getlayout(f, md); } /** upb_visitor ***************************************************************/ struct upb_visitor { const upb_msglayout *layout; upb_sink *sink; }; static upb_selector_t getsel2(const upb_fielddef *f, upb_handlertype_t type) { upb_selector_t ret; bool ok = upb_handlers_getselector(f, type, &ret); UPB_ASSERT(ok); return ret; } static bool upb_visitor_hasfield(const upb_msg *msg, const upb_fielddef *f, const upb_msglayout *layout) { int field_index = upb_fielddef_index(f); if (upb_fielddef_isseq(f)) { return upb_msgval_getarr(upb_msg_get(msg, field_index, layout)) != NULL; } else if (upb_msgdef_syntax(upb_fielddef_containingtype(f)) == UPB_SYNTAX_PROTO2) { return upb_msg_has(msg, field_index, layout); } else { upb_msgval val = upb_msg_get(msg, field_index, layout); switch (upb_fielddef_type(f)) { case UPB_TYPE_FLOAT: return upb_msgval_getfloat(val) != 0; case UPB_TYPE_DOUBLE: return upb_msgval_getdouble(val) != 0; case UPB_TYPE_BOOL: return upb_msgval_getbool(val); case UPB_TYPE_ENUM: case UPB_TYPE_INT32: return upb_msgval_getint32(val) != 0; case UPB_TYPE_UINT32: return upb_msgval_getuint32(val) != 0; case UPB_TYPE_INT64: return upb_msgval_getint64(val) != 0; case UPB_TYPE_UINT64: return upb_msgval_getuint64(val) != 0; case UPB_TYPE_STRING: case UPB_TYPE_BYTES: return upb_msgval_getstr(val) && upb_msgval_getstrlen(val) > 0; case UPB_TYPE_MESSAGE: return upb_msgval_getmsg(val) != NULL; } UPB_UNREACHABLE(); } } static bool upb_visitor_visitmsg2(const upb_msg *msg, const upb_msglayout *layout, upb_sink *sink, int depth) { const upb_msgdef *md = upb_handlers_msgdef(sink->handlers); upb_msg_field_iter i; upb_status status; upb_sink_startmsg(sink); /* Protect against cycles (possible because users may freely reassign message * and repeated fields) by imposing a maximum recursion depth. */ if (depth > ENCODE_MAX_NESTING) { return false; } for (upb_msg_field_begin(&i, md); !upb_msg_field_done(&i); upb_msg_field_next(&i)) { upb_fielddef *f = upb_msg_iter_field(&i); upb_msgval val; if (!upb_visitor_hasfield(msg, f, layout)) { continue; } val = upb_msg_get(msg, upb_fielddef_index(f), layout); if (upb_fielddef_isseq(f)) { const upb_array *arr = upb_msgval_getarr(val); UPB_ASSERT(arr); /* TODO: putary(ary, f, sink, depth);*/ } else if (upb_fielddef_issubmsg(f)) { const upb_map *map = upb_msgval_getmap(val); UPB_ASSERT(map); /* TODO: putmap(map, f, sink, depth);*/ } else if (upb_fielddef_isstring(f)) { /* TODO putstr(); */ } else { upb_selector_t sel = getsel2(f, upb_handlers_getprimitivehandlertype(f)); UPB_ASSERT(upb_fielddef_isprimitive(f)); switch (upb_fielddef_type(f)) { case UPB_TYPE_FLOAT: CHECK_TRUE(upb_sink_putfloat(sink, sel, upb_msgval_getfloat(val))); break; case UPB_TYPE_DOUBLE: CHECK_TRUE(upb_sink_putdouble(sink, sel, upb_msgval_getdouble(val))); break; case UPB_TYPE_BOOL: CHECK_TRUE(upb_sink_putbool(sink, sel, upb_msgval_getbool(val))); break; case UPB_TYPE_ENUM: case UPB_TYPE_INT32: CHECK_TRUE(upb_sink_putint32(sink, sel, upb_msgval_getint32(val))); break; case UPB_TYPE_UINT32: CHECK_TRUE(upb_sink_putuint32(sink, sel, upb_msgval_getuint32(val))); break; case UPB_TYPE_INT64: CHECK_TRUE(upb_sink_putint64(sink, sel, upb_msgval_getint64(val))); break; case UPB_TYPE_UINT64: CHECK_TRUE(upb_sink_putuint64(sink, sel, upb_msgval_getuint64(val))); break; case UPB_TYPE_STRING: case UPB_TYPE_BYTES: case UPB_TYPE_MESSAGE: UPB_UNREACHABLE(); } } } upb_sink_endmsg(sink, &status); return true; } upb_visitor *upb_visitor_create(upb_env *e, const upb_visitorplan *vp, upb_sink *output) { upb_visitor *visitor = upb_env_malloc(e, sizeof(*visitor)); visitor->layout = (const upb_msglayout*)vp; visitor->sink = output; return visitor; } bool upb_visitor_visitmsg(upb_visitor *visitor, const upb_msg *msg) { return upb_visitor_visitmsg2(msg, visitor->layout, visitor->sink, 0); } /** upb_msg *******************************************************************/ /* If we always read/write as a consistent type to each address, this shouldn't * violate aliasing. */ #define DEREF(msg, ofs, type) *PTR_AT(msg, ofs, type) /* Internal members of a upb_msg. We can change this without breaking binary * compatibility. We put these before the user's data. The user's upb_msg* * points after the upb_msg_internal. */ /* Used when a message is not extendable. */ typedef struct { /* TODO(haberman): add unknown fields. */ upb_alloc *alloc; } upb_msg_internal; /* Used when a message is extendable. */ typedef struct { upb_inttable *extdict; upb_msg_internal base; } upb_msg_internal_withext; static int upb_msg_internalsize(const upb_msglayout *l) { return sizeof(upb_msg_internal) - l->data.extendable * sizeof(void*); } static upb_msg_internal *upb_msg_getinternal(upb_msg *msg) { return VOIDPTR_AT(msg, -sizeof(upb_msg_internal)); } static const upb_msg_internal *upb_msg_getinternal_const(const upb_msg *msg) { return VOIDPTR_AT(msg, -sizeof(upb_msg_internal)); } static upb_msg_internal_withext *upb_msg_getinternalwithext( upb_msg *msg, const upb_msglayout *l) { UPB_ASSERT(l->data.extendable); return VOIDPTR_AT(msg, -sizeof(upb_msg_internal_withext)); } static const upb_msglayout_fieldinit_v1 *upb_msg_checkfield( int field_index, const upb_msglayout *l) { UPB_ASSERT(field_index >= 0 && field_index < l->data.field_count); return &l->data.fields[field_index]; } static bool upb_msg_inoneof(const upb_msglayout_fieldinit_v1 *field) { return field->oneof_index != UPB_NOT_IN_ONEOF; } static uint32_t *upb_msg_oneofcase(const upb_msg *msg, int field_index, const upb_msglayout *l) { const upb_msglayout_fieldinit_v1 *field = upb_msg_checkfield(field_index, l); UPB_ASSERT(upb_msg_inoneof(field)); return PTR_AT(msg, l->data.oneofs[field->oneof_index].case_offset, uint32_t); } size_t upb_msg_sizeof(const upb_msglayout *l) { return l->data.size + upb_msg_internalsize(l); } upb_msg *upb_msg_init(void *mem, const upb_msglayout *l, upb_alloc *a) { upb_msg *msg = VOIDPTR_AT(mem, upb_msg_internalsize(l)); if (l->data.default_msg) { memcpy(msg, l->data.default_msg, l->data.size); } else { memset(msg, 0, l->data.size); } UPB_ASSERT(!upb_msg_getinternal(msg)->alloc); upb_msg_getinternal(msg)->alloc = a; if (l->data.extendable) { upb_msg_getinternalwithext(msg, l)->extdict = NULL; } return msg; } void *upb_msg_uninit(upb_msg *msg, const upb_msglayout *l) { if (l->data.extendable) { upb_inttable *ext_dict = upb_msg_getinternalwithext(msg, l)->extdict; if (ext_dict) { upb_inttable_uninit2(ext_dict, upb_msg_alloc(msg)); upb_free(upb_msg_alloc(msg), ext_dict); } } return VOIDPTR_AT(msg, -upb_msg_internalsize(l)); } upb_msg *upb_msg_new(const upb_msglayout *l, upb_alloc *a) { void *mem = upb_malloc(a, upb_msg_sizeof(l)); return mem ? upb_msg_init(mem, l, a) : NULL; } void upb_msg_free(upb_msg *msg, const upb_msglayout *l) { upb_free(upb_msg_alloc(msg), upb_msg_uninit(msg, l)); } upb_alloc *upb_msg_alloc(const upb_msg *msg) { return upb_msg_getinternal_const(msg)->alloc; } bool upb_msg_has(const upb_msg *msg, int field_index, const upb_msglayout *l) { const upb_msglayout_fieldinit_v1 *field = upb_msg_checkfield(field_index, l); UPB_ASSERT(l->data.is_proto2); if (upb_msg_inoneof(field)) { /* Oneofs are set when the oneof number is set to this field. */ return *upb_msg_oneofcase(msg, field_index, l) == field->number; } else { /* Other fields are set when their hasbit is set. */ uint32_t hasbit = l->data.fields[field_index].hasbit; return DEREF(msg, hasbit / 8, char) | (1 << (hasbit % 8)); } } upb_msgval upb_msg_get(const upb_msg *msg, int field_index, const upb_msglayout *l) { const upb_msglayout_fieldinit_v1 *field = upb_msg_checkfield(field_index, l); int size = upb_msg_fieldsize(field); if (upb_msg_inoneof(field)) { if (*upb_msg_oneofcase(msg, field_index, l) == field->number) { size_t ofs = l->data.oneofs[field->oneof_index].data_offset; return upb_msgval_read(msg, ofs, size); } else { /* Return default. */ return upb_msgval_read(l->data.default_msg, field->offset, size); } } else { return upb_msgval_read(msg, field->offset, size); } } void upb_msg_set(upb_msg *msg, int field_index, upb_msgval val, const upb_msglayout *l) { const upb_msglayout_fieldinit_v1 *field = upb_msg_checkfield(field_index, l); int size = upb_msg_fieldsize(field); if (upb_msg_inoneof(field)) { size_t ofs = l->data.oneofs[field->oneof_index].data_offset; *upb_msg_oneofcase(msg, field_index, l) = field->number; upb_msgval_write(msg, ofs, val, size); } else { upb_msgval_write(msg, field->offset, val, size); } } /** upb_array *****************************************************************/ struct upb_array { upb_fieldtype_t type; uint8_t element_size; void *data; /* Each element is element_size. */ size_t len; /* Measured in elements. */ size_t size; /* Measured in elements. */ upb_alloc *alloc; }; #define DEREF_ARR(arr, i, type) ((type*)arr->data)[i] size_t upb_array_sizeof(upb_fieldtype_t type) { UPB_UNUSED(type); return sizeof(upb_array); } void upb_array_init(upb_array *arr, upb_fieldtype_t type, upb_alloc *alloc) { arr->type = type; arr->data = NULL; arr->len = 0; arr->size = 0; arr->element_size = upb_msgval_sizeof(type); arr->alloc = alloc; } void upb_array_uninit(upb_array *arr) { upb_free(arr->alloc, arr->data); } upb_array *upb_array_new(upb_fieldtype_t type, upb_alloc *a) { upb_array *ret = upb_malloc(a, upb_array_sizeof(type)); if (ret) { upb_array_init(ret, type, a); } return ret; } void upb_array_free(upb_array *arr) { upb_array_uninit(arr); upb_free(arr->alloc, arr); } size_t upb_array_size(const upb_array *arr) { return arr->len; } upb_fieldtype_t upb_array_type(const upb_array *arr) { return arr->type; } upb_msgval upb_array_get(const upb_array *arr, size_t i) { UPB_ASSERT(i < arr->len); return upb_msgval_read(arr->data, i * arr->element_size, arr->element_size); } bool upb_array_set(upb_array *arr, size_t i, upb_msgval val) { UPB_ASSERT(i <= arr->len); if (i == arr->len) { /* Extending the array. */ if (i == arr->size) { /* Need to reallocate. */ size_t new_size = UPB_MAX(arr->size * 2, 8); size_t new_bytes = new_size * arr->element_size; size_t old_bytes = arr->size * arr->element_size; upb_msgval *new_data = upb_realloc(arr->alloc, arr->data, old_bytes, new_bytes); if (!new_data) { return false; } arr->data = new_data; arr->size = new_size; } arr->len = i + 1; } upb_msgval_write(arr->data, i * arr->element_size, val, arr->element_size); return true; } /** upb_map *******************************************************************/ struct upb_map { upb_fieldtype_t key_type; upb_fieldtype_t val_type; /* We may want to optimize this to use inttable where possible, for greater * efficiency and lower memory footprint. */ upb_strtable strtab; upb_alloc *alloc; }; static void upb_map_tokey(upb_fieldtype_t type, upb_msgval *key, const char **out_key, size_t *out_len) { switch (type) { case UPB_TYPE_STRING: /* Point to string data of the input key. */ *out_key = key->str.ptr; *out_len = key->str.len; return; case UPB_TYPE_BOOL: case UPB_TYPE_INT32: case UPB_TYPE_UINT32: case UPB_TYPE_INT64: case UPB_TYPE_UINT64: /* Point to the key itself. XXX: big-endian. */ *out_key = (const char*)key; *out_len = upb_msgval_sizeof(type); return; case UPB_TYPE_BYTES: case UPB_TYPE_DOUBLE: case UPB_TYPE_ENUM: case UPB_TYPE_FLOAT: case UPB_TYPE_MESSAGE: break; /* Cannot be a map key. */ } UPB_UNREACHABLE(); } static upb_msgval upb_map_fromkey(upb_fieldtype_t type, const char *key, size_t len) { switch (type) { case UPB_TYPE_STRING: return upb_msgval_str(key, len); case UPB_TYPE_BOOL: case UPB_TYPE_INT32: case UPB_TYPE_UINT32: case UPB_TYPE_INT64: case UPB_TYPE_UINT64: return upb_msgval_read(key, 0, upb_msgval_sizeof(type)); case UPB_TYPE_BYTES: case UPB_TYPE_DOUBLE: case UPB_TYPE_ENUM: case UPB_TYPE_FLOAT: case UPB_TYPE_MESSAGE: break; /* Cannot be a map key. */ } UPB_UNREACHABLE(); } size_t upb_map_sizeof(upb_fieldtype_t ktype, upb_fieldtype_t vtype) { /* Size does not currently depend on key/value type. */ UPB_UNUSED(ktype); UPB_UNUSED(vtype); return sizeof(upb_map); } bool upb_map_init(upb_map *map, upb_fieldtype_t ktype, upb_fieldtype_t vtype, upb_alloc *a) { upb_ctype_t vtabtype = upb_fieldtotabtype(vtype); UPB_ASSERT(upb_fieldtype_mapkeyok(ktype)); map->key_type = ktype; map->val_type = vtype; map->alloc = a; if (!upb_strtable_init2(&map->strtab, vtabtype, a)) { return false; } return true; } void upb_map_uninit(upb_map *map) { upb_strtable_uninit2(&map->strtab, map->alloc); } upb_map *upb_map_new(upb_fieldtype_t ktype, upb_fieldtype_t vtype, upb_alloc *a) { upb_map *map = upb_malloc(a, upb_map_sizeof(ktype, vtype)); if (!map) { return NULL; } if (!upb_map_init(map, ktype, vtype, a)) { return NULL; } return map; } void upb_map_free(upb_map *map) { upb_map_uninit(map); upb_free(map->alloc, map); } size_t upb_map_size(const upb_map *map) { return upb_strtable_count(&map->strtab); } upb_fieldtype_t upb_map_keytype(const upb_map *map) { return map->key_type; } upb_fieldtype_t upb_map_valuetype(const upb_map *map) { return map->val_type; } bool upb_map_get(const upb_map *map, upb_msgval key, upb_msgval *val) { upb_value tabval; const char *key_str; size_t key_len; bool ret; upb_map_tokey(map->key_type, &key, &key_str, &key_len); ret = upb_strtable_lookup2(&map->strtab, key_str, key_len, &tabval); if (ret) { memcpy(val, &tabval, sizeof(tabval)); } return ret; } bool upb_map_set(upb_map *map, upb_msgval key, upb_msgval val, upb_msgval *removed) { const char *key_str; size_t key_len; upb_value tabval = upb_toval(val); upb_value removedtabval; upb_alloc *a = map->alloc; upb_map_tokey(map->key_type, &key, &key_str, &key_len); /* TODO(haberman): add overwrite operation to minimize number of lookups. */ if (upb_strtable_lookup2(&map->strtab, key_str, key_len, NULL)) { upb_strtable_remove3(&map->strtab, key_str, key_len, &removedtabval, a); memcpy(&removed, &removedtabval, sizeof(removed)); } return upb_strtable_insert3(&map->strtab, key_str, key_len, tabval, a); } bool upb_map_del(upb_map *map, upb_msgval key) { const char *key_str; size_t key_len; upb_alloc *a = map->alloc; upb_map_tokey(map->key_type, &key, &key_str, &key_len); return upb_strtable_remove3(&map->strtab, key_str, key_len, NULL, a); } /** upb_mapiter ***************************************************************/ struct upb_mapiter { upb_strtable_iter iter; upb_fieldtype_t key_type; }; size_t upb_mapiter_sizeof() { return sizeof(upb_mapiter); } void upb_mapiter_begin(upb_mapiter *i, const upb_map *map) { upb_strtable_begin(&i->iter, &map->strtab); i->key_type = map->key_type; } upb_mapiter *upb_mapiter_new(const upb_map *t, upb_alloc *a) { upb_mapiter *ret = upb_malloc(a, upb_mapiter_sizeof()); if (!ret) { return NULL; } upb_mapiter_begin(ret, t); return ret; } void upb_mapiter_free(upb_mapiter *i, upb_alloc *a) { upb_free(a, i); } void upb_mapiter_next(upb_mapiter *i) { upb_strtable_next(&i->iter); } bool upb_mapiter_done(const upb_mapiter *i) { return upb_strtable_done(&i->iter); } upb_msgval upb_mapiter_key(const upb_mapiter *i) { return upb_map_fromkey(i->key_type, upb_strtable_iter_key(&i->iter), upb_strtable_iter_keylength(&i->iter)); } upb_msgval upb_mapiter_value(const upb_mapiter *i) { return upb_msgval_fromval(upb_strtable_iter_value(&i->iter)); } void upb_mapiter_setdone(upb_mapiter *i) { upb_strtable_iter_setdone(&i->iter); } bool upb_mapiter_isequal(const upb_mapiter *i1, const upb_mapiter *i2) { return upb_strtable_iter_isequal(&i1->iter, &i2->iter); } /** Handlers for upb_msg ******************************************************/ typedef struct { size_t offset; int32_t hasbit; } upb_msg_handlerdata; /* Fallback implementation if the handler is not specialized by the producer. */ #define MSG_WRITER(type, ctype) \ bool upb_msg_set ## type (void *c, const void *hd, ctype val) { \ uint8_t *m = c; \ const upb_msg_handlerdata *d = hd; \ if (d->hasbit > 0) \ *(uint8_t*)&m[d->hasbit / 8] |= 1 << (d->hasbit % 8); \ *(ctype*)&m[d->offset] = val; \ return true; \ } \ MSG_WRITER(double, double) MSG_WRITER(float, float) MSG_WRITER(int32, int32_t) MSG_WRITER(int64, int64_t) MSG_WRITER(uint32, uint32_t) MSG_WRITER(uint64, uint64_t) MSG_WRITER(bool, bool) bool upb_msg_setscalarhandler(upb_handlers *h, const upb_fielddef *f, size_t offset, int32_t hasbit) { upb_handlerattr attr = UPB_HANDLERATTR_INITIALIZER; bool ok; upb_msg_handlerdata *d = upb_gmalloc(sizeof(*d)); if (!d) return false; d->offset = offset; d->hasbit = hasbit; upb_handlerattr_sethandlerdata(&attr, d); upb_handlerattr_setalwaysok(&attr, true); upb_handlers_addcleanup(h, d, upb_gfree); #define TYPE(u, l) \ case UPB_TYPE_##u: \ ok = upb_handlers_set##l(h, f, upb_msg_set##l, &attr); break; ok = false; switch (upb_fielddef_type(f)) { TYPE(INT64, int64); TYPE(INT32, int32); TYPE(ENUM, int32); TYPE(UINT64, uint64); TYPE(UINT32, uint32); TYPE(DOUBLE, double); TYPE(FLOAT, float); TYPE(BOOL, bool); default: UPB_ASSERT(false); break; } #undef TYPE upb_handlerattr_uninit(&attr); return ok; } bool upb_msg_getscalarhandlerdata(const upb_handlers *h, upb_selector_t s, upb_fieldtype_t *type, size_t *offset, int32_t *hasbit) { const upb_msg_handlerdata *d; upb_func *f = upb_handlers_gethandler(h, s); if ((upb_int64_handlerfunc*)f == upb_msg_setint64) { *type = UPB_TYPE_INT64; } else if ((upb_int32_handlerfunc*)f == upb_msg_setint32) { *type = UPB_TYPE_INT32; } else if ((upb_uint64_handlerfunc*)f == upb_msg_setuint64) { *type = UPB_TYPE_UINT64; } else if ((upb_uint32_handlerfunc*)f == upb_msg_setuint32) { *type = UPB_TYPE_UINT32; } else if ((upb_double_handlerfunc*)f == upb_msg_setdouble) { *type = UPB_TYPE_DOUBLE; } else if ((upb_float_handlerfunc*)f == upb_msg_setfloat) { *type = UPB_TYPE_FLOAT; } else if ((upb_bool_handlerfunc*)f == upb_msg_setbool) { *type = UPB_TYPE_BOOL; } else { return false; } d = upb_handlers_gethandlerdata(h, s); *offset = d->offset; *hasbit = d->hasbit; return true; }