Incremental progress towards getting upb_def to bootstrap.

pull/13171/head
Joshua Haberman 15 years ago
parent 67b16cbe5c
commit db6c7387bc
  1. 3
      Makefile
  2. 9
      core/upb.c
  3. 7
      core/upb.h
  4. 102
      core/upb_def.c
  5. 62
      core/upb_def.h
  6. 1
      core/upb_stream_vtbl.h
  7. 2
      core/upb_table.c
  8. 3
      tests/test_string.c

@ -48,12 +48,13 @@ clean:
# The core library (core/libupb.a)
SRC=core/upb.c stream/upb_decoder.c core/upb_table.c core/upb_def.c core/upb_string.c \
descriptor/descriptor.c
$(SRC): perf-cppflags
# Parts of core that are yet to be converted.
OTHERSRC=src/upb_encoder.c src/upb_text.c
# Override the optimization level for upb_def.o, because it is not in the
# critical path but gets very large when -O3 is used.
core/upb_def.o: core/upb_def.c
$(CC) $(CFLAGS) $(CPPFLAGS) -Os -c -o $@ $<
$(CC) $(CFLAGS) $(CPPFLAGS) -O0 -c -o $@ $<
core/upb_def.lo: core/upb_def.c
$(CC) $(CFLAGS) $(CPPFLAGS) -Os -c -o $@ $< -fPIC

@ -44,12 +44,11 @@ void upb_seterr(upb_status *status, enum upb_status_code code,
const char *msg, ...)
{
if(upb_ok(status)) { // The first error is the most interesting.
status->str = upb_string_new();
char *str = upb_string_getrwbuf(status->str, UPB_ERRORMSG_MAXLEN);
status->code = code;
status->str = upb_string_tryrecycle(status->str);
va_list args;
va_start(args, msg);
vsnprintf(str, UPB_ERRORMSG_MAXLEN, msg, args);
upb_string_vprintf(status->str, msg, args);
va_end(args);
}
}
@ -57,10 +56,10 @@ void upb_seterr(upb_status *status, enum upb_status_code code,
void upb_copyerr(upb_status *to, upb_status *from)
{
to->code = from->code;
to->str = upb_string_getref(from->str);
if(from->str) to->str = upb_string_getref(from->str);
}
void upb_reset(upb_status *status) {
void upb_status_reset(upb_status *status) {
status->code = UPB_STATUS_OK;
upb_string_unref(status->str);
status->str = NULL;

@ -195,7 +195,12 @@ INLINE bool upb_ok(upb_status *status) {
return status->code == UPB_STATUS_OK;
}
void upb_reset(upb_status *status);
INLINE void upb_status_init(upb_status *status) {
status->code = UPB_STATUS_OK;
status->str = NULL;
}
void upb_status_reset(upb_status *status);
void upb_seterr(upb_status *status, enum upb_status_code code, const char *msg,
...);
void upb_copyerr(upb_status *to, upb_status *from);

@ -155,8 +155,9 @@ static int upb_cycle_ref_or_unref(upb_msgdef *m, upb_msgdef *cycle_base,
} else {
open_defs[num_open_defs++] = m;
}
for(int i = 0; i < m->num_fields; i++) {
upb_fielddef *f = &m->fields[i];
upb_msg_iter iter = upb_msg_begin(m);
for(; !upb_msg_done(iter); iter = upb_msg_next(m, iter)) {
upb_fielddef *f = upb_msg_iter_field(iter);
upb_def *def = f->def;
if(upb_issubmsg(f) && def->is_cyclic) {
upb_msgdef *sub_m = upb_downcast_msgdef(def);
@ -230,16 +231,6 @@ static void upb_unresolveddef_free(struct _upb_unresolveddef *def) {
/* upb_enumdef ****************************************************************/
typedef struct {
upb_strtable_entry e;
uint32_t value;
} ntoi_ent;
typedef struct {
upb_inttable_entry e;
upb_string *string;
} iton_ent;
static void upb_enumdef_free(upb_enumdef *e) {
upb_strtable_free(&e->ntoi);
upb_inttable_free(&e->iton);
@ -271,8 +262,8 @@ static bool upb_addenum_val(upb_src *src, upb_enumdef *e, upb_status *status)
upb_seterr(status, UPB_STATUS_ERROR, "Enum value missing name or number.");
goto err;
}
ntoi_ent ntoi_ent = {{name, 0}, number};
iton_ent iton_ent = {{number, 0}, name};
upb_ntoi_ent ntoi_ent = {{name, 0}, number};
upb_iton_ent iton_ent = {{number, 0}, name};
upb_strtable_insert(&e->ntoi, &ntoi_ent.e);
upb_inttable_insert(&e->iton, &iton_ent.e);
// We don't unref "name" because we pass our ref to the iton entry of the
@ -291,11 +282,14 @@ static bool upb_addenum(upb_src *src, upb_deflist *defs, upb_status *status)
{
upb_enumdef *e = malloc(sizeof(*e));
upb_def_init(&e->base, UPB_DEF_ENUM);
upb_strtable_init(&e->ntoi, 0, sizeof(ntoi_ent));
upb_inttable_init(&e->iton, 0, sizeof(iton_ent));
upb_strtable_init(&e->ntoi, 0, sizeof(upb_ntoi_ent));
upb_inttable_init(&e->iton, 0, sizeof(upb_iton_ent));
upb_fielddef *f;
while((f = upb_src_getdef(src)) != NULL) {
switch(f->number) {
case GOOGLE_PROTOBUF_ENUMDESCRIPTORPROTO_NAME_FIELDNUM:
e->base.fqname = upb_string_tryrecycle(e->base.fqname);
CHECKSRC(upb_src_getstr(src, e->base.fqname));
case GOOGLE_PROTOBUF_ENUMDESCRIPTORPROTO_VALUE_FIELDNUM:
CHECK(upb_addenum_val(src, e, status));
break;
@ -304,37 +298,25 @@ static bool upb_addenum(upb_src *src, upb_deflist *defs, upb_status *status)
break;
}
}
assert(e->base.fqname);
upb_deflist_push(defs, UPB_UPCAST(e));
return true;
src_err:
upb_copyerr(status, upb_src_status(src));
err:
upb_enumdef_free(e);
return false;
}
static void fill_iter(upb_enum_iter *iter, ntoi_ent *ent) {
iter->state = ent;
iter->name = ent->e.key;
iter->val = ent->value;
}
void upb_enum_begin(upb_enum_iter *iter, upb_enumdef *e) {
upb_enum_iter upb_enum_begin(upb_enumdef *e) {
// We could iterate over either table here; the choice is arbitrary.
ntoi_ent *ent = upb_strtable_begin(&e->ntoi);
iter->e = e;
fill_iter(iter, ent);
return upb_inttable_begin(&e->iton);
}
void upb_enum_next(upb_enum_iter *iter) {
ntoi_ent *ent = iter->state;
assert(ent);
ent = upb_strtable_next(&iter->e->ntoi, &ent->e);
iter->state = ent;
if(ent) fill_iter(iter, ent);
}
bool upb_enum_done(upb_enum_iter *iter) {
return iter->state == NULL;
upb_enum_iter upb_enum_next(upb_enumdef *e, upb_enum_iter iter) {
assert(iter);
return upb_inttable_next(&e->iton, &iter->e);
}
@ -346,7 +328,7 @@ static void upb_fielddef_free(upb_fielddef *f) {
static void upb_fielddef_uninit(upb_fielddef *f) {
upb_string_unref(f->name);
if(upb_hasdef(f) && f->owned) {
if(f->owned) {
upb_def_unref(f->def);
}
}
@ -354,6 +336,8 @@ static void upb_fielddef_uninit(upb_fielddef *f) {
static bool upb_addfield(upb_src *src, upb_msgdef *m, upb_status *status)
{
upb_fielddef *f = malloc(sizeof(*f));
f->number = -1;
f->name = NULL;
f->def = NULL;
f->owned = false;
upb_fielddef *parsed_f;
@ -388,6 +372,7 @@ static bool upb_addfield(upb_src *src, upb_msgdef *m, upb_status *status)
}
CHECKSRC(upb_src_eof(src));
// TODO: verify that all required fields were present.
assert(f->number != -1 && f->name != NULL);
assert((f->def != NULL) == upb_hasdef(f));
// Field was successfully read, add it as a field of the msgdef.
@ -461,9 +446,9 @@ err:
static void upb_msgdef_free(upb_msgdef *m)
{
for (upb_field_count_t i = 0; i < m->num_fields; i++)
upb_fielddef_uninit(&m->fields[i]);
free(m->fields);
upb_msg_iter i;
for(i = upb_msg_begin(m); !upb_msg_done(i); i = upb_msg_next(m, i))
upb_fielddef_uninit(upb_msg_iter_field(i));
upb_strtable_free(&m->ntof);
upb_inttable_free(&m->itof);
upb_def_uninit(&m->base);
@ -479,6 +464,13 @@ static void upb_msgdef_resolve(upb_msgdef *m, upb_fielddef *f, upb_def *def) {
upb_def_ref(def);
}
upb_msg_iter upb_msg_begin(upb_msgdef *m) {
return upb_inttable_begin(&m->itof);
}
upb_msg_iter upb_msg_next(upb_msgdef *m, upb_msg_iter iter) {
return upb_inttable_next(&m->itof, &iter->e);
}
/* symtab internal ***********************************************************/
@ -601,8 +593,9 @@ static bool upb_symtab_findcycles(upb_msgdef *m, int depth, upb_status *status)
} else {
UPB_UPCAST(m)->search_depth = ++depth;
bool cycle_found = false;
for(upb_field_count_t i = 0; i < m->num_fields; i++) {
upb_fielddef *f = &m->fields[i];
upb_msg_iter i;
for(i = upb_msg_begin(m); !upb_msg_done(i); i = upb_msg_next(m, i)) {
upb_fielddef *f = upb_msg_iter_field(i);
if(!upb_issubmsg(f)) continue;
upb_def *sub_def = f->def;
upb_msgdef *sub_m = upb_downcast_msgdef(sub_def);
@ -632,8 +625,9 @@ bool upb_resolverefs(upb_strtable *tmptab, upb_strtable *symtab,
// Type names are resolved relative to the message in which they appear.
upb_string *base = e->e.key;
for(upb_field_count_t i = 0; i < m->num_fields; i++) {
upb_fielddef *f = &m->fields[i];
upb_msg_iter i;
for(i = upb_msg_begin(m); !upb_msg_done(i); i = upb_msg_next(m, i)) {
upb_fielddef *f = upb_msg_iter_field(i);
if(!upb_hasdef(f)) continue; // No resolving necessary.
upb_string *name = upb_downcast_unresolveddef(f->def)->name;
@ -873,7 +867,6 @@ typedef struct {
upb_wire_type_t wire_type;
upb_strlen_t delimited_len;
upb_strlen_t stack[UPB_MAX_NESTING], *top;
upb_string *str;
} upb_baredecoder;
static uint64_t upb_baredecoder_readv64(upb_baredecoder *d)
@ -929,6 +922,12 @@ static upb_fielddef *upb_baredecoder_getdef(upb_baredecoder *d)
return &d->field;
}
static bool upb_baredecoder_getstr(upb_baredecoder *d, upb_string *str) {
upb_string_substr(str, d->input, d->offset, d->delimited_len);
d->offset += d->delimited_len;
return true;
}
static bool upb_baredecoder_getval(upb_baredecoder *d, upb_valueptr val)
{
switch(d->wire_type) {
@ -950,11 +949,6 @@ static bool upb_baredecoder_getval(upb_baredecoder *d, upb_valueptr val)
return true;
}
static bool upb_baredecoder_getstr(upb_baredecoder *d, upb_string *str) {
upb_string_substr(str, d->input, d->offset, d->delimited_len);
return true;
}
static bool upb_baredecoder_skipval(upb_baredecoder *d)
{
upb_value val;
@ -986,7 +980,6 @@ static upb_baredecoder *upb_baredecoder_new(upb_string *str)
{
upb_baredecoder *d = malloc(sizeof(*d));
d->input = upb_string_getref(str);
d->str = upb_string_new();
d->top = &d->stack[0];
upb_src_init(&d->src, &upb_baredecoder_src_vtbl);
return d;
@ -995,7 +988,6 @@ static upb_baredecoder *upb_baredecoder_new(upb_string *str)
static void upb_baredecoder_free(upb_baredecoder *d)
{
upb_string_unref(d->input);
upb_string_unref(d->str);
free(d);
}
@ -1004,11 +996,8 @@ static upb_src *upb_baredecoder_src(upb_baredecoder *d)
return &d->src;
}
upb_symtab *upb_get_descriptor_symtab()
void upb_symtab_add_descriptorproto(upb_symtab *symtab)
{
// TODO: implement sharing of symtabs, so that successive calls to this
// function will return the same symtab.
upb_symtab *symtab = upb_symtab_new();
// TODO: allow upb_strings to be static or on the stack.
upb_string *descriptor = upb_strduplen(descriptor_pb, descriptor_pb_len);
upb_baredecoder *decoder = upb_baredecoder_new(descriptor);
@ -1017,5 +1006,4 @@ upb_symtab *upb_get_descriptor_symtab()
assert(upb_ok(&status));
upb_baredecoder_free(decoder);
upb_string_unref(descriptor);
return symtab;
}

@ -135,11 +135,6 @@ INLINE bool upb_elem_ismm(upb_fielddef *f) {
typedef struct _upb_msgdef {
upb_def base;
upb_atomic_refcount_t cycle_refcount;
size_t size;
upb_field_count_t num_fields;
uint32_t set_flags_bytes;
uint32_t num_required_fields; // Required fields have the lowest set bytemasks.
upb_fielddef *fields; // We have exclusive ownership of these.
// Tables for looking up fields by number and name.
upb_inttable itof; // int to field
@ -170,6 +165,21 @@ INLINE upb_fielddef *upb_msg_ntof(upb_msgdef *m, upb_string *name) {
return e ? e->f : NULL;
}
// Iteration over fields. The order is undefined.
// upb_msg_iter i;
// for(i = upb_msg_begin(m); !upb_msg_done(&i); i = upb_msg_next(&i)) {
// // ...
// }
typedef upb_itof_ent *upb_msg_iter;
upb_msg_iter upb_msg_begin(upb_msgdef *m);
upb_msg_iter upb_msg_next(upb_msgdef *m, upb_msg_iter iter);
INLINE bool upb_msg_done(upb_msg_iter iter) { return iter == NULL; }
INLINE upb_fielddef *upb_msg_iter_field(upb_msg_iter iter) {
return iter->f;
}
/* upb_enumdef ****************************************************************/
typedef struct _upb_enumdef {
@ -178,6 +188,16 @@ typedef struct _upb_enumdef {
upb_inttable iton;
} upb_enumdef;
typedef struct {
upb_strtable_entry e;
uint32_t value;
} upb_ntoi_ent;
typedef struct {
upb_inttable_entry e;
upb_string *string;
} upb_iton_ent;
typedef int32_t upb_enumval_t;
// Lookups from name to integer and vice-versa.
@ -186,18 +206,22 @@ upb_string *upb_enumdef_iton(upb_enumdef *e, upb_enumval_t num);
// Iteration over name/value pairs. The order is undefined.
// upb_enum_iter i;
// for(upb_enum_begin(&i, e); !upb_enum_done(&i); upb_enum_next(&i)) {
// for(i = upb_enum_begin(e); !upb_enum_done(i); i = upb_enum_next(e, i)) {
// // ...
// }
typedef struct {
upb_enumdef *e;
void *state; // Internal iteration state.
upb_string *name;
upb_enumval_t val;
} upb_enum_iter;
void upb_enum_begin(upb_enum_iter *iter, upb_enumdef *e);
void upb_enum_next(upb_enum_iter *iter);
bool upb_enum_done(upb_enum_iter *iter);
typedef upb_iton_ent *upb_enum_iter;
upb_enum_iter upb_enum_begin(upb_enumdef *e);
upb_enum_iter upb_enum_next(upb_enumdef *e, upb_enum_iter iter);
INLINE bool upb_enum_done(upb_enum_iter iter) { return iter == NULL; }
INLINE upb_string *upb_enum_iter_name(upb_enum_iter iter) {
return iter->string;
}
INLINE int32_t upb_enum_iter_number(upb_enum_iter iter) {
return iter->e.key;
}
/* upb_symtab *****************************************************************/
@ -252,10 +276,10 @@ upb_def **upb_symtab_getdefs(upb_symtab *s, int *count, upb_def_type_t type);
// more useful? Maybe it should be an option.
void upb_symtab_addfds(upb_symtab *s, upb_src *desc, upb_status *status);
// Returns a symtab that defines google.protobuf.DescriptorProto and all other
// types that are defined in descriptor.proto. This allows you to load other
// proto types. The caller owns a ref on the returned symtab.
upb_symtab *upb_get_descriptor_symtab();
// Adds defs for google.protobuf.FileDescriptorSet and friends to this symtab.
// This is necessary for bootstrapping, since these are the upb_defs that
// specify other defs and allow them to be loaded.
void upb_symtab_add_descriptorproto(upb_symtab *s);
/* upb_def casts **************************************************************/

@ -88,6 +88,7 @@ struct upb_bytesrc {
INLINE void upb_src_init(upb_src *s, upb_src_vtable *vtbl) {
s->vtbl = vtbl;
s->eof = false;
upb_status_init(&s->status);
#ifndef DEBUG
// TODO: initialize debug-mode checking.
#endif

@ -179,7 +179,7 @@ static void strinsert(upb_strtable *t, upb_strtable_entry *e)
memcpy(strent(t, empty_bucket), table_e, t->t.entry_size); /* copies next */
upb_strtable_entry *evictee_e = strent(t, evictee_bucket);
while(1) {
assert(!upb_string_isnull(evictee_e->key));
assert(evictee_e->key);
assert(evictee_e->next != UPB_END_OF_CHAIN);
if(evictee_e->next == bucket) {
evictee_e->next = empty_bucket;

@ -66,4 +66,7 @@ int main() {
upb_string_unref(str);
upb_string_unref(str2);
// Unref of NULL is harmless.
upb_string_unref(NULL);
}

Loading…
Cancel
Save