Protocol Buffers - Google's data interchange format (grpc依赖)
https://developers.google.com/protocol-buffers/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
390 lines
15 KiB
390 lines
15 KiB
/* |
|
* upb - a minimalist implementation of protocol buffers. |
|
* |
|
* Copyright (c) 2010-2011 Google Inc. See LICENSE for details. |
|
* Author: Josh Haberman <jhaberman@gmail.com> |
|
* |
|
* upb_handlers is a generic visitor-like interface for iterating over a stream |
|
* of protobuf data. You can register function pointers that will be called |
|
* for each message and/or field as the data is being parsed or iterated over, |
|
* without having to know the source format that we are parsing from. This |
|
* decouples the parsing logic from the processing logic. |
|
*/ |
|
|
|
#ifndef UPB_HANDLERS_H |
|
#define UPB_HANDLERS_H |
|
|
|
#include <limits.h> |
|
#include "upb/upb.h" |
|
#include "upb/def.h" |
|
#include "upb/bytestream.h" |
|
|
|
#ifdef __cplusplus |
|
extern "C" { |
|
#endif |
|
|
|
/* Handlers protocol definition ***********************************************/ |
|
|
|
// A upb_handlers object represents a graph of handlers. Each message can have |
|
// a set of handlers as well as a set of fields which themselves have handlers. |
|
// Fields that represent submessages or groups are linked to other message |
|
// handlers, so the overall set of handlers can form a graph structure (which |
|
// may be cyclic). |
|
// |
|
// The upb_mhandlers (message handlers) object can have the following handlers: |
|
// |
|
// static upb_flow_t startmsg(void *closure) { |
|
// // Called when the message begins. "closure" was supplied by our caller. |
|
// return UPB_CONTINUE; |
|
// } |
|
// |
|
// static void endmsg(void *closure, upb_status *status) { |
|
// // Called when processing of this message ends, whether in success or |
|
// // failure. "status" indicates the final status of processing, and can |
|
// / also be modified in-place to update the final status. |
|
// // |
|
// // Since this callback is guaranteed to always be called eventually, it |
|
// // can be used to free any resources that were allocated during processing. |
|
// } |
|
// |
|
// TODO: unknown field handler. |
|
// |
|
// The upb_fhandlers (field handlers) object can have the following handlers: |
|
// |
|
// static upb_flow_t value(void *closure, upb_value fval, upb_value val) { |
|
// // Called when the field's value is encountered. "fval" contains |
|
// // whatever value was bound to this field at registration type |
|
// // (for upb_register_all(), this will be the field's upb_fielddef*). |
|
// return UPB_CONTINUE; |
|
// } |
|
// |
|
// static upb_sflow_t startsubmsg(void *closure, upb_value fval) { |
|
// // Called when a submessage begins. The second element of the return |
|
// // value is the closure for the submessage. |
|
// return UPB_CONTINUE_WITH(closure); |
|
// } |
|
// |
|
// static upb_flow_t endsubmsg(void *closure, upb_value fval) { |
|
// // Called when a submessage ends. |
|
// return UPB_CONTINUE; |
|
// } |
|
// |
|
// static upb_sflow_t startseqmsg(void *closure, upb_value fval) { |
|
// // Called when a sequence (repeated field) begins. The second element |
|
// // of the return value is the closure for the sequence. |
|
// return UPB_CONTINUE_WITH(closure); |
|
// } |
|
// |
|
// static upb_flow_t endeqvoid *closure, upb_value fval) { |
|
// // Called when a sequence ends. |
|
// return UPB_CONTINUE; |
|
// } |
|
// |
|
// All handlers except the endmsg handler return a value from this enum, to |
|
// control whether parsing will continue or not. |
|
typedef enum { |
|
// Data source should continue calling callbacks. |
|
UPB_CONTINUE = 0, |
|
|
|
// Halt processing permanently (in a non-resumable way). The endmsg handlers |
|
// for any currently open messages will be called which can supply a more |
|
// specific status message. No further input data will be consumed. |
|
UPB_BREAK, |
|
|
|
// Skips to the end of the current submessage (or if we are at the top |
|
// level, skips to the end of the entire message). In other words, it is |
|
// like a UPB_BREAK that applies only to the current level. |
|
// |
|
// If you UPB_SKIPSUBMSG from a startmsg handler, the endmsg handler will |
|
// be called to perform cleanup and return a status. Returning |
|
// UPB_SKIPSUBMSG from a startsubmsg handler will *not* call the startmsg, |
|
// endmsg, or endsubmsg handlers. |
|
// |
|
// If UPB_SKIPSUBMSG is called from the top-level message, no further input |
|
// data will be consumed. |
|
UPB_SKIPSUBMSG, |
|
|
|
// TODO: Add UPB_SUSPEND, for resumable producers/consumers. |
|
} upb_flow_t; |
|
|
|
// The startsubmsg handler needs to also pass a closure to the submsg. |
|
typedef struct { |
|
upb_flow_t flow; |
|
void *closure; |
|
} upb_sflow_t; |
|
|
|
INLINE upb_sflow_t UPB_SFLOW(upb_flow_t flow, void *closure) { |
|
upb_sflow_t ret = {flow, closure}; |
|
return ret; |
|
} |
|
#define UPB_CONTINUE_WITH(c) UPB_SFLOW(UPB_CONTINUE, c) |
|
#define UPB_SBREAK UPB_SFLOW(UPB_BREAK, NULL) |
|
|
|
// Typedefs for all of the handler functions defined above. |
|
typedef upb_flow_t (upb_startmsg_handler)(void *c); |
|
typedef void (upb_endmsg_handler)(void *c, upb_status *status); |
|
typedef upb_flow_t (upb_value_handler)(void *c, upb_value fval, upb_value val); |
|
typedef upb_sflow_t (upb_startfield_handler)(void *closure, upb_value fval); |
|
typedef upb_flow_t (upb_endfield_handler)(void *closure, upb_value fval); |
|
|
|
|
|
/* upb_fhandlers **************************************************************/ |
|
|
|
// A upb_fhandlers object represents the set of handlers associated with one |
|
// specific message field. |
|
struct _upb_decoder; |
|
struct _upb_mhandlers; |
|
typedef struct _upb_fieldent { |
|
bool junk; |
|
upb_fieldtype_t type; |
|
bool repeated; |
|
bool is_repeated_primitive; |
|
upb_atomic_t refcount; |
|
uint32_t number; |
|
int32_t valuehasbit; |
|
struct _upb_mhandlers *msg; |
|
struct _upb_mhandlers *submsg; // Set iff upb_issubmsgtype(type) == true. |
|
upb_value fval; |
|
upb_value_handler *value; |
|
upb_startfield_handler *startsubmsg; |
|
upb_endfield_handler *endsubmsg; |
|
upb_startfield_handler *startseq; |
|
upb_endfield_handler *endseq; |
|
#ifdef UPB_USE_JIT_X64 |
|
uint32_t jit_pclabel; |
|
uint32_t jit_pclabel_notypecheck; |
|
uint32_t jit_submsg_done_pclabel; |
|
#endif |
|
void (*decode)(struct _upb_decoder *d, struct _upb_fieldent *f); |
|
} upb_fhandlers; |
|
|
|
// fhandlers are created as part of a upb_handlers instance, but can be ref'd |
|
// and unref'd to prolong the life of the handlers. |
|
void upb_fhandlers_ref(upb_fhandlers *m); |
|
void upb_fhandlers_unref(upb_fhandlers *m); |
|
|
|
// upb_fhandlers accessors |
|
#define UPB_FHANDLERS_ACCESSORS(name, type) \ |
|
INLINE void upb_fhandlers_set ## name(upb_fhandlers *f, type v){f->name = v;} \ |
|
INLINE type upb_fhandlers_get ## name(upb_fhandlers *f) { return f->name; } |
|
UPB_FHANDLERS_ACCESSORS(fval, upb_value) |
|
UPB_FHANDLERS_ACCESSORS(value, upb_value_handler*) |
|
UPB_FHANDLERS_ACCESSORS(startsubmsg, upb_startfield_handler*) |
|
UPB_FHANDLERS_ACCESSORS(endsubmsg, upb_endfield_handler*) |
|
UPB_FHANDLERS_ACCESSORS(startseq, upb_startfield_handler*) |
|
UPB_FHANDLERS_ACCESSORS(endseq, upb_endfield_handler*) |
|
UPB_FHANDLERS_ACCESSORS(msg, struct _upb_mhandlers*) |
|
UPB_FHANDLERS_ACCESSORS(submsg, struct _upb_mhandlers*) |
|
// If set to >= 0, the hasbit will automatically be set after the corresponding |
|
// callback is called (when a JIT is enabled, this can be significantly more |
|
// efficient than setting the hasbit yourself inside the callback). Could add |
|
// this for seq and submsg also, but doesn't look like a win at the moment. |
|
UPB_FHANDLERS_ACCESSORS(valuehasbit, int32_t) |
|
|
|
|
|
/* upb_mhandlers **************************************************************/ |
|
|
|
// A upb_mhandlers object represents the set of handlers associated with a |
|
// message in the graph of messages. |
|
|
|
typedef struct _upb_mhandlers { |
|
upb_atomic_t refcount; |
|
upb_startmsg_handler *startmsg; |
|
upb_endmsg_handler *endmsg; |
|
upb_inttable fieldtab; // Maps field number -> upb_fhandlers. |
|
bool is_group; |
|
#ifdef UPB_USE_JIT_X64 |
|
uint32_t jit_startmsg_pclabel; |
|
uint32_t jit_endofbuf_pclabel; |
|
uint32_t jit_endofmsg_pclabel; |
|
uint32_t jit_unknownfield_pclabel; |
|
int32_t jit_parent_field_done_pclabel; |
|
uint32_t max_field_number; |
|
// Currently keyed on field number. Could also try keying it |
|
// on encoded or decoded tag, or on encoded field number. |
|
void **tablearray; |
|
#endif |
|
} upb_mhandlers; |
|
|
|
// mhandlers are created as part of a upb_handlers instance, but can be ref'd |
|
// and unref'd to prolong the life of the handlers. |
|
void upb_mhandlers_ref(upb_mhandlers *m); |
|
void upb_mhandlers_unref(upb_mhandlers *m); |
|
|
|
// Creates a new field with the given name and number. There must not be an |
|
// existing field with either this name or number or abort() will be called. |
|
// TODO: this should take a name also. |
|
upb_fhandlers *upb_mhandlers_newfhandlers(upb_mhandlers *m, uint32_t n, |
|
upb_fieldtype_t type, bool repeated); |
|
// Like the previous but for MESSAGE or GROUP fields. For GROUP fields, the |
|
// given submessage must not have any fields with this field number. |
|
upb_fhandlers *upb_mhandlers_newfhandlers_subm(upb_mhandlers *m, uint32_t n, |
|
upb_fieldtype_t type, |
|
bool repeated, |
|
upb_mhandlers *subm); |
|
|
|
// upb_mhandlers accessors. |
|
#define UPB_MHANDLERS_ACCESSORS(name, type) \ |
|
INLINE void upb_mhandlers_set ## name(upb_mhandlers *m, type v){m->name = v;} \ |
|
INLINE type upb_mhandlers_get ## name(upb_mhandlers *m) { return m->name; } |
|
UPB_MHANDLERS_ACCESSORS(startmsg, upb_startmsg_handler*); |
|
UPB_MHANDLERS_ACCESSORS(endmsg, upb_endmsg_handler*); |
|
|
|
|
|
/* upb_handlers ***************************************************************/ |
|
|
|
struct _upb_handlers { |
|
upb_atomic_t refcount; |
|
upb_mhandlers **msgs; // Array of msgdefs, [0]=toplevel. |
|
int msgs_len, msgs_size; |
|
bool should_jit; |
|
}; |
|
typedef struct _upb_handlers upb_handlers; |
|
|
|
upb_handlers *upb_handlers_new(void); |
|
void upb_handlers_ref(upb_handlers *h); |
|
void upb_handlers_unref(upb_handlers *h); |
|
|
|
// Appends a new message to the graph of handlers and returns it. This message |
|
// can be obtained later at index upb_handlers_msgcount()-1. All handlers will |
|
// be initialized to no-op handlers. |
|
upb_mhandlers *upb_handlers_newmhandlers(upb_handlers *h); |
|
upb_mhandlers *upb_handlers_getmhandlers(upb_handlers *h, int index); |
|
|
|
// Convenience function for registering handlers for all messages and |
|
// fields in a msgdef and all its children. For every registered message |
|
// "msgreg_cb" will be called with the newly-created mhandlers, and likewise |
|
// with "fieldreg_cb" |
|
// |
|
// See upb_handlers_reghandlerset() below for an example. |
|
typedef void upb_onmsgreg(void *closure, upb_mhandlers *mh, upb_msgdef *m); |
|
typedef void upb_onfieldreg(void *closure, upb_fhandlers *mh, upb_fielddef *m); |
|
upb_mhandlers *upb_handlers_regmsgdef(upb_handlers *h, upb_msgdef *m, |
|
upb_onmsgreg *msgreg_cb, |
|
upb_onfieldreg *fieldreg_cb, |
|
void *closure); |
|
|
|
// Convenience function for registering a set of handlers for all messages and |
|
// fields in a msgdef and its children, with the fval bound to the upb_fielddef. |
|
// Any of the handlers may be NULL, in which case no callback will be set and |
|
// the nop callback will be used. |
|
typedef struct { |
|
upb_startmsg_handler *startmsg; |
|
upb_endmsg_handler *endmsg; |
|
upb_value_handler *value; |
|
upb_startfield_handler *startsubmsg; |
|
upb_endfield_handler *endsubmsg; |
|
upb_startfield_handler *startseq; |
|
upb_endfield_handler *endseq; |
|
} upb_handlerset; |
|
|
|
INLINE void upb_onmreg_hset(void *c, upb_mhandlers *mh, upb_msgdef *m) { |
|
(void)m; |
|
upb_handlerset *hs = (upb_handlerset*)c; |
|
if (hs->startmsg) upb_mhandlers_setstartmsg(mh, hs->startmsg); |
|
if (hs->endmsg) upb_mhandlers_setendmsg(mh, hs->endmsg); |
|
} |
|
INLINE void upb_onfreg_hset(void *c, upb_fhandlers *fh, upb_fielddef *f) { |
|
upb_handlerset *hs = (upb_handlerset*)c; |
|
if (hs->value) upb_fhandlers_setvalue(fh, hs->value); |
|
if (hs->startsubmsg) upb_fhandlers_setstartsubmsg(fh, hs->startsubmsg); |
|
if (hs->endsubmsg) upb_fhandlers_setendsubmsg(fh, hs->endsubmsg); |
|
if (hs->startseq) upb_fhandlers_setstartseq(fh, hs->startseq); |
|
if (hs->endseq) upb_fhandlers_setendseq(fh, hs->endseq); |
|
upb_value val; |
|
upb_value_setfielddef(&val, f); |
|
upb_fhandlers_setfval(fh, val); |
|
} |
|
INLINE upb_mhandlers *upb_handlers_reghandlerset(upb_handlers *h, upb_msgdef *m, |
|
upb_handlerset *hs) { |
|
return upb_handlers_regmsgdef(h, m, &upb_onmreg_hset, &upb_onfreg_hset, hs); |
|
} |
|
|
|
|
|
/* upb_dispatcher *************************************************************/ |
|
|
|
// upb_dispatcher can be used by sources of data to invoke the appropriate |
|
// handlers on a upb_handlers object. Besides maintaining the runtime stack of |
|
// closures and handlers, the dispatcher checks the return status of user |
|
// callbacks and properly handles statuses other than UPB_CONTINUE, invoking |
|
// "skip" or "exit" handlers on the underlying data source as appropriate. |
|
|
|
typedef struct { |
|
upb_fhandlers *f; |
|
void *closure; |
|
|
|
// Members to use as the data source requires. |
|
void *srcclosure; |
|
uint64_t end_ofs; |
|
uint16_t msgindex; |
|
uint16_t fieldindex; |
|
|
|
bool is_sequence; // frame represents seq or submsg? (f might be both). |
|
bool is_packed; // !upb_issubmsg(f) && end_ofs != UINT64_MAX (strings aren't pushed) |
|
} upb_dispatcher_frame; |
|
|
|
// Called when some of the input needs to be skipped. All frames from |
|
// top to bottom, inclusive, should be skipped. |
|
typedef void upb_skip_handler(void *, upb_dispatcher_frame *top, |
|
upb_dispatcher_frame *bottom); |
|
typedef void upb_exit_handler(void *); |
|
|
|
typedef struct { |
|
upb_dispatcher_frame *top, *limit; |
|
|
|
upb_handlers *handlers; |
|
|
|
// Msg and dispatch table for the current level. |
|
upb_mhandlers *msgent; |
|
upb_inttable *dispatch_table; |
|
upb_skip_handler *skip; |
|
upb_exit_handler *exit; |
|
void *srcclosure; |
|
|
|
// Stack. |
|
upb_status status; |
|
upb_dispatcher_frame stack[UPB_MAX_NESTING]; |
|
} upb_dispatcher; |
|
|
|
void upb_dispatcher_init(upb_dispatcher *d, upb_handlers *h, |
|
upb_skip_handler *skip, upb_exit_handler *exit, |
|
void *closure); |
|
upb_dispatcher_frame *upb_dispatcher_reset(upb_dispatcher *d, void *topclosure); |
|
void upb_dispatcher_uninit(upb_dispatcher *d); |
|
|
|
// Tests whether the runtime stack is in the base level message. |
|
bool upb_dispatcher_stackempty(upb_dispatcher *d); |
|
|
|
// Looks up a field by number for the current message. |
|
INLINE upb_fhandlers *upb_dispatcher_lookup(upb_dispatcher *d, uint32_t n) { |
|
return (upb_fhandlers*)upb_inttable_fastlookup( |
|
d->dispatch_table, n, sizeof(upb_fhandlers)); |
|
} |
|
|
|
void _upb_dispatcher_unwind(upb_dispatcher *d, upb_flow_t flow); |
|
|
|
INLINE void _upb_dispatcher_sethas(void *_p, int32_t hasbit) { |
|
char *p = (char*)_p; |
|
if (hasbit >= 0) p[hasbit / 8] |= (1 << (hasbit % 8)); |
|
} |
|
|
|
// Dispatch functions -- call the user handler and handle errors. |
|
INLINE void upb_dispatch_value(upb_dispatcher *d, upb_fhandlers *f, |
|
upb_value val) { |
|
upb_flow_t flow = UPB_CONTINUE; |
|
if (f->value) flow = f->value(d->top->closure, f->fval, val); |
|
_upb_dispatcher_sethas(d->top->closure, f->valuehasbit); |
|
if (flow != UPB_CONTINUE) _upb_dispatcher_unwind(d, flow); |
|
} |
|
void upb_dispatch_startmsg(upb_dispatcher *d); |
|
void upb_dispatch_endmsg(upb_dispatcher *d, upb_status *status); |
|
upb_dispatcher_frame *upb_dispatch_startsubmsg(upb_dispatcher *d, upb_fhandlers *f); |
|
upb_dispatcher_frame *upb_dispatch_endsubmsg(upb_dispatcher *d); |
|
upb_dispatcher_frame *upb_dispatch_startseq(upb_dispatcher *d, upb_fhandlers *f); |
|
upb_dispatcher_frame *upb_dispatch_endseq(upb_dispatcher *d); |
|
|
|
#ifdef __cplusplus |
|
} /* extern "C" */ |
|
#endif |
|
|
|
#endif
|
|
|