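// NOTE(review): the lines in this comment appear to be repository-page text
// captured together with the file; they are not part of the upb header.
//
// Protocol Buffers - Google's data interchange format (gRPC dependency)
// https://developers.google.com/protocol-buffers/
// You can not select more than 25 topics. Topics must start with a letter or
// number, can include dashes ('-') and can be up to 35 characters long.
//
// 1013 lines
// 41 KiB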

/*
* upb - a minimalist implementation of protocol buffers.
*
* Copyright (c) 2010-2012 Google Inc. See LICENSE for details.
* Author: Josh Haberman <jhaberman@gmail.com>
*
* A upb_handlers is like a virtual table for a upb_msgdef. Each field of the
* message can have associated functions that will be called when we are
* parsing or visiting a stream of data. This is similar to how handlers work
* in SAX (the Simple API for XML).
*
* The handlers have no idea where the data is coming from, so a single set of
* handlers could be used with two completely different data sources (for
* example, a parser and a visitor over in-memory objects). This decoupling is
* the most important feature of upb, because it allows parsers and serializers
* to be highly reusable.
*
* This is a mixed C/C++ interface that offers a full API to both languages.
* See the top-level README for more information.
*/
#ifndef UPB_HANDLERS_H
#define UPB_HANDLERS_H
#include "upb/def.h"
// Forward declarations of the three types this header is built around.  The
// same C names (upb_frametype, upb_handlers, upb_sinkframe) are usable from
// both languages; only what they alias differs.
#ifdef __cplusplus
// C++ view: Handlers and SinkFrame are classes in namespace upb, FrameType is
// an alias for the global struct, and the C names are typedefs for the upb::
// names so that both spellings denote the same types.
struct upb_frametype;
namespace upb {
typedef upb_frametype FrameType;
class Handlers;
class SinkFrame;
}
typedef upb::FrameType upb_frametype;
typedef upb::Handlers upb_handlers;
typedef upb::SinkFrame upb_sinkframe;
// Declared before upb::Handlers is defined because the class names this
// function as a friend.
UPB_INLINE void *upb_sinkframe_handlerdata(const upb_sinkframe* frame);
#else
// C view: the same names are plain struct types.
struct upb_frametype;
struct upb_handlers;
struct upb_sinkframe;
typedef struct upb_frametype upb_frametype;
typedef struct upb_handlers upb_handlers;
typedef struct upb_sinkframe upb_sinkframe;
#endif
// All the different types of handlers that can be registered.
// Only needed for the advanced functions in upb::Handlers.
//
// The values are contiguous and start at zero; UPB_HANDLER_MAX relies on
// UPB_HANDLER_ENDSEQ being the last one.
typedef enum {
  // Value handlers, one per primitive value type.
  UPB_HANDLER_INT32 = 0,
  UPB_HANDLER_INT64 = 1,
  UPB_HANDLER_UINT32 = 2,
  UPB_HANDLER_UINT64 = 3,
  UPB_HANDLER_FLOAT = 4,
  UPB_HANDLER_DOUBLE = 5,
  UPB_HANDLER_BOOL = 6,

  // String handlers: start of string, a buffer of string data, end of string.
  UPB_HANDLER_STARTSTR = 7,
  UPB_HANDLER_STRING = 8,
  UPB_HANDLER_ENDSTR = 9,

  // Submessage start/end handlers.
  UPB_HANDLER_STARTSUBMSG = 10,
  UPB_HANDLER_ENDSUBMSG = 11,

  // Sequence (repeated field) start/end handlers.
  UPB_HANDLER_STARTSEQ = 12,
  UPB_HANDLER_ENDSEQ = 13
} upb_handlertype_t;

// One past the largest upb_handlertype_t value, i.e. the number of handler
// types.
#define UPB_HANDLER_MAX (UPB_HANDLER_ENDSEQ + 1)
// Returned from a handler that yields a void* closure (the start* handlers) to
// interrupt processing.
#define UPB_BREAK NULL

// A convenient definition for when no closure is needed: the address of a
// dummy object.  The replacement list is parenthesized so that the macro
// always expands to a single primary expression, whatever operators the
// caller writes next to it.
extern char _upb_noclosure;
#define UPB_NO_CLOSURE (&_upb_noclosure)

// A selector refers to a specific field handler in the Handlers object
// (for example: the STARTSUBMSG handler for field "field15").
typedef int32_t upb_selector_t;
#ifdef __cplusplus
// A upb::Handlers object represents the set of handlers associated with a
// message in the graph of messages.  You can think of it as a big virtual
// table with functions corresponding to all the events that can fire while
// parsing or visiting a message of a specific type.
//
// Any handlers that are not set behave as if they had successfully consumed
// the value.  For start* handlers that return a void* closure, an unset handler
// will propagate the existing closure.
//
// In C the same object is the plain struct upb_handlers; the data members at
// the bottom of this definition are shared by both views.
class upb::Handlers {
 public:
  typedef upb_selector_t Selector;
  typedef upb_handlertype_t Type;

  // Function types for the message-, field- and string-level handlers.  Each
  // is documented next to the setter that registers it.
  typedef bool StartMessageHandler(const SinkFrame*);
  typedef void EndMessageHandler(const SinkFrame*, Status* status);
  typedef void* StartFieldHandler(const SinkFrame*);
  typedef bool EndFieldHandler(const SinkFrame*);
  typedef void* StartStringHandler(const SinkFrame* c, size_t size_hint);
  typedef size_t StringHandler(const SinkFrame* c, const char* buf, size_t len);

  // Value<T>::Handler is the function type of a value handler for a primitive
  // of type T.
  template <class T> struct Value {
    typedef bool Handler(const SinkFrame*, T val);
  };

  typedef Value<upb_int32_t>::Handler Int32Handler;
  typedef Value<upb_int64_t>::Handler Int64Handler;
  typedef Value<upb_uint32_t>::Handler UInt32Handler;
  typedef Value<upb_uint64_t>::Handler UInt64Handler;
  typedef Value<float>::Handler FloatHandler;
  typedef Value<double>::Handler DoubleHandler;
  typedef Value<bool>::Handler BoolHandler;

#ifdef UPB_TWO_32BIT_TYPES
  typedef Value<upb_int32alt_t>::Handler Int32Handler2;
  typedef Value<upb_uint32alt_t>::Handler UInt32Handler2;
#endif

#ifdef UPB_TWO_64BIT_TYPES
  typedef Value<upb_int64alt_t>::Handler Int64Handler2;
  typedef Value<upb_uint64alt_t>::Handler UInt64Handler2;
#endif

  // Any function pointer can be converted to this and converted back to its
  // correct type.
  typedef void GenericFunction();

  // For freeing handler data.
  typedef void Free(void *data);

  // Callback type used by NewFrozen() to let the client register handlers.
  typedef void HandlersCallback(void *closure, upb_handlers *h);

  // Returns a new handlers object for the given frozen msgdef that will use
  // the given FrameType as its top-level state (can be NULL, for now).  A
  // single ref on the returned object will belong to the given owner.
  // Returns NULL if memory allocation failed.
  static Handlers* New(const MessageDef* m,
                       const FrameType* ft,
                       const void *owner);

  // Convenience function for registering a graph of handlers that mirrors the
  // graph of msgdefs for some message.  For "m" and all its children a new set
  // of handlers will be created and the given callback will be invoked,
  // allowing the client to register handlers for this message.  Note that any
  // subhandlers set by the callback will be overwritten.  A single ref on the
  // returned object will belong to the given owner.
  static const Handlers* NewFrozen(const MessageDef *m,
                                   const FrameType* ft,
                                   const void *owner,
                                   HandlersCallback *callback, void *closure);

  // Functionality from upb::RefCounted.
  bool IsFrozen() const;
  void Ref(const void* owner) const;
  void Unref(const void* owner) const;
  void DonateRef(const void *from, const void *to) const;
  void CheckRef(const void *owner) const;

  // Top-level frame type.
  const FrameType* frame_type() const;

  // Freezes the given set of handlers.  You may not freeze a handler without
  // also freezing any handlers they point to.  In the future we may want to
  // require that all fields of the submessage have had subhandlers set for
  // them.
  static bool Freeze(Handlers*const* handlers, int n, Status* s);

  // Returns the msgdef associated with this handlers object.
  const MessageDef* message_def() const;

  // Sets the startmsg handler for the message, which is defined as follows:
  //
  //   bool startmsg(const upb::SinkFrame* frame) {
  //     // Called when the message begins.  Returns true if processing should
  //     // continue.
  //     return true;
  //   }
  void SetStartMessageHandler(StartMessageHandler *handler);
  // Returns the startmsg handler for the message.
  StartMessageHandler *GetStartMessageHandler() const;

  // Sets the endmsg handler for the message, which is defined as follows:
  //
  //   void endmsg(const upb::SinkFrame* frame, upb_status *status) {
  //     // Called when processing of this message ends, whether in success or
  //     // failure.  "status" indicates the final status of processing, and
  //     // can also be modified in-place to update the final status.
  //   }
  void SetEndMessageHandler(EndMessageHandler *handler);
  // Returns the endmsg handler for the message.
  EndMessageHandler *GetEndMessageHandler() const;

  // Sets the value handler for the given field, which is defined as follows
  // (this is for an int32 field; other field types will pass their native
  // C/C++ type for "val"):
  //
  //   bool value(const upb::SinkFrame *frame, upb_int32_t val) {
  //     // Called when the field's value is encountered.  "d" contains
  //     // whatever data was bound to this field when it was registered.
  //     // Returns true if processing should continue.
  //     return true;
  //   }
  //
  // The value type must exactly match f->type().
  // For example, SetInt32Handler() may only be used for fields of type
  // UPB_TYPE_INT32 and UPB_TYPE_ENUM.
  //
  // "d" is the data that will be bound to this callback and passed to it.
  // If "fr" is non-NULL it will be run when the data is no longer needed.
  //
  // Returns "false" if "f" does not belong to this message or has the wrong
  // type for this handler.
  //
  // NOTE: the prototype above uses "upb_int32_t" and not "int32_t" from
  // stdint.h.  For C++ any int32 typedef will work correctly thanks to
  // function overloading on the function pointer type.  But in C things are
  // more complicated; "int" and "long" could both be 32-bit types, but the
  // two are incompatible with each other when it comes to function pointers.
  // Since we don't know what the underlying type of int32_t is, we have to
  // define our own which we *do* know the underlying type of.  The easiest
  // and most portable choice is to define handlers in C with the upb_intXX_t
  // types.
  bool SetInt32Handler (const FieldDef* f, Int32Handler* h, void* d, Free* fr);
  bool SetInt64Handler (const FieldDef* f, Int64Handler* h, void* d, Free* fr);
  bool SetUInt32Handler(const FieldDef* f, UInt32Handler* h, void* d, Free* fr);
  bool SetUInt64Handler(const FieldDef* f, UInt64Handler* h, void* d, Free* fr);
  bool SetFloatHandler (const FieldDef* f, FloatHandler* h, void* d, Free* fr);
  bool SetDoubleHandler(const FieldDef* f, DoubleHandler* h, void* d, Free* fr);
  bool SetBoolHandler (const FieldDef* f, BoolHandler* h, void* d, Free* fr);

  // Convenience versions that look up the field by name first.  These return
  // false if no field with this name exists, or for any of the other reasons
  // that the FieldDef* version returns false.
  bool SetInt32Handler (const char *name, Int32Handler* h, void* d, Free* fr);
  bool SetInt64Handler (const char *name, Int64Handler* h, void* d, Free* fr);
  bool SetUInt32Handler(const char *name, UInt32Handler* h, void* d, Free* fr);
  bool SetUInt64Handler(const char *name, UInt64Handler* h, void* d, Free* fr);
  bool SetFloatHandler (const char *name, FloatHandler* h, void* d, Free* fr);
  bool SetDoubleHandler(const char *name, DoubleHandler* h, void* d, Free* fr);
  bool SetBoolHandler (const char *name, BoolHandler* h, void* d, Free* fr);

  // On platforms where there are two 32-bit or 64-bit integer types, provide
  // registration functions for both.  Function overloading should make this
  // all transparent to the user.
#ifdef UPB_TWO_32BIT_TYPES
  bool SetInt32Handler (const FieldDef* f, Int32Handler2* h, void* d, Free* x);
  bool SetUInt32Handler(const FieldDef* f, UInt32Handler2* h, void* d, Free* x);
  bool SetInt32Handler (const char *name, Int32Handler2* h, void* d, Free* x);
  bool SetUInt32Handler(const char *name, UInt32Handler2* h, void* d, Free* x);
#endif

#ifdef UPB_TWO_64BIT_TYPES
  bool SetInt64Handler (const FieldDef* f, Int64Handler2* h, void* d, Free* x);
  bool SetUInt64Handler(const FieldDef* f, UInt64Handler2* h, void* d, Free* x);
  bool SetInt64Handler (const char *name, Int64Handler2* h, void* d, Free* x);
  bool SetUInt64Handler(const char *name, UInt64Handler2* h, void* d, Free* x);
#endif

  // Like the above, but these are templated on the type of the value.  For
  // example, templating on int64_t is equivalent to calling SetInt64Handler.
  // Attempts to template on a type that does not map to a UPB_TYPE_* type
  // (like int8_t, since protobufs have no 8-bit type) will get an "undefined
  // function" compilation error.
  template<class T> bool SetValueHandler(
      const FieldDef* f, typename Value<T>::Handler* h, void* d, Free* fr);
  template<class T> bool SetValueHandler(
      const char* name, typename Value<T>::Handler* h, void* d, Free* fr);

  // Sets handlers for a string field, which are defined as follows:
  //
  //   void* startstr(const upb::SinkFrame *frame, size_t size_hint) {
  //     // Called when a string value begins.  The return value indicates the
  //     // closure for the string.  "size_hint" indicates the size of the
  //     // string if it is known, however if the string is length-delimited
  //     // and the end-of-string is not available size_hint will be zero.
  //     // This case is indistinguishable from the case where the size is
  //     // known to be zero.
  //     //
  //     // TODO(haberman): is it important to distinguish these cases?
  //     // If we had ssize_t as a type we could make -1 "unknown", but
  //     // ssize_t is POSIX (not ANSI) and therefore less portable.
  //     // In practice I suspect it won't be important to distinguish.
  //     return closure;
  //   }
  //
  //   size_t str(const upb::SinkFrame* frame, const char *str, size_t len) {
  //     // Called for each buffer of string data; the multiple physical buffers
  //     // are all part of the same logical string.  The return value indicates
  //     // how many bytes were consumed.  If this number is less than "len",
  //     // this will also indicate that processing should be halted for now,
  //     // like returning false or UPB_BREAK from any other callback.  If this
  //     // number is greater than "len", the excess bytes will be skipped over
  //     // and not passed to the callback.
  //     return len;
  //   }
  //
  //   bool endstr(const upb::SinkFrame* frame) {
  //     // Called when a string value ends.
  //     return true;
  //   }
  bool SetStartStringHandler(const FieldDef* f, StartStringHandler* h,
                             void* d, Free* fr);
  bool SetStringHandler(const FieldDef* f, StringHandler* h, void* d, Free* fr);
  bool SetEndStringHandler(const FieldDef* f, EndFieldHandler* h,
                           void* d, Free* fr);

  // Convenience versions that look up the field by name first.  These return
  // false if no field with this name exists, or for any of the other reasons
  // that the FieldDef* version returns false.
  bool SetStartStringHandler(const char* name, StartStringHandler* h,
                             void* d, Free* fr);
  bool SetStringHandler(const char* name, StringHandler* h, void* d, Free* fr);
  bool SetEndStringHandler(const char* name, EndFieldHandler* h,
                           void* d, Free* fr);

  // Sets the startseq handler, which is defined as follows:
  //
  //   void *startseq(const upb::SinkFrame* frame) {
  //     // Called when a sequence (repeated field) begins.  The returned
  //     // pointer indicates the closure for the sequence (or UPB_BREAK
  //     // to interrupt processing).
  //     return closure;
  //   }
  //
  // Returns "false" if "f" does not belong to this message or is not a
  // repeated field.
  //
  // "data" is the data that will be bound to this callback and passed to it.
  // If "cleanup" is non-NULL it will be run when the data is no longer needed.
  bool SetStartSequenceHandler(const FieldDef* f, StartFieldHandler *handler,
                               void* data, Free* cleanup);
  bool SetStartSequenceHandler(const char* name, StartFieldHandler *handler,
                               void* data, Free* cleanup);

  // Sets the startsubmsg handler for the given field, which is defined as
  // follows:
  //
  //   void *startsubmsg(const upb::SinkFrame *frame) {
  //     // Called when a submessage begins.  The returned pointer indicates the
  //     // closure for the submessage (or UPB_BREAK to interrupt processing).
  //     return closure;
  //   }
  //
  // "data" is the data that will be bound to this callback and passed to it.
  // If "cleanup" is non-NULL it will be run when the data is no longer needed.
  //
  // Returns "false" if "f" does not belong to this message or is not a
  // submessage/group field.
  bool SetStartSubMessageHandler(const FieldDef* f, StartFieldHandler *handler,
                                 void* data, Free* cleanup);
  bool SetStartSubMessageHandler(const char* name, StartFieldHandler *handler,
                                 void* data, Free* cleanup);

  // Sets the endsubmsg handler for the given field, which is defined as
  // follows:
  //
  //   bool endsubmsg(const upb::SinkFrame *frame) {
  //     // Called when a submessage ends.  Returns true to continue processing.
  //     return true;
  //   }
  //
  // "data" is the data that will be bound to this callback and passed to it.
  // If "cleanup" is non-NULL it will be run when the data is no longer needed.
  //
  // Returns "false" if "f" does not belong to this message or is not a
  // submessage/group field.
  bool SetEndSubMessageHandler(const FieldDef* f, EndFieldHandler *handler,
                               void* data, Free* cleanup);
  bool SetEndSubMessageHandler(const char* name, EndFieldHandler *handler,
                               void* data, Free* cleanup);

  // Sets the endseq handler for the given field, which is defined as
  // follows:
  //
  //   bool endseq(const upb::SinkFrame *frame) {
  //     // Called when a sequence ends.  Returns true to continue processing.
  //     return true;
  //   }
  //
  // "data" is the data that will be bound to this callback and passed to it.
  // If "cleanup" is non-NULL it will be run when the data is no longer needed.
  //
  // Returns "false" if "f" does not belong to this message or is not a
  // repeated field.
  bool SetEndSequenceHandler(const FieldDef* f, EndFieldHandler *handler,
                             void* data, Free* cleanup);
  bool SetEndSequenceHandler(const char* name, EndFieldHandler *handler,
                             void* data, Free* cleanup);

  // Sets or gets the object that specifies handlers for the given field, which
  // must be a submessage or group.  Returns NULL if no handlers are set.
  bool SetSubHandlers(const FieldDef* f, const Handlers* sub);
  const Handlers* GetSubHandlers(const FieldDef* f) const;

  // Equivalent to GetSubHandlers, but takes the STARTSUBMSG selector for the
  // field.
  const Handlers* GetSubHandlers(Selector startsubmsg) const;

  // A selector refers to a specific field handler in the Handlers object
  // (for example: the STARTSUBMSG handler for field "field15").
  // On success, returns true and stores the selector in "s".
  // If the FieldDef or Type are invalid, returns false.
  // The returned selector is ONLY valid for Handlers whose MessageDef
  // contains this FieldDef.
  static bool GetSelector(const FieldDef* f, Type type, Selector* s);

  // Given a START selector of any kind, returns the corresponding END selector.
  static Selector GetEndSelector(Selector start_selector);

  // Returns the function pointer for this handler.  It is the client's
  // responsibility to cast to the correct function type before calling it.
  GenericFunction* GetHandler(Selector selector);

  // Returns the handler data that was registered with this handler.
  void* GetHandlerData(Selector selector);

  // Gets the byte offset from a Handlers* where the given handler can be found.
  // Useful for JITs that want to read the pointer in their fast path.
  static size_t GetHandlerOffset(Selector selector);

  // Could add any of the following functions as-needed, with some minor
  // implementation changes:
  //
  // const FieldDef* GetFieldDef(Selector selector);
  // static bool IsSequence(Selector selector);

 private:
  UPB_DISALLOW_POD_OPS(Handlers);

  // Needs access to the private data members below.
  friend void* ::upb_sinkframe_handlerdata(const upb_sinkframe* frame);

#else
struct upb_handlers {
#endif
  // Data members shared by the C struct and the C++ class.  In C++ they fall
  // under the private: section above.
  upb_refcounted base;      // Reference-counting base object.
  const upb_msgdef *msg;    // Presumably what message_def() returns; confirm.
  const upb_frametype *ft;  // Presumably what frame_type() returns; confirm.
  bool (*startmsg)(const upb_sinkframe*);             // startmsg handler.
  void (*endmsg)(const upb_sinkframe*, upb_status*);  // endmsg handler.
  void *fh_base[1];  // Start of dynamically-sized field handler array.
};
// Native C API.
#ifdef __cplusplus
extern "C" {
#endif
// Handler function types for C clients.  Their signatures match the
// corresponding typedefs inside upb::Handlers (StartMessageHandler,
// EndMessageHandler, StartFieldHandler, EndFieldHandler, HandlersCallback,
// Free).
typedef bool upb_startmsg_handler(const upb_sinkframe *frame);
typedef void upb_endmsg_handler(const upb_sinkframe *frame, upb_status *status);
typedef void* upb_startfield_handler(const upb_sinkframe *frame);
typedef bool upb_endfield_handler(const upb_sinkframe *frame);
typedef void upb_handlers_callback(void *closure, upb_handlers *h);
typedef void upb_handlerfree(void *d);
// Generic function type returned by upb_handlers_gethandler(); callers cast
// it back to the handler's real type.
typedef void upb_func();
// Value handlers, one per primitive type.  These use the upb_intXX_t types
// rather than the stdint.h ones; see the NOTE on the value-handler setters in
// upb::Handlers for why.
typedef bool upb_int32_handler(const upb_sinkframe *f, upb_int32_t val);
typedef bool upb_int64_handler(const upb_sinkframe *f, upb_int64_t val);
typedef bool upb_uint32_handler(const upb_sinkframe *f, upb_uint32_t val);
typedef bool upb_uint64_handler(const upb_sinkframe *f, upb_uint64_t val);
typedef bool upb_float_handler(const upb_sinkframe *f, float val);
typedef bool upb_double_handler(const upb_sinkframe *f, double val);
typedef bool upb_bool_handler(const upb_sinkframe *f, bool val);
// String handlers: start of string, and one buffer of string data.
typedef void* upb_startstr_handler(const upb_sinkframe *f, size_t size_hint);
typedef size_t upb_string_handler(
const upb_sinkframe *f, const char *buf, size_t n);
// Handler types for the alternate 32-bit integer types, on platforms that
// define UPB_TWO_32BIT_TYPES.
#ifdef UPB_TWO_32BIT_TYPES
typedef bool upb_int32_handler2(const upb_sinkframe *f, upb_int32alt_t val);
typedef bool upb_uint32_handler2(const upb_sinkframe *f, upb_uint32alt_t val);
#endif
// Likewise for the alternate 64-bit integer types.
#ifdef UPB_TWO_64BIT_TYPES
typedef bool upb_int64_handler2(const upb_sinkframe *f, upb_int64alt_t val);
typedef bool upb_uint64_handler2(const upb_sinkframe *f, upb_uint64alt_t val);
#endif
// Construction.  upb::Handlers::New() and upb::Handlers::NewFrozen() forward
// to these; see their documentation in the class for ownership semantics.
upb_handlers *upb_handlers_new(const upb_msgdef *m,
const upb_frametype *ft,
const void *owner);
const upb_handlers *upb_handlers_newfrozen(const upb_msgdef *m,
const upb_frametype *ft,
const void *owner,
upb_handlers_callback *callback,
void *closure);
// From upb_refcounted.
void upb_handlers_unref(const upb_handlers *h, const void *owner);
bool upb_handlers_isfrozen(const upb_handlers *h);
void upb_handlers_ref(const upb_handlers *h, const void *owner);
void upb_handlers_donateref(
const upb_handlers *h, const void *from, const void *to);
void upb_handlers_checkref(const upb_handlers *h, const void *owner);
// Freezes the "n" handlers objects in "handlers" (backs
// upb::Handlers::Freeze()).
bool upb_handlers_freeze(upb_handlers *const*handlers, int n, upb_status *s);
// Accessors backing upb::Handlers::message_def() and frame_type().
const upb_msgdef *upb_handlers_msgdef(const upb_handlers *h);
const upb_frametype *upb_handlers_frametype(const upb_handlers *h);
// Message-level startmsg/endmsg handlers.
void upb_handlers_setstartmsg(upb_handlers *h, upb_startmsg_handler *handler);
upb_startmsg_handler *upb_handlers_getstartmsg(const upb_handlers *h);
void upb_handlers_setendmsg(upb_handlers *h, upb_endmsg_handler *handler);
upb_endmsg_handler *upb_handlers_getendmsg(const upb_handlers *h);
// Per-field handler setters.  Each takes the field, the handler, the data "d"
// to bind to it and an optional free function "fr" for that data.  The
// contract for each kind of handler is documented on the corresponding
// upb::Handlers::Set*Handler() method.
bool upb_handlers_setint32(
upb_handlers *h, const upb_fielddef *f, upb_int32_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setint64(
upb_handlers *h, const upb_fielddef *f, upb_int64_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setuint32(
upb_handlers *h, const upb_fielddef *f, upb_uint32_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setuint64(
upb_handlers *h, const upb_fielddef *f, upb_uint64_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setfloat(
upb_handlers *h, const upb_fielddef *f, upb_float_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setdouble(
upb_handlers *h, const upb_fielddef *f, upb_double_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setbool(
upb_handlers *h, const upb_fielddef *f, upb_bool_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setstartstr(
upb_handlers *h, const upb_fielddef *f, upb_startstr_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setstring(
upb_handlers *h, const upb_fielddef *f, upb_string_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setendstr(
upb_handlers *h, const upb_fielddef *f, upb_endfield_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setstartseq(
upb_handlers *h, const upb_fielddef *f, upb_startfield_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setstartsubmsg(
upb_handlers *h, const upb_fielddef *f, upb_startfield_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setendsubmsg(
upb_handlers *h, const upb_fielddef *f, upb_endfield_handler *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setendseq(
upb_handlers *h, const upb_fielddef *f, upb_endfield_handler *handler,
void *d, upb_handlerfree *fr);
// Sub-handlers for submessage/group fields, looked up either by field or by
// selector (presumably the STARTSUBMSG selector, as for the C++
// GetSubHandlers(Selector) overload -- confirm against the implementation).
bool upb_handlers_setsubhandlers(
upb_handlers *h, const upb_fielddef *f, const upb_handlers *sub);
const upb_handlers *upb_handlers_getsubhandlers(
const upb_handlers *h, const upb_fielddef *f);
const upb_handlers *upb_handlers_getsubhandlers_sel(
const upb_handlers *h, upb_selector_t sel);
// Returns a handler type for field "f"; presumably the value-handler type
// matching a primitive field -- confirm against the implementation.
upb_handlertype_t upb_handlers_getprimitivehandlertype(const upb_fielddef *f);
// Stores in "*s" the selector for the handler of the given type on field "f".
// See upb::Handlers::GetSelector() for the success/failure contract.
bool upb_getselector(
const upb_fielddef *f, upb_handlertype_t type, upb_selector_t *s);
// Given a START selector of any kind, returns the corresponding END selector,
// which is the selector immediately following the START one.
UPB_INLINE upb_selector_t upb_getendselector(upb_selector_t start) {
  const upb_selector_t end_selector = start + 1;
  return end_selector;
}
// Raw access to a registered handler and its bound data by selector.  Note
// that these take a const upb_handlers*, whereas the C++ GetHandler() and
// GetHandlerData() members are declared non-const.
upb_func *upb_handlers_gethandler(const upb_handlers *h, upb_selector_t s);
void *upb_handlers_gethandlerdata(const upb_handlers *h, upb_selector_t s);
// Byte offset of the handler for selector "s"; see
// upb::Handlers::GetHandlerOffset().
size_t upb_gethandleroffset(upb_selector_t s);
// Setters for the alternate 32-bit integer handler types, on platforms that
// define UPB_TWO_32BIT_TYPES.
#ifdef UPB_TWO_32BIT_TYPES
bool upb_handlers_setint32alt(
upb_handlers *h, const upb_fielddef *f, upb_int32_handler2 *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setuint32alt(
upb_handlers *h, const upb_fielddef *f, upb_uint32_handler2 *handler,
void *d, upb_handlerfree *fr);
#endif
// Likewise for the alternate 64-bit integer handler types.
#ifdef UPB_TWO_64BIT_TYPES
bool upb_handlers_setint64alt(
upb_handlers *h, const upb_fielddef *f, upb_int64_handler2 *handler,
void *d, upb_handlerfree *fr);
bool upb_handlers_setuint64alt(
upb_handlers *h, const upb_fielddef *f, upb_uint64_handler2 *handler,
void *d, upb_handlerfree *fr);
#endif
// Internal-only.
uint32_t upb_handlers_selectorbaseoffset(const upb_fielddef *f);
uint32_t upb_handlers_selectorcount(const upb_fielddef *f);
#ifdef __cplusplus
} // extern "C"
#endif
// NOTE(review): the text in this comment appears to be a version-control
// commit annotation captured together with the file; it is not part of the
// upb API documentation.
//
// upb_stream: all callbacks registered ahead-of-time.  This is a significant
// change to the upb_stream protocol, and should hopefully be the last
// significant change.  All callbacks are now registered ahead-of-time instead
// of having delegated callbacks registered at runtime, which makes it much
// easier to aggressively optimize ahead-of-time (like with a JIT).
//
// Other impacts of this change:
// - You no longer need to have loaded descriptor.proto as a upb_def to load
//   other descriptors!  This means the special-case code we used for
//   bootstrapping is no longer necessary, and we no longer need to link the
//   descriptor for descriptor.proto into upb.
// - A client can now register any upb_value as what will be delivered to
//   their value callback, not just a upb_fielddef*.  This should allow for
//   other clients to get more bang out of the streaming decoder.
//
// This change unfortunately causes a bit of a performance regression -- I
// think largely due to highly suboptimal code that GCC generates when structs
// are returned by value.  See:
// http://blog.reverberate.org/2011/03/19/when-a-compilers-slow-code-actually-bites-you/
// On the other hand, once we have a JIT this should no longer matter.
//
// Performance numbers:
//   plain.parsestream_googlemessage1.upb_table: 374 -> 396 (5.88)
//   plain.parsestream_googlemessage2.upb_table: 616 -> 449 (-27.11)
//   plain.parsetostruct_googlemessage1.upb_table_byref: 268 -> 269 (0.37)
//   plain.parsetostruct_googlemessage1.upb_table_byval: 215 -> 204 (-5.12)
//   plain.parsetostruct_googlemessage2.upb_table_byref: 307 -> 281 (-8.47)
//   plain.parsetostruct_googlemessage2.upb_table_byval: 297 -> 272 (-8.42)
//   omitfp.parsestream_googlemessage1.upb_table: 423 -> 410 (-3.07)
//   omitfp.parsestream_googlemessage2.upb_table: 679 -> 483 (-28.87)
//   omitfp.parsetostruct_googlemessage1.upb_table_byref: 287 -> 282 (-1.74)
//   omitfp.parsetostruct_googlemessage1.upb_table_byval: 226 -> 219 (-3.10)
//   omitfp.parsetostruct_googlemessage2.upb_table_byref: 315 -> 298 (-5.40)
//   omitfp.parsetostruct_googlemessage2.upb_table_byval: 297 -> 287 (-3.37)
//
// 14 years ago
// Convenience versions of the above that first look up the field by name.
//
// DEFINE_NAME_SETTER(slot, type) defines
//
//   bool upb_handlers_set<slot>_n(upb_handlers *h, const char *name,
//                                 type val, void *d, upb_handlerfree *fr)
//
// which resolves "name" with upb_msgdef_ntof() on the msgdef of "h" and then
// forwards to upb_handlers_set<slot>().  It returns false when no field has
// that name; otherwise it returns whatever the underlying setter returns.
//
// The invocations below deliberately carry no trailing semicolon: each one
// expands to a complete function definition, and a ';' after it would be an
// empty declaration at file scope, which strict ISO C (-pedantic) rejects.
#define DEFINE_NAME_SETTER(slot, type) \
  UPB_INLINE bool upb_handlers_set ## slot ## _n( \
      upb_handlers *h, const char *name, type val, \
      void *d, upb_handlerfree *fr) { \
    const upb_fielddef *f = upb_msgdef_ntof(upb_handlers_msgdef(h), name); \
    if (!f) return false; \
    return upb_handlers_set ## slot(h, f, val, d, fr); \
  }
DEFINE_NAME_SETTER(int32, upb_int32_handler*)
DEFINE_NAME_SETTER(int64, upb_int64_handler*)
DEFINE_NAME_SETTER(uint32, upb_uint32_handler*)
DEFINE_NAME_SETTER(uint64, upb_uint64_handler*)
DEFINE_NAME_SETTER(float, upb_float_handler*)
DEFINE_NAME_SETTER(double, upb_double_handler*)
DEFINE_NAME_SETTER(bool, upb_bool_handler*)
DEFINE_NAME_SETTER(startstr, upb_startstr_handler*)
DEFINE_NAME_SETTER(string, upb_string_handler*)
DEFINE_NAME_SETTER(endstr, upb_endfield_handler*)
DEFINE_NAME_SETTER(startseq, upb_startfield_handler*)
DEFINE_NAME_SETTER(startsubmsg, upb_startfield_handler*)
DEFINE_NAME_SETTER(endsubmsg, upb_endfield_handler*)
DEFINE_NAME_SETTER(endseq, upb_endfield_handler*)
#ifdef UPB_TWO_32BIT_TYPES
DEFINE_NAME_SETTER(int32alt, upb_int32_handler2*)
DEFINE_NAME_SETTER(uint32alt, upb_uint32_handler2*)
#endif
#ifdef UPB_TWO_64BIT_TYPES
DEFINE_NAME_SETTER(int64alt, upb_int64_handler2*)
DEFINE_NAME_SETTER(uint64alt, upb_uint64_handler2*)
#endif
#undef DEFINE_NAME_SETTER
// Value writers for every in-memory type: write the data to a known offset
// from the closure "c."  These depend on the fval being a pointer to a
// structure that is (or begins with) the upb_stdmsg_fval type.
//
// TODO(haberman): These are hacky; remove them and replace with an API that
// lets you set a simple "writer" handler in a way that can generate
// specialized code right then.
typedef struct upb_stdmsg_fval {
#ifdef __cplusplus
  // C++-only convenience constructor; stores both arguments unchanged.
  upb_stdmsg_fval(size_t offset_, int32_t hasbit_)
      : offset(offset_), hasbit(hasbit_) {}
#endif

  // Offset from the closure at which the value is written.
  size_t offset;

  // Presumably identifies the has-bit to set for the field -- confirm against
  // the upb_stdmsg_set* implementations.
  int32_t hasbit;
} upb_stdmsg_fval;
#ifdef __cplusplus
extern "C" {
#endif
// Value-writer handlers, one per primitive type.  Each has the shape of a
// value handler (frame plus value, returning bool).
//
// NOTE(review): these are declared with the stdint.h types (int32_t, ...)
// rather than the upb_intXX_t types that upb_int32_handler and friends use.
// Per the NOTE on the value-handler setters in upb::Handlers, the two may not
// be function-pointer compatible in C on every platform -- confirm.
bool upb_stdmsg_setint32(const upb_sinkframe *frame, int32_t val);
bool upb_stdmsg_setint64(const upb_sinkframe *frame, int64_t val);
bool upb_stdmsg_setuint32(const upb_sinkframe *frame, uint32_t val);
bool upb_stdmsg_setuint64(const upb_sinkframe *frame, uint64_t val);
bool upb_stdmsg_setfloat(const upb_sinkframe *frame, float val);
bool upb_stdmsg_setdouble(const upb_sinkframe *frame, double val);
bool upb_stdmsg_setbool(const upb_sinkframe *frame, bool val);
#ifdef __cplusplus
} // extern "C"
#endif
#ifdef __cplusplus
namespace upb {
// This function should be specialized by types that have a FrameType.
// The primary template returns NULL for every T, i.e. "no frame type".
template<class T> inline const FrameType* GetFrameType() { return NULL; }
// C++ Wrappers
//
// Each wrapper below forwards to the C function of the matching name.

// Forwards to upb_handlers_new() and returns its result unchanged.
inline Handlers* Handlers::New(const MessageDef* m, const FrameType* ft,
const void *owner) {
return upb_handlers_new(m, ft, owner);
}
// Forwards to upb_handlers_newfrozen() and returns its result unchanged.
// The callback parameter is spelled with the C typedef upb_handlers_callback
// here, while the in-class declaration uses HandlersCallback.
inline const Handlers* Handlers::NewFrozen(
const MessageDef *m, const FrameType* ft, const void *owner,
upb_handlers_callback *callback, void *closure) {
return upb_handlers_newfrozen(m, ft, owner, callback, closure);
}
// Forwards to upb_handlers_isfrozen() for this object.
inline bool Handlers::IsFrozen() const {
return upb_handlers_isfrozen(this);
}
// Forwards to upb_handlers_ref() with the given owner.
inline void Handlers::Ref(const void* owner) const {
upb_handlers_ref(this, owner);
}
// Forwards to upb_handlers_unref() with the given owner.
inline void Handlers::Unref(const void* owner) const {
upb_handlers_unref(this, owner);
}
// Forwards to upb_handlers_donateref() with owners "from" and "to".
inline void Handlers::DonateRef(const void *from, const void *to) const {
upb_handlers_donateref(this, from, to);
}
// Forwards to upb_handlers_checkref() with the given owner.
inline void Handlers::CheckRef(const void *owner) const {
upb_handlers_checkref(this, owner);
}
// Static: forwards the array of "n" handlers and the status object to
// upb_handlers_freeze() and returns its result.
inline bool Handlers::Freeze(Handlers*const* handlers, int n, Status* s) {
return upb_handlers_freeze(handlers, n, s);
}
// Returns the top-level frame type via upb_handlers_frametype().
inline const FrameType* Handlers::frame_type() const {
return upb_handlers_frametype(this);
}
// Returns the associated msgdef via upb_handlers_msgdef().
inline const MessageDef* Handlers::message_def() const {
return upb_handlers_msgdef(this);
}
// Registers the startmsg handler by forwarding to upb_handlers_setstartmsg().
inline void Handlers::SetStartMessageHandler(
Handlers::StartMessageHandler *handler) {
upb_handlers_setstartmsg(this, handler);
}
// Registers the endmsg handler by forwarding to upb_handlers_setendmsg().
inline void Handlers::SetEndMessageHandler(
Handlers::EndMessageHandler *handler) {
upb_handlers_setendmsg(this, handler);
}
// FieldDef* overload: forwards to upb_handlers_setint32() and returns its
// result ("d" is the bound data, "fr" its optional free function).
inline bool Handlers::SetInt32Handler(
const FieldDef *f, Handlers::Int32Handler *handler,
void *d, Handlers::Free *fr) {
return upb_handlers_setint32(this, f, handler, d, fr);
}
// Registers |handler| for field |f| through upb_handlers_setint64().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetInt64Handler(const FieldDef *f,
                                      Handlers::Int64Handler *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint64(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| for field |f| through upb_handlers_setuint32().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetUInt32Handler(const FieldDef *f,
                                       Handlers::UInt32Handler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint32(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| for field |f| through upb_handlers_setuint64().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetUInt64Handler(const FieldDef *f,
                                       Handlers::UInt64Handler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint64(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| for field |f| through upb_handlers_setfloat().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetFloatHandler(const FieldDef *f,
                                      Handlers::FloatHandler *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setfloat(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| for field |f| through upb_handlers_setdouble().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetDoubleHandler(const FieldDef *f,
                                       Handlers::DoubleHandler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setdouble(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| for field |f| through upb_handlers_setbool().  |d| and
// |fr| are forwarded unchanged; the C function's bool result is returned.
inline bool Handlers::SetBoolHandler(const FieldDef *f,
                                     Handlers::BoolHandler *handler,
                                     void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setbool(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the start-of-string handler for field |f| through
// upb_handlers_setstartstr().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetStartStringHandler(
    const FieldDef* f, Handlers::StartStringHandler* handler,
    void* d, Handlers::Free* fr) {
  const bool ok = upb_handlers_setstartstr(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the end-of-string handler for field |f| through
// upb_handlers_setendstr().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetEndStringHandler(
    const FieldDef* f, Handlers::EndFieldHandler* handler,
    void* d, Handlers::Free* fr) {
  const bool ok = upb_handlers_setendstr(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the string-data handler for field |f| through
// upb_handlers_setstring().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetStringHandler(const FieldDef *f,
                                       Handlers::StringHandler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstring(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the start-of-sequence handler for field |f| through
// upb_handlers_setstartseq().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetStartSequenceHandler(
    const FieldDef* f, Handlers::StartFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstartseq(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the start-of-submessage handler for field |f|
// through upb_handlers_setstartsubmsg().  |d| and |fr| are forwarded
// unchanged; the C function's bool result is returned.
inline bool Handlers::SetStartSubMessageHandler(
    const FieldDef* f, Handlers::StartFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstartsubmsg(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the end-of-submessage handler for field |f| through
// upb_handlers_setendsubmsg().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetEndSubMessageHandler(
    const FieldDef* f, Handlers::EndFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setendsubmsg(this, f, handler, d, fr);
  return ok;
}
// Registers |handler| as the end-of-sequence handler for field |f| through
// upb_handlers_setendseq().  |d| and |fr| are forwarded unchanged; the C
// function's bool result is returned.
inline bool Handlers::SetEndSequenceHandler(
    const FieldDef* f, Handlers::EndFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setendseq(this, f, handler, d, fr);
  return ok;
}
// Associates the handlers |sub| with field |f| by forwarding to
// upb_handlers_setsubhandlers(); returns that function's bool result.
inline bool Handlers::SetSubHandlers(const FieldDef* f, const Handlers* sub) {
  const bool ok = upb_handlers_setsubhandlers(this, f, sub);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setint32_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetInt32Handler(const char* name,
                                      Handlers::Int32Handler *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint32_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setint64_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetInt64Handler(const char* name,
                                      Handlers::Int64Handler *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint64_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setuint32_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetUInt32Handler(const char* name,
                                       Handlers::UInt32Handler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint32_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setuint64_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetUInt64Handler(const char* name,
                                       Handlers::UInt64Handler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint64_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setfloat_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetFloatHandler(const char* name,
                                      Handlers::FloatHandler *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setfloat_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setdouble_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetDoubleHandler(const char* name,
                                       Handlers::DoubleHandler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setdouble_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setbool_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetBoolHandler(const char* name,
                                     Handlers::BoolHandler *handler,
                                     void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setbool_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setstartstr_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetStartStringHandler(
    const char* name, Handlers::StartStringHandler* handler,
    void* d, Handlers::Free* fr) {
  const bool ok = upb_handlers_setstartstr_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setendstr_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetEndStringHandler(
    const char* name, Handlers::EndFieldHandler* handler,
    void* d, Handlers::Free* fr) {
  const bool ok = upb_handlers_setendstr_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setstring_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetStringHandler(const char* name,
                                       Handlers::StringHandler *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstring_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setstartseq_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetStartSequenceHandler(
    const char* name, Handlers::StartFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstartseq_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setstartsubmsg_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetStartSubMessageHandler(
    const char* name, Handlers::StartFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setstartsubmsg_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setendsubmsg_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetEndSubMessageHandler(
    const char* name, Handlers::EndFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setendsubmsg_n(this, name, handler, d, fr);
  return ok;
}
// Overload taking the field as a C string |name|: forwards to
// upb_handlers_setendseq_n() with |handler|, |d| and |fr| unchanged and
// returns its bool result.
inline bool Handlers::SetEndSequenceHandler(
    const char* name, Handlers::EndFieldHandler *handler,
    void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setendseq_n(this, name, handler, d, fr);
  return ok;
}
// Returns the start-of-message handler reported by upb_handlers_getstartmsg()
// for this object.
inline Handlers::StartMessageHandler *Handlers::GetStartMessageHandler() const {
  Handlers::StartMessageHandler *start_fn = upb_handlers_getstartmsg(this);
  return start_fn;
}
// Returns the end-of-message handler reported by upb_handlers_getendmsg()
// for this object.
inline Handlers::EndMessageHandler *Handlers::GetEndMessageHandler() const {
  Handlers::EndMessageHandler *end_fn = upb_handlers_getendmsg(this);
  return end_fn;
}
// Returns the sub-handlers that upb_handlers_getsubhandlers() reports for
// field |f| of this object.
inline const Handlers* Handlers::GetSubHandlers(const FieldDef* f) const {
  const Handlers* sub = upb_handlers_getsubhandlers(this, f);
  return sub;
}
// Selector-based overload: returns the sub-handlers that
// upb_handlers_getsubhandlers_sel() reports for selector |sel|.
inline const Handlers* Handlers::GetSubHandlers(Handlers::Selector sel) const {
  const Handlers* sub = upb_handlers_getsubhandlers_sel(this, sel);
  return sub;
}
// Forwards |f|, |type| and the selector pointer |s| to upb_getselector() and
// returns its bool result.  Does not touch any Handlers instance.
inline bool Handlers::GetSelector(const FieldDef* f, Handlers::Type type,
                                  Handlers::Selector* s) {
  const bool found = upb_getselector(f, type, s);
  return found;
}
// Returns the selector that upb_getendselector() derives from |start|.
inline Handlers::Selector Handlers::GetEndSelector(Handlers::Selector start) {
  Handlers::Selector end_sel = upb_getendselector(start);
  return end_sel;
}
// Returns the handler function that upb_handlers_gethandler() reports for
// |selector| on this object, typed as a GenericFunction pointer.
inline Handlers::GenericFunction* Handlers::GetHandler(
    Handlers::Selector selector) {
  Handlers::GenericFunction* fn = upb_handlers_gethandler(this, selector);
  return fn;
}
// Returns the data pointer that upb_handlers_gethandlerdata() reports for
// |selector| on this object.
inline void* Handlers::GetHandlerData(Handlers::Selector selector) {
  void* handler_data = upb_handlers_gethandlerdata(this, selector);
  return handler_data;
}
// Returns the offset that upb_gethandleroffset() computes for |selector|.
// Does not touch any Handlers instance.
inline size_t Handlers::GetHandlerOffset(Handlers::Selector selector) {
  const size_t offset = upb_gethandleroffset(selector);
  return offset;
}
#ifdef UPB_TWO_32BIT_TYPES
// Overload for the alternate 32-bit handler type (Int32Handler2); only
// compiled when UPB_TWO_32BIT_TYPES is defined.  Forwards to
// upb_handlers_setint32alt() and returns its bool result.
inline bool Handlers::SetInt32Handler(const FieldDef *f,
                                      Handlers::Int32Handler2 *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint32alt(this, f, handler, d, fr);
  return ok;
}
// Overload for the alternate 32-bit handler type (UInt32Handler2); only
// compiled when UPB_TWO_32BIT_TYPES is defined.  Forwards to
// upb_handlers_setuint32alt() and returns its bool result.
inline bool Handlers::SetUInt32Handler(const FieldDef *f,
                                       Handlers::UInt32Handler2 *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint32alt(this, f, handler, d, fr);
  return ok;
}
// Name-based overload for the alternate 32-bit handler type (Int32Handler2);
// only compiled when UPB_TWO_32BIT_TYPES is defined.  Forwards to
// upb_handlers_setint32alt_n() and returns its bool result.
inline bool Handlers::SetInt32Handler(const char* name,
                                      Handlers::Int32Handler2 *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint32alt_n(this, name, handler, d, fr);
  return ok;
}
// Name-based overload for the alternate 32-bit handler type (UInt32Handler2);
// only compiled when UPB_TWO_32BIT_TYPES is defined.  Forwards to
// upb_handlers_setuint32alt_n() and returns its bool result.
inline bool Handlers::SetUInt32Handler(const char* name,
                                       Handlers::UInt32Handler2 *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint32alt_n(this, name, handler, d, fr);
  return ok;
}
#endif
#ifdef UPB_TWO_64BIT_TYPES
// Overload for the alternate 64-bit handler type (Int64Handler2); only
// compiled when UPB_TWO_64BIT_TYPES is defined.  Forwards to
// upb_handlers_setint64alt() and returns its bool result.
inline bool Handlers::SetInt64Handler(const FieldDef *f,
                                      Handlers::Int64Handler2 *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint64alt(this, f, handler, d, fr);
  return ok;
}
// Overload for the alternate 64-bit handler type (UInt64Handler2); only
// compiled when UPB_TWO_64BIT_TYPES is defined.  Forwards to
// upb_handlers_setuint64alt() and returns its bool result.
inline bool Handlers::SetUInt64Handler(const FieldDef *f,
                                       Handlers::UInt64Handler2 *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint64alt(this, f, handler, d, fr);
  return ok;
}
// Name-based overload for the alternate 64-bit handler type (Int64Handler2);
// only compiled when UPB_TWO_64BIT_TYPES is defined.  Forwards to
// upb_handlers_setint64alt_n() and returns its bool result.
inline bool Handlers::SetInt64Handler(const char* name,
                                      Handlers::Int64Handler2 *handler,
                                      void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setint64alt_n(this, name, handler, d, fr);
  return ok;
}
// Name-based overload for the alternate 64-bit handler type (UInt64Handler2);
// only compiled when UPB_TWO_64BIT_TYPES is defined.  Forwards to
// upb_handlers_setuint64alt_n() and returns its bool result.
inline bool Handlers::SetUInt64Handler(const char* name,
                                       Handlers::UInt64Handler2 *handler,
                                       void *d, Handlers::Free *fr) {
  const bool ok = upb_handlers_setuint64alt_n(this, name, handler, d, fr);
  return ok;
}
#endif
// Generates the two explicit specializations of Handlers::SetValueHandler<>
// for one value type:
//   - the FieldDef* overload, forwarding to upb_handlers_set<type>()
//   - the const char* overload, forwarding to upb_handlers_set<type>_n()
// |type| is the suffix of the C function name; |ctype| is the C++ value type
// the specialization is keyed on.
//
// Handlers::Value<ctype>::Handler is not a dependent name inside an explicit
// specialization, so it is spelled without "typename" (C++03 only allows that
// keyword inside templates).  The invocations below carry no trailing ';'
// because each one already expands to complete function definitions; an extra
// ';' at namespace scope is diagnosed by pedantic C++03 compilers.
#define SET_VALUE_HANDLER(type, ctype) \
  template <> \
  inline bool Handlers::SetValueHandler<ctype>( \
      const FieldDef* f, \
      Handlers::Value<ctype>::Handler* handler, \
      void* data, Handlers::Free* cleanup) { \
    return upb_handlers_set ## type(this, f, handler, data, cleanup); \
  } \
  template <> \
  inline bool Handlers::SetValueHandler<ctype>( \
      const char* f, \
      Handlers::Value<ctype>::Handler* handler, \
      void* data, Handlers::Free* cleanup) { \
    return upb_handlers_set ## type ## _n(this, f, handler, data, cleanup); \
  }
SET_VALUE_HANDLER(double, double)
SET_VALUE_HANDLER(float, float)
SET_VALUE_HANDLER(uint64, upb_uint64_t)
SET_VALUE_HANDLER(uint32, upb_uint32_t)
SET_VALUE_HANDLER(int64, upb_int64_t)
SET_VALUE_HANDLER(int32, upb_int32_t)
SET_VALUE_HANDLER(bool, bool)
#ifdef UPB_TWO_32BIT_TYPES
SET_VALUE_HANDLER(int32alt, upb_int32alt_t)
SET_VALUE_HANDLER(uint32alt, upb_uint32alt_t)
#endif
#ifdef UPB_TWO_64BIT_TYPES
SET_VALUE_HANDLER(int64alt, upb_int64alt_t)
SET_VALUE_HANDLER(uint64alt, upb_uint64alt_t)
#endif
#undef SET_VALUE_HANDLER
// Type-erased deleter: reinterprets |p| as a T* and destroys it with delete.
// Its signature (void(void*)) lets it be passed where a Handlers::Free
// cleanup function is expected for handler data allocated with new T.
template <class T>
void DeletePointer(void *p) {
  T* typed = static_cast<T*>(p);
  delete typed;
}
// Primary template, declared but not defined: only the explicit
// specializations generated by SET_STORE_VALUE_HANDLER in this header exist.
// Each specialization registers the matching upb_stdmsg_set*() function as
// the value handler for field |f| on |h|, using a heap-allocated
// upb_stdmsg_fval(offset, hasbit) as handler data and
// DeletePointer<upb_stdmsg_fval> as its cleanup function.
template <class T>
void SetStoreValueHandler(
const FieldDef* f, size_t offset, int32_t hasbit, Handlers* h);
// Generates one explicit specialization of SetStoreValueHandler<ctype>().
// The specialization registers upb_stdmsg_set<type> as the value handler for
// field |f| on |h| (via Handlers::SetValueHandler<handlerctype>), passing a
// newly allocated upb_stdmsg_fval(offset, hasbit) as the handler data and
// DeletePointer<upb_stdmsg_fval> as the function that frees it.
//
// NOTE(review): the bool result of SetValueHandler() is discarded.  Whether
// the freshly allocated upb_stdmsg_fval is released when registration fails
// depends on upb_handlers_set*() -- confirm against the C implementation.
//
// The invocations below carry no trailing ';' because each one already expands
// to a complete function definition; an extra ';' at namespace scope is
// diagnosed by pedantic C++03 compilers.
#define SET_STORE_VALUE_HANDLER(type, ctype, handlerctype) \
  template <> \
  inline void SetStoreValueHandler<ctype>(const FieldDef* f, size_t offset, \
                                          int32_t hasbit, Handlers* h) { \
    h->SetValueHandler<handlerctype>( \
        f, upb_stdmsg_set ## type, new upb_stdmsg_fval(offset, hasbit), \
        &upb::DeletePointer<upb_stdmsg_fval>); \
  }
SET_STORE_VALUE_HANDLER(double, double, double)
SET_STORE_VALUE_HANDLER(float, float, float)
SET_STORE_VALUE_HANDLER(uint64, upb_uint64_t, uint64_t)
SET_STORE_VALUE_HANDLER(uint32, upb_uint32_t, uint32_t)
SET_STORE_VALUE_HANDLER(int64, upb_int64_t, int64_t)
SET_STORE_VALUE_HANDLER(int32, upb_int32_t, int32_t)
SET_STORE_VALUE_HANDLER(bool, bool, bool)
#ifdef UPB_TWO_32BIT_TYPES
SET_STORE_VALUE_HANDLER(int32, upb_int32alt_t, int32_t)
SET_STORE_VALUE_HANDLER(uint32, upb_uint32alt_t, uint32_t)
#endif
#ifdef UPB_TWO_64BIT_TYPES
SET_STORE_VALUE_HANDLER(int64, upb_int64alt_t, int64_t)
SET_STORE_VALUE_HANDLER(uint64, upb_uint64alt_t, uint64_t)
#endif
#undef SET_STORE_VALUE_HANDLER
} // namespace upb
#endif
// One entry of per-handler state.  This is an implementation detail; it lives
// in the header only so that upb_sinkframe_handlerdata() can be inlined.
// Do not reorder or resize the members without checking every user of the
// struct.
typedef struct {
// The registered handler function, stored as a generic function pointer.
upb_func *handler;
// |data| and |cleanup| could be moved (either or both) into a separate table
// to save memory when they are sparse.
// NOTE(review): presumably |data| is the pointer registered alongside the
// handler and |cleanup| the function that frees it -- confirm against the
// code that fills in this struct.
void *data;
upb_handlerfree *cleanup;
// TODO(haberman): this is wasteful; only the first "fieldhandler" of a
// submessage field needs this. To reduce memory footprint we should either:
// - put the subhandlers in a separate "fieldhandler", stored as part of
// a union with one of the above fields.
// - count selector offsets by individual pointers instead of by whole
// fieldhandlers.
const upb_handlers *subhandlers;
} upb_fieldhandler;
#endif