Protocol Buffers - Google's data interchange format (grpc依赖)
https://developers.google.com/protocol-buffers/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
545 lines
17 KiB
545 lines
17 KiB
/*
 * upb - a minimalist implementation of protocol buffers.
 *
 * Copyright (c) 2014 Google Inc.  See LICENSE for details.
 * Author: Josh Haberman <jhaberman@gmail.com>
 *
 * This currently uses snprintf() to format primitives, and could be optimized
 * further.
 */
|
|
|
#include "upb/json/printer.h" |
|
|
|
#include <stdlib.h> |
|
#include <stdio.h> |
|
#include <string.h> |
|
#include <stdint.h> |
|
|
|
// strpc ("string piece"): a character pointer paired with an explicit byte
// count, so the data does not have to be measured again on every use.
typedef struct {
  const char *ptr;  // First byte of the referenced characters.
  size_t len;       // Number of bytes available at ptr.
} strpc;
|
|
|
// Builds a heap-allocated strpc holding the name of field f and its length,
// and registers it with h through upb_handlers_addcleanup() with free() as
// the cleanup function.  Returns the new strpc.
// NOTE(review): the malloc() result is dereferenced without a NULL check.
strpc *newstrpc(upb_handlers *h, const upb_fielddef *f) {
  const char *field_name = upb_fielddef_name(f);
  strpc *piece = malloc(sizeof(*piece));

  piece->ptr = field_name;
  piece->len = strlen(field_name);

  upb_handlers_addcleanup(h, piece, free);
  return piece;
}
|
|
|
// ------------ JSON string printing: values, maps, arrays -------------------- |
|
|
|
static void print_data( |
|
upb_json_printer *p, const char *buf, unsigned int len) { |
|
// TODO: Will need to change if we support pushback from the sink. |
|
size_t n = upb_bytessink_putbuf(p->output_, p->subc_, buf, len, NULL); |
|
UPB_ASSERT_VAR(n, n == len); |
|
} |
|
|
|
// Emits the "," that separates sibling elements at the current depth.  The
// first element at a depth gets no comma; it only clears that depth's
// first-element flag so that later siblings are separated.
static void print_comma(upb_json_printer *p) {
  if (p->first_elem_[p->depth_]) {
    p->first_elem_[p->depth_] = false;
    return;
  }
  print_data(p, ",", 1);
}
|
|
|
// Helpers that print properly formatted elements to the JSON output stream. |
|
|
|
// Byte values below this limit are control characters and are always escaped.
static const char kControlCharLimit = 0x20;

// Reports whether c must be written as an escape sequence inside a JSON
// string: the double quote, the backslash, and every byte below
// kControlCharLimit.  See RFC 4627.
static inline bool is_json_escaped(char c) {
  const unsigned char byte = (unsigned char)c;
  if (byte == '"' || byte == '\\') {
    return true;
  }
  return byte < kControlCharLimit;
}
|
|
|
// Returns the short two-character JSON escape sequence for c (for example
// "\\n" for a newline), or NULL when c has no short form.
//
// The result points at a string literal, so it is returned as const char*:
// callers must not write through it.
static inline const char *json_nice_escape(char c) {
  switch (c) {
    case '"':  return "\\\"";
    case '\\': return "\\\\";
    case '\b': return "\\b";
    case '\f': return "\\f";
    case '\n': return "\\n";
    case '\r': return "\\r";
    case '\t': return "\\t";
    default:   return NULL;
  }
}
|
|
|
// Write a properly escaped string chunk. The surrounding quotes are *not* |
|
// printed; this is so that the caller has the option of emitting the string |
|
// content in chunks. |
|
static void putstring(upb_json_printer *p, const char *buf, unsigned int len) { |
|
const char* unescaped_run = NULL; |
|
for (unsigned int i = 0; i < len; i++) { |
|
char c = buf[i]; |
|
// Handle escaping. |
|
if (is_json_escaped(c)) { |
|
// Use a "nice" escape, like \n, if one exists for this character. |
|
const char* escape = json_nice_escape(c); |
|
// If we don't have a specific 'nice' escape code, use a \uXXXX-style |
|
// escape. |
|
char escape_buf[8]; |
|
if (!escape) { |
|
unsigned char byte = (unsigned char)c; |
|
snprintf(escape_buf, sizeof(escape_buf), "\\u%04x", (int)byte); |
|
escape = escape_buf; |
|
} |
|
|
|
// N.B. that we assume that the input encoding is equal to the output |
|
// encoding (both UTF-8 for now), so for chars >= 0x20 and != \, ", we |
|
// can simply pass the bytes through. |
|
|
|
// If there's a current run of unescaped chars, print that run first. |
|
if (unescaped_run) { |
|
print_data(p, unescaped_run, &buf[i] - unescaped_run); |
|
unescaped_run = NULL; |
|
} |
|
// Then print the escape code. |
|
print_data(p, escape, strlen(escape)); |
|
} else { |
|
// Add to the current unescaped run of characters. |
|
if (unescaped_run == NULL) { |
|
unescaped_run = &buf[i]; |
|
} |
|
} |
|
} |
|
|
|
// If the string ended in a run of unescaped characters, print that last run. |
|
if (unescaped_run) { |
|
print_data(p, unescaped_run, &buf[len] - unescaped_run); |
|
} |
|
} |
|
|
|
// Returns -1 from the enclosing function when condition x is false.
// Wrapped in do/while(0) so that "CHKLENGTH(...);" is a single statement and
// cannot capture a following "else".
#define CHKLENGTH(x) do { if (!(x)) return -1; } while (0)
|
|
|
// Helpers that format floating point values according to our custom formats. |
|
// Right now we use %.8g and %.17g for float/double, respectively, to match |
|
// proto2::util::JsonFormat's defaults. May want to change this later. |
|
|
|
// Formats val with "%.17g" into buf, which has room for length bytes.
// Returns the number of characters written (excluding the terminator), or
// (size_t)-1 when snprintf() fails, produces nothing, or the text plus its
// terminator does not fit.
static size_t fmt_double(double val, char* buf, size_t length) {
  const int written = snprintf(buf, length, "%.17g", val);
  if (written <= 0 || (size_t)written >= length) {
    return (size_t)-1;
  }
  return (size_t)written;
}
|
|
|
// Formats val with "%.8g" into buf, which has room for length bytes.
// Returns the number of characters written (excluding the terminator), or
// (size_t)-1 when snprintf() fails, produces nothing, or the text plus its
// terminator does not fit.
static size_t fmt_float(float val, char* buf, size_t length) {
  const int written = snprintf(buf, length, "%.8g", val);
  if (written <= 0 || (size_t)written >= length) {
    return (size_t)-1;
  }
  return (size_t)written;
}
|
|
|
// Writes the JSON literal "true" or "false" for val into buf, which has room
// for length bytes.  Returns the number of characters written (excluding the
// terminator), or (size_t)-1 when snprintf() fails or the text plus its
// terminator does not fit.
static size_t fmt_bool(bool val, char* buf, size_t length) {
  const char *literal = val ? "true" : "false";
  const int written = snprintf(buf, length, "%s", literal);
  if (written <= 0 || (size_t)written >= length) {
    return (size_t)-1;
  }
  return (size_t)written;
}
|
|
|
// Formats the signed integer val in decimal into buf, which has room for
// length bytes.  Returns the number of characters written (excluding the
// terminator), or (size_t)-1 when snprintf() fails or the text plus its
// terminator does not fit.
//
// The parameter is long long (not long) so that the full 64-bit range is
// preserved on platforms where long is only 32 bits wide; every int32_t,
// uint32_t and int64_t value converts to long long without loss.
static size_t fmt_int64(long long val, char* buf, size_t length) {
  const int written = snprintf(buf, length, "%lld", val);
  if (written <= 0 || (size_t)written >= length) {
    return (size_t)-1;
  }
  return (size_t)written;
}
|
|
|
// Formats the unsigned integer val in decimal into buf, which has room for
// length bytes.  Returns the number of characters written (excluding the
// terminator), or (size_t)-1 when snprintf() fails or the text plus its
// terminator does not fit.
static size_t fmt_uint64(unsigned long long val, char* buf, size_t length) {
  const int written = snprintf(buf, length, "%llu", val);
  if (written <= 0 || (size_t)written >= length) {
    return (size_t)-1;
  }
  return (size_t)written;
}
|
|
|
// Print a map key given a field name. Called by scalar field handlers and by |
|
// startseq for repeated fields. |
|
static bool putkey(void *closure, const void *handler_data) { |
|
upb_json_printer *p = closure; |
|
const strpc *key = handler_data; |
|
print_comma(p); |
|
print_data(p, "\"", 1); |
|
putstring(p, key->ptr, key->len); |
|
print_data(p, "\":", 2); |
|
return true; |
|
} |
|
|
|
// CHKFMT: returns false from the enclosing function when val is the failure
// value of the fmt_* helpers, i.e. -1 converted to size_t.
// CHK: returns false from the enclosing function when val is zero/false.
//
// Both are wrapped in do/while(0) so that "CHK(...);" is a single statement
// and cannot capture a following "else".
#define CHKFMT(val) do { if ((val) == (size_t)-1) return false; } while (0)
#define CHK(val) do { if (!(val)) return false; } while (0)
|
|
|
#define TYPE_HANDLERS(type, fmt_func) \ |
|
static bool put##type(void *closure, const void *handler_data, type val) { \ |
|
upb_json_printer *p = closure; \ |
|
UPB_UNUSED(handler_data); \ |
|
char data[64]; \ |
|
size_t length = fmt_func(val, data, sizeof(data)); \ |
|
CHKFMT(length); \ |
|
print_data(p, data, length); \ |
|
return true; \ |
|
} \ |
|
static bool scalar_##type(void *closure, const void *handler_data, \ |
|
type val) { \ |
|
CHK(putkey(closure, handler_data)); \ |
|
CHK(put##type(closure, handler_data, val)); \ |
|
return true; \ |
|
} \ |
|
static bool repeated_##type(void *closure, const void *handler_data, \ |
|
type val) { \ |
|
upb_json_printer *p = closure; \ |
|
print_comma(p); \ |
|
CHK(put##type(closure, handler_data, val)); \ |
|
return true; \ |
|
} |
|
|
|
TYPE_HANDLERS(double, fmt_double); |
|
TYPE_HANDLERS(float, fmt_float); |
|
TYPE_HANDLERS(bool, fmt_bool); |
|
TYPE_HANDLERS(int32_t, fmt_int64); |
|
TYPE_HANDLERS(uint32_t, fmt_int64); |
|
TYPE_HANDLERS(int64_t, fmt_int64); |
|
TYPE_HANDLERS(uint64_t, fmt_uint64); |
|
|
|
#undef TYPE_HANDLERS |
|
|
|
typedef struct { |
|
void *keyname; |
|
const upb_enumdef *enumdef; |
|
} EnumHandlerData; |
|
|
|
static bool scalar_enum(void *closure, const void *handler_data, |
|
int32_t val) { |
|
const EnumHandlerData *hd = handler_data; |
|
upb_json_printer *p = closure; |
|
CHK(putkey(closure, hd->keyname)); |
|
|
|
const char *symbolic_name = upb_enumdef_iton(hd->enumdef, val); |
|
if (symbolic_name) { |
|
print_data(p, "\"", 1); |
|
putstring(p, symbolic_name, strlen(symbolic_name)); |
|
print_data(p, "\"", 1); |
|
} else { |
|
putint32_t(closure, NULL, val); |
|
} |
|
|
|
return true; |
|
} |
|
|
|
static bool repeated_enum(void *closure, const void *handler_data, |
|
int32_t val) { |
|
const EnumHandlerData *hd = handler_data; |
|
upb_json_printer *p = closure; |
|
print_comma(p); |
|
|
|
const char *symbolic_name = upb_enumdef_iton(hd->enumdef, val); |
|
if (symbolic_name) { |
|
print_data(p, "\"", 1); |
|
putstring(p, symbolic_name, strlen(symbolic_name)); |
|
print_data(p, "\"", 1); |
|
} else { |
|
putint32_t(closure, NULL, val); |
|
} |
|
|
|
return true; |
|
} |
|
|
|
static void *scalar_startsubmsg(void *closure, const void *handler_data) { |
|
return putkey(closure, handler_data) ? closure : UPB_BREAK; |
|
} |
|
|
|
static void *repeated_startsubmsg(void *closure, const void *handler_data) { |
|
UPB_UNUSED(handler_data); |
|
upb_json_printer *p = closure; |
|
print_comma(p); |
|
return closure; |
|
} |
|
|
|
static bool startmap(void *closure, const void *handler_data) { |
|
UPB_UNUSED(handler_data); |
|
upb_json_printer *p = closure; |
|
if (p->depth_++ == 0) { |
|
upb_bytessink_start(p->output_, 0, &p->subc_); |
|
} |
|
p->first_elem_[p->depth_] = true; |
|
print_data(p, "{", 1); |
|
return true; |
|
} |
|
|
|
// End-of-message handler: closes the JSON object opened by startmap and
// decrements the depth.  When the outermost message ends (depth returns to
// 0) the output sink is ended as well.
//
// The "}" is written *before* upb_bytessink_end() so that no bytes are pushed
// to the sink after it has been ended; this mirrors startmap, which starts
// the sink before writing "{".
static bool endmap(void *closure, const void *handler_data, upb_status *s) {
  UPB_UNUSED(handler_data);
  UPB_UNUSED(s);
  upb_json_printer *p = closure;

  print_data(p, "}", 1);
  if (--p->depth_ == 0) {
    upb_bytessink_end(p->output_);
  }
  return true;
}
|
|
|
static void *startseq(void *closure, const void *handler_data) { |
|
upb_json_printer *p = closure; |
|
CHK(putkey(closure, handler_data)); |
|
p->depth_++; |
|
p->first_elem_[p->depth_] = true; |
|
print_data(p, "[", 1); |
|
return closure; |
|
} |
|
|
|
static bool endseq(void *closure, const void *handler_data) { |
|
UPB_UNUSED(handler_data); |
|
upb_json_printer *p = closure; |
|
print_data(p, "]", 1); |
|
p->depth_--; |
|
return true; |
|
} |
|
|
|
static size_t putstr(void *closure, const void *handler_data, const char *str, |
|
size_t len, const upb_bufhandle *handle) { |
|
UPB_UNUSED(handler_data); |
|
UPB_UNUSED(handle); |
|
upb_json_printer *p = closure; |
|
putstring(p, str, len); |
|
return len; |
|
} |
|
|
|
// This has to Base64 encode the bytes, because JSON has no "bytes" type. |
|
static size_t putbytes(void *closure, const void *handler_data, const char *str, |
|
size_t len, const upb_bufhandle *handle) { |
|
UPB_UNUSED(handler_data); |
|
UPB_UNUSED(handle); |
|
upb_json_printer *p = closure; |
|
|
|
// This is the regular base64, not the "web-safe" version. |
|
static const char base64[] = |
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"; |
|
|
|
// Base64-encode. |
|
char data[16000]; |
|
const char *limit = data + sizeof(data); |
|
const unsigned char *from = (const unsigned char*)str; |
|
char *to = data; |
|
size_t remaining = len; |
|
while (remaining > 2) { |
|
// TODO(haberman): handle encoded lengths > sizeof(data) |
|
UPB_ASSERT_VAR(limit, (limit - to) >= 4); |
|
|
|
to[0] = base64[from[0] >> 2]; |
|
to[1] = base64[((from[0] & 0x3) << 4) | (from[1] >> 4)]; |
|
to[2] = base64[((from[1] & 0xf) << 2) | (from[2] >> 6)]; |
|
to[3] = base64[from[2] & 0x3f]; |
|
|
|
remaining -= 3; |
|
to += 4; |
|
from += 3; |
|
} |
|
|
|
switch (remaining) { |
|
case 2: |
|
to[0] = base64[from[0] >> 2]; |
|
to[1] = base64[((from[0] & 0x3) << 4) | (from[1] >> 4)]; |
|
to[2] = base64[(from[1] & 0xf) << 2]; |
|
to[3] = '='; |
|
to += 4; |
|
from += 2; |
|
break; |
|
case 1: |
|
to[0] = base64[from[0] >> 2]; |
|
to[1] = base64[((from[0] & 0x3) << 4)]; |
|
to[2] = '='; |
|
to[3] = '='; |
|
to += 4; |
|
from += 1; |
|
break; |
|
} |
|
|
|
size_t bytes = to - data; |
|
print_data(p, "\"", 1); |
|
putstring(p, data, bytes); |
|
print_data(p, "\"", 1); |
|
return len; |
|
} |
|
|
|
static void *scalar_startstr(void *closure, const void *handler_data, |
|
size_t size_hint) { |
|
UPB_UNUSED(handler_data); |
|
UPB_UNUSED(size_hint); |
|
upb_json_printer *p = closure; |
|
CHK(putkey(closure, handler_data)); |
|
print_data(p, "\"", 1); |
|
return p; |
|
} |
|
|
|
static size_t scalar_str(void *closure, const void *handler_data, |
|
const char *str, size_t len, |
|
const upb_bufhandle *handle) { |
|
CHK(putstr(closure, handler_data, str, len, handle)); |
|
return len; |
|
} |
|
|
|
static bool scalar_endstr(void *closure, const void *handler_data) { |
|
UPB_UNUSED(handler_data); |
|
upb_json_printer *p = closure; |
|
print_data(p, "\"", 1); |
|
return true; |
|
} |
|
|
|
static void *repeated_startstr(void *closure, const void *handler_data, |
|
size_t size_hint) { |
|
UPB_UNUSED(handler_data); |
|
UPB_UNUSED(size_hint); |
|
upb_json_printer *p = closure; |
|
print_comma(p); |
|
print_data(p, "\"", 1); |
|
return p; |
|
} |
|
|
|
static size_t repeated_str(void *closure, const void *handler_data, |
|
const char *str, size_t len, |
|
const upb_bufhandle *handle) { |
|
CHK(putstr(closure, handler_data, str, len, handle)); |
|
return len; |
|
} |
|
|
|
static bool repeated_endstr(void *closure, const void *handler_data) { |
|
UPB_UNUSED(handler_data); |
|
upb_json_printer *p = closure; |
|
print_data(p, "\"", 1); |
|
return true; |
|
} |
|
|
|
static size_t scalar_bytes(void *closure, const void *handler_data, |
|
const char *str, size_t len, |
|
const upb_bufhandle *handle) { |
|
CHK(putkey(closure, handler_data)); |
|
CHK(putbytes(closure, handler_data, str, len, handle)); |
|
return len; |
|
} |
|
|
|
static size_t repeated_bytes(void *closure, const void *handler_data, |
|
const char *str, size_t len, |
|
const upb_bufhandle *handle) { |
|
upb_json_printer *p = closure; |
|
print_comma(p); |
|
CHK(putbytes(closure, handler_data, str, len, handle)); |
|
return len; |
|
} |
|
|
|
// Registers the JSON-printing handlers on h: the message start/end handlers,
// and for every field of h's message definition the handlers matching the
// field's type and whether it is repeated.  Handlers that print a key receive
// a strpc with the field name as handler data (enum handlers receive an
// EnumHandlerData instead).  closure is ignored.
void printer_sethandlers(const void *closure, upb_handlers *h) {
  UPB_UNUSED(closure);

  upb_handlerattr empty_attr = UPB_HANDLERATTR_INITIALIZER;
  upb_handlers_setstartmsg(h, startmap, &empty_attr);
  upb_handlers_setendmsg(h, endmap, &empty_attr);

// Registers the repeated_<ctype> handler (no key) or the scalar_<ctype>
// handler (keyed by the field name) for a primitive field type.
#define TYPE(type, name, ctype)                                    \
  case type:                                                       \
    if (is_seq) {                                                  \
      upb_handlers_set##name(h, f, repeated_##ctype, &empty_attr); \
    } else {                                                       \
      upb_handlers_set##name(h, f, scalar_##ctype, &name_attr);    \
    }                                                              \
    break

  upb_msg_iter i;
  for (upb_msg_begin(&i, upb_handlers_msgdef(h)); !upb_msg_done(&i);
       upb_msg_next(&i)) {
    const upb_fielddef *f = upb_msg_iter_field(&i);

    // Handler data carrying this field's name, for handlers that print a key.
    upb_handlerattr name_attr = UPB_HANDLERATTR_INITIALIZER;
    upb_handlerattr_sethandlerdata(&name_attr, newstrpc(h, f));

    const bool is_seq = upb_fielddef_isseq(f);

    // Repeated fields print their key once, when the sequence starts.
    if (is_seq) {
      upb_handlers_setstartseq(h, f, startseq, &name_attr);
      upb_handlers_setendseq(h, f, endseq, &empty_attr);
    }

    switch (upb_fielddef_type(f)) {
      TYPE(UPB_TYPE_FLOAT,  float,  float);
      TYPE(UPB_TYPE_DOUBLE, double, double);
      TYPE(UPB_TYPE_BOOL,   bool,   bool);
      TYPE(UPB_TYPE_INT32,  int32,  int32_t);
      TYPE(UPB_TYPE_UINT32, uint32, uint32_t);
      TYPE(UPB_TYPE_INT64,  int64,  int64_t);
      TYPE(UPB_TYPE_UINT64, uint64, uint64_t);

      case UPB_TYPE_ENUM: {
        // For now, we always emit symbolic names for enums. We may want an
        // option later to control this behavior, but we will wait for a real
        // need first.
        EnumHandlerData *hd = malloc(sizeof(EnumHandlerData));
        hd->enumdef = (const upb_enumdef *)upb_fielddef_subdef(f);
        hd->keyname = newstrpc(h, f);
        upb_handlers_addcleanup(h, hd, free);

        upb_handlerattr enum_attr = UPB_HANDLERATTR_INITIALIZER;
        upb_handlerattr_sethandlerdata(&enum_attr, hd);

        if (is_seq) {
          upb_handlers_setint32(h, f, repeated_enum, &enum_attr);
        } else {
          upb_handlers_setint32(h, f, scalar_enum, &enum_attr);
        }

        upb_handlerattr_uninit(&enum_attr);
        break;
      }

      case UPB_TYPE_STRING:
        if (is_seq) {
          upb_handlers_setstartstr(h, f, repeated_startstr, &empty_attr);
          upb_handlers_setstring(h, f, repeated_str, &empty_attr);
          upb_handlers_setendstr(h, f, repeated_endstr, &empty_attr);
        } else {
          upb_handlers_setstartstr(h, f, scalar_startstr, &name_attr);
          upb_handlers_setstring(h, f, scalar_str, &empty_attr);
          upb_handlers_setendstr(h, f, scalar_endstr, &empty_attr);
        }
        break;

      case UPB_TYPE_BYTES:
        // XXX: this doesn't support strings that span buffers yet. The base64
        // encoder will need to be made resumable for this to work properly.
        if (is_seq) {
          upb_handlers_setstring(h, f, repeated_bytes, &empty_attr);
        } else {
          upb_handlers_setstring(h, f, scalar_bytes, &name_attr);
        }
        break;

      case UPB_TYPE_MESSAGE:
        if (is_seq) {
          upb_handlers_setstartsubmsg(h, f, repeated_startsubmsg, &name_attr);
        } else {
          upb_handlers_setstartsubmsg(h, f, scalar_startsubmsg, &name_attr);
        }
        break;
    }

    upb_handlerattr_uninit(&name_attr);
  }

  upb_handlerattr_uninit(&empty_attr);
#undef TYPE
}
|
|
|
/* Public API *****************************************************************/ |
|
|
|
// Initializes printer p: no output sink attached, depth 0, and the input sink
// reset to dispatch to handlers h with p as its closure.
void upb_json_printer_init(upb_json_printer *p, const upb_handlers *h) {
  p->output_ = NULL;
  p->depth_ = 0;

  upb_sink_reset(&p->input_, h, p);
}
|
|
|
// Counterpart of upb_json_printer_init().  Currently does nothing with p.
void upb_json_printer_uninit(upb_json_printer *p) {
  UPB_UNUSED(p);
}
|
|
|
// Resets the printer's nesting depth to 0.  The attached output sink is left
// unchanged.
void upb_json_printer_reset(upb_json_printer *p) {
  p->depth_ = 0;
}
|
|
|
// Resets the printer (see upb_json_printer_reset) and then attaches output as
// the sink that receives the generated JSON bytes.
void upb_json_printer_resetoutput(upb_json_printer *p, upb_bytessink *output) {
  upb_json_printer_reset(p);

  p->output_ = output;
}
|
|
|
// Returns the printer's input sink, i.e. the sink set up by
// upb_json_printer_init() to dispatch to the printer's handlers.
upb_sink *upb_json_printer_input(upb_json_printer *p) {
  upb_sink *input = &p->input_;
  return input;
}
|
|
|
const upb_handlers *upb_json_printer_newhandlers(const upb_msgdef *md, |
|
const void *owner) { |
|
return upb_handlers_newfrozen(md, owner, printer_sethandlers, NULL); |
|
}
|
|
|