Protocol Buffers - Google's data interchange format (grpc依赖)
https://developers.google.com/protocol-buffers/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1139 lines
38 KiB
1139 lines
38 KiB
|
|
#include <memory> |
|
|
|
#include "absl/container/flat_hash_map.h" |
|
#include "absl/strings/ascii.h" |
|
#include "absl/strings/str_replace.h" |
|
#include "absl/strings/substitute.h" |
|
#include "google/protobuf/compiler/code_generator.h" |
|
#include "google/protobuf/descriptor.h" |
|
#include "google/protobuf/descriptor.pb.h" |
|
#include "google/protobuf/io/zero_copy_stream.h" |
|
|
|
#include "upbc/generator.h" |
|
#include "upbc/message_layout.h" |
|
|
|
namespace protoc = ::google::protobuf::compiler; |
|
namespace protobuf = ::google::protobuf; |
|
|
|
static std::string StripExtension(absl::string_view fname) { |
|
size_t lastdot = fname.find_last_of("."); |
|
if (lastdot == std::string::npos) { |
|
return std::string(fname); |
|
} |
|
return std::string(fname.substr(0, lastdot)); |
|
} |
|
|
|
static std::string HeaderFilename(std::string proto_filename) { |
|
return StripExtension(proto_filename) + ".upb.h"; |
|
} |
|
|
|
static std::string SourceFilename(std::string proto_filename) { |
|
return StripExtension(proto_filename) + ".upb.c"; |
|
} |
|
|
|
static std::string DefHeaderFilename(std::string proto_filename) { |
|
return StripExtension(proto_filename) + ".upbdefs.h"; |
|
} |
|
|
|
static std::string DefSourceFilename(std::string proto_filename) { |
|
return StripExtension(proto_filename) + ".upbdefs.c"; |
|
} |
|
|
|
class Output { |
|
public: |
|
Output(protobuf::io::ZeroCopyOutputStream* stream) : stream_(stream) {} |
|
~Output() { stream_->BackUp((int)size_); } |
|
|
|
template <class... Arg> |
|
void operator()(absl::string_view format, const Arg&... arg) { |
|
Write(absl::Substitute(format, arg...)); |
|
} |
|
|
|
private: |
|
void Write(absl::string_view data) { |
|
while (!data.empty()) { |
|
RefreshOutput(); |
|
size_t to_write = std::min(data.size(), size_); |
|
memcpy(ptr_, data.data(), to_write); |
|
data.remove_prefix(to_write); |
|
ptr_ += to_write; |
|
size_ -= to_write; |
|
} |
|
} |
|
|
|
void RefreshOutput() { |
|
while (size_ == 0) { |
|
void *ptr; |
|
int size; |
|
if (!stream_->Next(&ptr, &size)) { |
|
fprintf(stderr, "upbc: Failed to write to to output\n"); |
|
abort(); |
|
} |
|
ptr_ = static_cast<char*>(ptr); |
|
size_ = size; |
|
} |
|
} |
|
|
|
protobuf::io::ZeroCopyOutputStream* stream_; |
|
char *ptr_ = nullptr; |
|
size_t size_ = 0; |
|
}; |
|
|
|
namespace upbc { |
|
|
|
class Generator : public protoc::CodeGenerator { |
|
~Generator() override {} |
|
bool Generate(const protobuf::FileDescriptor* file, |
|
const std::string& parameter, protoc::GeneratorContext* context, |
|
std::string* error) const override; |
|
uint64_t GetSupportedFeatures() const override { |
|
return FEATURE_PROTO3_OPTIONAL; |
|
} |
|
}; |
|
|
|
void AddMessages(const protobuf::Descriptor* message, |
|
std::vector<const protobuf::Descriptor*>* messages) { |
|
messages->push_back(message); |
|
for (int i = 0; i < message->nested_type_count(); i++) { |
|
AddMessages(message->nested_type(i), messages); |
|
} |
|
} |
|
|
|
void AddEnums(const protobuf::Descriptor* message, |
|
std::vector<const protobuf::EnumDescriptor*>* enums) { |
|
for (int i = 0; i < message->enum_type_count(); i++) { |
|
enums->push_back(message->enum_type(i)); |
|
} |
|
for (int i = 0; i < message->nested_type_count(); i++) { |
|
AddEnums(message->nested_type(i), enums); |
|
} |
|
} |
|
|
|
template <class T> |
|
void SortDefs(std::vector<T>* defs) { |
|
std::sort(defs->begin(), defs->end(), |
|
[](T a, T b) { return a->full_name() < b->full_name(); }); |
|
} |
|
|
|
std::vector<const protobuf::Descriptor*> SortedMessages( |
|
const protobuf::FileDescriptor* file) { |
|
std::vector<const protobuf::Descriptor*> messages; |
|
for (int i = 0; i < file->message_type_count(); i++) { |
|
AddMessages(file->message_type(i), &messages); |
|
} |
|
return messages; |
|
} |
|
|
|
std::vector<const protobuf::EnumDescriptor*> SortedEnums( |
|
const protobuf::FileDescriptor* file) { |
|
std::vector<const protobuf::EnumDescriptor*> enums; |
|
for (int i = 0; i < file->enum_type_count(); i++) { |
|
enums.push_back(file->enum_type(i)); |
|
} |
|
for (int i = 0; i < file->message_type_count(); i++) { |
|
AddEnums(file->message_type(i), &enums); |
|
} |
|
SortDefs(&enums); |
|
return enums; |
|
} |
|
|
|
std::vector<const protobuf::FieldDescriptor*> FieldNumberOrder( |
|
const protobuf::Descriptor* message) { |
|
std::vector<const protobuf::FieldDescriptor*> messages; |
|
for (int i = 0; i < message->field_count(); i++) { |
|
messages.push_back(message->field(i)); |
|
} |
|
std::sort(messages.begin(), messages.end(), |
|
[](const protobuf::FieldDescriptor* a, |
|
const protobuf::FieldDescriptor* b) { |
|
return a->number() < b->number(); |
|
}); |
|
return messages; |
|
} |
|
|
|
std::vector<const protobuf::FieldDescriptor*> SortedSubmessages( |
|
const protobuf::Descriptor* message) { |
|
std::vector<const protobuf::FieldDescriptor*> ret; |
|
for (int i = 0; i < message->field_count(); i++) { |
|
if (message->field(i)->cpp_type() == |
|
protobuf::FieldDescriptor::CPPTYPE_MESSAGE) { |
|
ret.push_back(message->field(i)); |
|
} |
|
} |
|
std::sort(ret.begin(), ret.end(), |
|
[](const protobuf::FieldDescriptor* a, |
|
const protobuf::FieldDescriptor* b) { |
|
return a->message_type()->full_name() < |
|
b->message_type()->full_name(); |
|
}); |
|
return ret; |
|
} |
|
|
|
std::string ToCIdent(absl::string_view str) { |
|
return absl::StrReplaceAll(str, {{".", "_"}, {"/", "_"}}); |
|
} |
|
|
|
std::string DefInitSymbol(const protobuf::FileDescriptor *file) { |
|
return ToCIdent(file->name()) + "_upbdefinit"; |
|
} |
|
|
|
std::string ToPreproc(absl::string_view str) { |
|
return absl::AsciiStrToUpper(ToCIdent(str)); |
|
} |
|
|
|
std::string EnumValueSymbol(const protobuf::EnumValueDescriptor* value) { |
|
return ToCIdent(value->full_name()); |
|
} |
|
|
|
std::string GetSizeInit(const MessageLayout::Size& size) { |
|
return absl::Substitute("UPB_SIZE($0, $1)", size.size32, size.size64); |
|
} |
|
|
|
std::string MessageName(const protobuf::Descriptor* descriptor) { |
|
return ToCIdent(descriptor->full_name()); |
|
} |
|
|
|
std::string MessageInit(const protobuf::Descriptor* descriptor) { |
|
return MessageName(descriptor) + "_msginit"; |
|
} |
|
|
|
std::string CTypeInternal(const protobuf::FieldDescriptor* field, |
|
bool is_const) { |
|
std::string maybe_const = is_const ? "const " : ""; |
|
switch (field->cpp_type()) { |
|
case protobuf::FieldDescriptor::CPPTYPE_MESSAGE: { |
|
std::string maybe_struct = |
|
field->file() != field->message_type()->file() ? "struct " : ""; |
|
return maybe_const + maybe_struct + MessageName(field->message_type()) + |
|
"*"; |
|
} |
|
case protobuf::FieldDescriptor::CPPTYPE_BOOL: |
|
return "bool"; |
|
case protobuf::FieldDescriptor::CPPTYPE_FLOAT: |
|
return "float"; |
|
case protobuf::FieldDescriptor::CPPTYPE_INT32: |
|
case protobuf::FieldDescriptor::CPPTYPE_ENUM: |
|
return "int32_t"; |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT32: |
|
return "uint32_t"; |
|
case protobuf::FieldDescriptor::CPPTYPE_DOUBLE: |
|
return "double"; |
|
case protobuf::FieldDescriptor::CPPTYPE_INT64: |
|
return "int64_t"; |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT64: |
|
return "uint64_t"; |
|
case protobuf::FieldDescriptor::CPPTYPE_STRING: |
|
return "upb_strview"; |
|
default: |
|
fprintf(stderr, "Unexpected type"); |
|
abort(); |
|
} |
|
} |
|
|
|
std::string SizeLg2(const protobuf::FieldDescriptor* field) { |
|
switch (field->cpp_type()) { |
|
case protobuf::FieldDescriptor::CPPTYPE_MESSAGE: |
|
return "UPB_SIZE(2, 3)"; |
|
case protobuf::FieldDescriptor::CPPTYPE_ENUM: |
|
return std::to_string(2); |
|
case protobuf::FieldDescriptor::CPPTYPE_BOOL: |
|
return std::to_string(1); |
|
case protobuf::FieldDescriptor::CPPTYPE_FLOAT: |
|
return std::to_string(2); |
|
case protobuf::FieldDescriptor::CPPTYPE_INT32: |
|
return std::to_string(2); |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT32: |
|
return std::to_string(2); |
|
case protobuf::FieldDescriptor::CPPTYPE_DOUBLE: |
|
return std::to_string(3); |
|
case protobuf::FieldDescriptor::CPPTYPE_INT64: |
|
return std::to_string(3); |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT64: |
|
return std::to_string(3); |
|
case protobuf::FieldDescriptor::CPPTYPE_STRING: |
|
return "UPB_SIZE(3, 4)"; |
|
default: |
|
fprintf(stderr, "Unexpected type"); |
|
abort(); |
|
} |
|
} |
|
|
|
std::string FieldDefault(const protobuf::FieldDescriptor* field) { |
|
switch (field->cpp_type()) { |
|
case protobuf::FieldDescriptor::CPPTYPE_MESSAGE: |
|
return "NULL"; |
|
case protobuf::FieldDescriptor::CPPTYPE_STRING: |
|
return absl::Substitute("upb_strview_make(\"$0\", strlen(\"$0\"))", |
|
absl::CEscape(field->default_value_string())); |
|
case protobuf::FieldDescriptor::CPPTYPE_INT32: |
|
return absl::StrCat(field->default_value_int32()); |
|
case protobuf::FieldDescriptor::CPPTYPE_INT64: |
|
return absl::StrCat(field->default_value_int64()); |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT32: |
|
return absl::StrCat(field->default_value_uint32()); |
|
case protobuf::FieldDescriptor::CPPTYPE_UINT64: |
|
return absl::StrCat(field->default_value_uint64()); |
|
case protobuf::FieldDescriptor::CPPTYPE_FLOAT: |
|
return absl::StrCat(field->default_value_float()); |
|
case protobuf::FieldDescriptor::CPPTYPE_DOUBLE: |
|
return absl::StrCat(field->default_value_double()); |
|
case protobuf::FieldDescriptor::CPPTYPE_BOOL: |
|
return field->default_value_bool() ? "true" : "false"; |
|
case protobuf::FieldDescriptor::CPPTYPE_ENUM: |
|
// Use a number instead of a symbolic name so that we don't require |
|
// this enum's header to be included. |
|
return absl::StrCat(field->default_value_enum()->number()); |
|
} |
|
ABSL_ASSERT(false); |
|
return "XXX"; |
|
} |
|
|
|
std::string CType(const protobuf::FieldDescriptor* field) { |
|
return CTypeInternal(field, false); |
|
} |
|
|
|
std::string CTypeConst(const protobuf::FieldDescriptor* field) { |
|
return CTypeInternal(field, true); |
|
} |
|
|
|
void DumpEnumValues(const protobuf::EnumDescriptor* desc, Output& output) { |
|
std::vector<const protobuf::EnumValueDescriptor*> values; |
|
for (int i = 0; i < desc->value_count(); i++) { |
|
values.push_back(desc->value(i)); |
|
} |
|
std::sort(values.begin(), values.end(), |
|
[](const protobuf::EnumValueDescriptor* a, |
|
const protobuf::EnumValueDescriptor* b) { |
|
return a->number() < b->number(); |
|
}); |
|
|
|
for (size_t i = 0; i < values.size(); i++) { |
|
auto value = values[i]; |
|
output(" $0 = $1", EnumValueSymbol(value), value->number()); |
|
if (i != values.size() - 1) { |
|
output(","); |
|
} |
|
output("\n"); |
|
} |
|
} |
|
|
|
void EmitFileWarning(const protobuf::FileDescriptor* file, Output& output) { |
|
output( |
|
"/* This file was generated by upbc (the upb compiler) from the input\n" |
|
" * file:\n" |
|
" *\n" |
|
" * $0\n" |
|
" *\n" |
|
" * Do not edit -- your changes will be discarded when the file is\n" |
|
" * regenerated. */\n\n", |
|
file->name()); |
|
} |
|
|
|
void GenerateMessageInHeader(const protobuf::Descriptor* message, Output& output) { |
|
MessageLayout layout(message); |
|
|
|
output("/* $0 */\n\n", message->full_name()); |
|
std::string msgname = ToCIdent(message->full_name()); |
|
|
|
if (!message->options().map_entry()) { |
|
output( |
|
"UPB_INLINE $0 *$0_new(upb_arena *arena) {\n" |
|
" return ($0 *)_upb_msg_new(&$1, arena);\n" |
|
"}\n" |
|
"UPB_INLINE $0 *$0_parse(const char *buf, size_t size,\n" |
|
" upb_arena *arena) {\n" |
|
" $0 *ret = $0_new(arena);\n" |
|
" return (ret && upb_decode(buf, size, ret, &$1, arena)) ? ret : NULL;\n" |
|
"}\n" |
|
"UPB_INLINE char *$0_serialize(const $0 *msg, upb_arena *arena, size_t " |
|
"*len) {\n" |
|
" return upb_encode(msg, &$1, arena, len);\n" |
|
"}\n" |
|
"\n", |
|
MessageName(message), MessageInit(message)); |
|
} |
|
|
|
for (int i = 0; i < message->real_oneof_decl_count(); i++) { |
|
const protobuf::OneofDescriptor* oneof = message->oneof_decl(i); |
|
std::string fullname = ToCIdent(oneof->full_name()); |
|
output("typedef enum {\n"); |
|
for (int j = 0; j < oneof->field_count(); j++) { |
|
const protobuf::FieldDescriptor* field = oneof->field(j); |
|
output(" $0_$1 = $2,\n", fullname, field->name(), field->number()); |
|
} |
|
output( |
|
" $0_NOT_SET = 0\n" |
|
"} $0_oneofcases;\n", |
|
fullname); |
|
output( |
|
"UPB_INLINE $0_oneofcases $1_$2_case(const $1* msg) { " |
|
"return ($0_oneofcases)*UPB_PTR_AT(msg, $3, int32_t); }\n" |
|
"\n", |
|
fullname, msgname, oneof->name(), |
|
GetSizeInit(layout.GetOneofCaseOffset(oneof))); |
|
} |
|
|
|
// Generate const methods. |
|
|
|
for (auto field : FieldNumberOrder(message)) { |
|
// Generate hazzer (if any). |
|
if (layout.HasHasbit(field)) { |
|
output( |
|
"UPB_INLINE bool $0_has_$1(const $0 *msg) { " |
|
"return _upb_hasbit(msg, $2); }\n", |
|
msgname, field->name(), layout.GetHasbitIndex(field)); |
|
} else if (field->real_containing_oneof()) { |
|
output( |
|
"UPB_INLINE bool $0_has_$1(const $0 *msg) { " |
|
"return _upb_getoneofcase(msg, $2) == $3; }\n", |
|
msgname, field->name(), |
|
GetSizeInit( |
|
layout.GetOneofCaseOffset(field->real_containing_oneof())), |
|
field->number()); |
|
} else if (field->message_type()) { |
|
output( |
|
"UPB_INLINE bool $0_has_$1(const $0 *msg) { " |
|
"return _upb_has_submsg_nohasbit(msg, $2); }\n", |
|
msgname, field->name(), GetSizeInit(layout.GetFieldOffset(field))); |
|
} |
|
|
|
// Generate getter. |
|
if (field->is_map()) { |
|
const protobuf::Descriptor* entry = field->message_type(); |
|
const protobuf::FieldDescriptor* key = entry->FindFieldByNumber(1); |
|
const protobuf::FieldDescriptor* val = entry->FindFieldByNumber(2); |
|
output( |
|
"UPB_INLINE size_t $0_$1_size(const $0 *msg) {" |
|
"return _upb_msg_map_size(msg, $2); }\n", |
|
msgname, field->name(), GetSizeInit(layout.GetFieldOffset(field))); |
|
output( |
|
"UPB_INLINE bool $0_$1_get(const $0 *msg, $2 key, $3 *val) { " |
|
"return _upb_msg_map_get(msg, $4, &key, $5, val, $6); }\n", |
|
msgname, field->name(), CType(key), CType(val), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
key->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(key)", |
|
val->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(*val)"); |
|
output( |
|
"UPB_INLINE $0 $1_$2_next(const $1 *msg, size_t* iter) { " |
|
"return ($0)_upb_msg_map_next(msg, $3, iter); }\n", |
|
CTypeConst(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
} else if (message->options().map_entry()) { |
|
output( |
|
"UPB_INLINE $0 $1_$2(const $1 *msg) {\n" |
|
" $3 ret;\n" |
|
" _upb_msg_map_$2(msg, &ret, $4);\n" |
|
" return ret;\n" |
|
"}\n", |
|
CTypeConst(field), msgname, field->name(), CType(field), |
|
field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(ret)"); |
|
} else if (field->is_repeated()) { |
|
output( |
|
"UPB_INLINE $0 const* $1_$2(const $1 *msg, size_t *len) { " |
|
"return ($0 const*)_upb_array_accessor(msg, $3, len); }\n", |
|
CTypeConst(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
} else if (field->real_containing_oneof()) { |
|
output( |
|
"UPB_INLINE $0 $1_$2(const $1 *msg) { " |
|
"return UPB_READ_ONEOF(msg, $0, $3, $4, $5, $6); }\n", |
|
CTypeConst(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
GetSizeInit(layout.GetOneofCaseOffset(field->real_containing_oneof())), |
|
field->number(), FieldDefault(field)); |
|
} else { |
|
output( |
|
"UPB_INLINE $0 $1_$2(const $1 *msg) { " |
|
"return *UPB_PTR_AT(msg, $3, $0); }\n", |
|
CTypeConst(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
} |
|
} |
|
|
|
output("\n"); |
|
|
|
// Generate mutable methods. |
|
|
|
for (auto field : FieldNumberOrder(message)) { |
|
if (field->is_map()) { |
|
// TODO(haberman): add map-based mutators. |
|
const protobuf::Descriptor* entry = field->message_type(); |
|
const protobuf::FieldDescriptor* key = entry->FindFieldByNumber(1); |
|
const protobuf::FieldDescriptor* val = entry->FindFieldByNumber(2); |
|
output( |
|
"UPB_INLINE void $0_$1_clear($0 *msg) { _upb_msg_map_clear(msg, $2); }\n", |
|
msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
output( |
|
"UPB_INLINE bool $0_$1_set($0 *msg, $2 key, $3 val, upb_arena *a) { " |
|
"return _upb_msg_map_set(msg, $4, &key, $5, &val, $6, a); }\n", |
|
msgname, field->name(), CType(key), CType(val), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
key->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(key)", |
|
val->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(val)"); |
|
output( |
|
"UPB_INLINE bool $0_$1_delete($0 *msg, $2 key) { " |
|
"return _upb_msg_map_delete(msg, $3, &key, $4); }\n", |
|
msgname, field->name(), CType(key), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
key->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(key)"); |
|
output( |
|
"UPB_INLINE $0 $1_$2_nextmutable($1 *msg, size_t* iter) { " |
|
"return ($0)_upb_msg_map_next(msg, $3, iter); }\n", |
|
CType(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
} else if (field->is_repeated()) { |
|
output( |
|
"UPB_INLINE $0* $1_mutable_$2($1 *msg, size_t *len) {\n" |
|
" return ($0*)_upb_array_mutable_accessor(msg, $3, len);\n" |
|
"}\n", |
|
CType(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field))); |
|
output( |
|
"UPB_INLINE $0* $1_resize_$2($1 *msg, size_t len, " |
|
"upb_arena *arena) {\n" |
|
" return ($0*)_upb_array_resize_accessor(msg, $3, len, $4, arena);\n" |
|
"}\n", |
|
CType(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
SizeLg2(field)); |
|
if (field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_MESSAGE) { |
|
output( |
|
"UPB_INLINE struct $0* $1_add_$2($1 *msg, upb_arena *arena) {\n" |
|
" struct $0* sub = (struct $0*)_upb_msg_new(&$3, arena);\n" |
|
" bool ok = _upb_array_append_accessor(\n" |
|
" msg, $4, $5, $6, &sub, arena);\n" |
|
" if (!ok) return NULL;\n" |
|
" return sub;\n" |
|
"}\n", |
|
MessageName(field->message_type()), msgname, field->name(), |
|
MessageInit(field->message_type()), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
GetSizeInit(MessageLayout::SizeOfUnwrapped(field).size), |
|
SizeLg2(field)); |
|
} else { |
|
output( |
|
"UPB_INLINE bool $1_add_$2($1 *msg, $0 val, upb_arena *arena) {\n" |
|
" return _upb_array_append_accessor(msg, $3, $4, $5, &val,\n" |
|
" arena);\n" |
|
"}\n", |
|
CType(field), msgname, field->name(), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
GetSizeInit(MessageLayout::SizeOfUnwrapped(field).size), |
|
SizeLg2(field)); |
|
} |
|
} else { |
|
// Non-repeated field. |
|
if (message->options().map_entry() && field->name() == "key") { |
|
// Key cannot be mutated. |
|
continue; |
|
} |
|
|
|
// The common function signature for all setters. Varying implementations |
|
// follow. |
|
output("UPB_INLINE void $0_set_$1($0 *msg, $2 value) {\n", msgname, |
|
field->name(), CType(field)); |
|
|
|
if (message->options().map_entry()) { |
|
output( |
|
" _upb_msg_map_set_value(msg, &value, $0);\n" |
|
"}\n", |
|
field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_STRING |
|
? "0" |
|
: "sizeof(" + CType(field) + ")"); |
|
} else if (field->real_containing_oneof()) { |
|
output( |
|
" UPB_WRITE_ONEOF(msg, $0, $1, value, $2, $3);\n" |
|
"}\n", |
|
CType(field), GetSizeInit(layout.GetFieldOffset(field)), |
|
GetSizeInit( |
|
layout.GetOneofCaseOffset(field->real_containing_oneof())), |
|
field->number()); |
|
} else { |
|
if (MessageLayout::HasHasbit(field)) { |
|
output(" _upb_sethas(msg, $0);\n", layout.GetHasbitIndex(field)); |
|
} |
|
output( |
|
" *UPB_PTR_AT(msg, $1, $0) = value;\n" |
|
"}\n", |
|
CType(field), GetSizeInit(layout.GetFieldOffset(field))); |
|
} |
|
|
|
if (field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_MESSAGE && |
|
!message->options().map_entry()) { |
|
output( |
|
"UPB_INLINE struct $0* $1_mutable_$2($1 *msg, upb_arena *arena) {\n" |
|
" struct $0* sub = (struct $0*)$1_$2(msg);\n" |
|
" if (sub == NULL) {\n" |
|
" sub = (struct $0*)_upb_msg_new(&$3, arena);\n" |
|
" if (!sub) return NULL;\n" |
|
" $1_set_$2(msg, sub);\n" |
|
" }\n" |
|
" return sub;\n" |
|
"}\n", |
|
MessageName(field->message_type()), msgname, field->name(), |
|
MessageInit(field->message_type())); |
|
} |
|
} |
|
} |
|
|
|
output("\n"); |
|
} |
|
|
|
void WriteHeader(const protobuf::FileDescriptor* file, Output& output) { |
|
EmitFileWarning(file, output); |
|
output( |
|
"#ifndef $0_UPB_H_\n" |
|
"#define $0_UPB_H_\n\n" |
|
"#include \"upb/msg.h\"\n" |
|
"#include \"upb/decode.h\"\n" |
|
"#include \"upb/decode_fast.h\"\n" |
|
"#include \"upb/encode.h\"\n\n", |
|
ToPreproc(file->name())); |
|
|
|
for (int i = 0; i < file->public_dependency_count(); i++) { |
|
const auto& name = file->public_dependency(i)->name(); |
|
if (i == 0) { |
|
output("/* Public Imports. */\n"); |
|
} |
|
output("#include \"$0\"\n", HeaderFilename(name)); |
|
if (i == file->public_dependency_count() - 1) { |
|
output("\n"); |
|
} |
|
} |
|
|
|
output( |
|
"#include \"upb/port_def.inc\"\n" |
|
"\n" |
|
"#ifdef __cplusplus\n" |
|
"extern \"C\" {\n" |
|
"#endif\n" |
|
"\n"); |
|
|
|
std::vector<const protobuf::Descriptor*> this_file_messages = |
|
SortedMessages(file); |
|
|
|
// Forward-declare types defined in this file. |
|
for (auto message : this_file_messages) { |
|
output("struct $0;\n", ToCIdent(message->full_name())); |
|
} |
|
for (auto message : this_file_messages) { |
|
output("typedef struct $0 $0;\n", ToCIdent(message->full_name())); |
|
} |
|
for (auto message : this_file_messages) { |
|
output("extern const upb_msglayout $0;\n", MessageInit(message)); |
|
} |
|
|
|
// Forward-declare types not in this file, but used as submessages. |
|
// Order by full name for consistent ordering. |
|
std::map<std::string, const protobuf::Descriptor*> forward_messages; |
|
|
|
for (auto message : SortedMessages(file)) { |
|
for (int i = 0; i < message->field_count(); i++) { |
|
const protobuf::FieldDescriptor* field = message->field(i); |
|
if (field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_MESSAGE && |
|
field->file() != field->message_type()->file()) { |
|
forward_messages[field->message_type()->full_name()] = |
|
field->message_type(); |
|
} |
|
} |
|
} |
|
for (const auto& pair : forward_messages) { |
|
output("struct $0;\n", MessageName(pair.second)); |
|
} |
|
for (const auto& pair : forward_messages) { |
|
output("extern const upb_msglayout $0;\n", MessageInit(pair.second)); |
|
} |
|
|
|
if (!this_file_messages.empty()) { |
|
output("\n"); |
|
} |
|
|
|
std::vector<const protobuf::EnumDescriptor*> this_file_enums = |
|
SortedEnums(file); |
|
|
|
for (auto enumdesc : this_file_enums) { |
|
output("typedef enum {\n"); |
|
DumpEnumValues(enumdesc, output); |
|
output("} $0;\n\n", ToCIdent(enumdesc->full_name())); |
|
} |
|
|
|
output("\n"); |
|
|
|
for (auto message : this_file_messages) { |
|
GenerateMessageInHeader(message, output); |
|
} |
|
|
|
output( |
|
"#ifdef __cplusplus\n" |
|
"} /* extern \"C\" */\n" |
|
"#endif\n" |
|
"\n" |
|
"#include \"upb/port_undef.inc\"\n" |
|
"\n" |
|
"#endif /* $0_UPB_H_ */\n", |
|
ToPreproc(file->name())); |
|
} |
|
|
|
int TableDescriptorType(const protobuf::FieldDescriptor* field) { |
|
if (field->file()->syntax() == protobuf::FileDescriptor::SYNTAX_PROTO2 && |
|
field->type() == protobuf::FieldDescriptor::TYPE_STRING) { |
|
// From the perspective of the binary encoder/decoder, proto2 string fields |
|
// are identical to bytes fields. Only in proto3 do we check UTF-8 for |
|
// string fields at parse time. |
|
// |
|
// If we ever use these tables for JSON encoding/decoding (for example by |
|
// embedding field names on the side) we will have to revisit this, because |
|
// string vs. bytes behavior is not affected by proto2 vs proto3. |
|
return protobuf::FieldDescriptor::TYPE_BYTES; |
|
} else { |
|
return field->type(); |
|
} |
|
} |
|
|
|
struct SubmsgArray { |
|
public: |
|
SubmsgArray(const protobuf::Descriptor* message) : message_(message) { |
|
MessageLayout layout(message); |
|
std::vector<const protobuf::FieldDescriptor*> sorted_submsgs = |
|
SortedSubmessages(message); |
|
int i = 0; |
|
for (auto submsg : sorted_submsgs) { |
|
if (indexes_.find(submsg->message_type()) != indexes_.end()) { |
|
continue; |
|
} |
|
submsgs_.push_back(submsg->message_type()); |
|
indexes_[submsg->message_type()] = i++; |
|
} |
|
} |
|
|
|
const std::vector<const protobuf::Descriptor*>& submsgs() const { |
|
return submsgs_; |
|
} |
|
|
|
int GetIndex(const protobuf::FieldDescriptor* field) { |
|
(void)message_; |
|
assert(field->containing_type() == message_); |
|
auto it = indexes_.find(field->message_type()); |
|
assert(it != indexes_.end()); |
|
return it->second; |
|
} |
|
|
|
private: |
|
const protobuf::Descriptor* message_; |
|
std::vector<const protobuf::Descriptor*> submsgs_; |
|
absl::flat_hash_map<const protobuf::Descriptor*, int> indexes_; |
|
}; |
|
|
|
typedef std::pair<std::string, MessageLayout::Size> TableEntry; |
|
|
|
void TryFillTableEntry(const protobuf::Descriptor* message, |
|
const MessageLayout& layout, int num, TableEntry& ent) { |
|
const protobuf::FieldDescriptor* field = message->FindFieldByNumber(num); |
|
if (!field) return; |
|
|
|
std::string type = ""; |
|
std::string cardinality = ""; |
|
uint8_t wire_type = 0; |
|
switch (field->type()) { |
|
case protobuf::FieldDescriptor::TYPE_BOOL: |
|
type = "b1"; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_INT32: |
|
case protobuf::FieldDescriptor::TYPE_ENUM: |
|
case protobuf::FieldDescriptor::TYPE_UINT32: |
|
type = "v4"; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_INT64: |
|
case protobuf::FieldDescriptor::TYPE_UINT64: |
|
type = "v8"; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_SINT32: |
|
type = "z4"; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_SINT64: |
|
type = "z8"; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_STRING: |
|
case protobuf::FieldDescriptor::TYPE_BYTES: |
|
type = "s"; |
|
wire_type = 2; |
|
break; |
|
case protobuf::FieldDescriptor::TYPE_MESSAGE: |
|
if (field->is_map()) { |
|
return; // Not supported yet (ever?). |
|
} |
|
type = "m"; |
|
wire_type = 2; |
|
break; |
|
default: |
|
return; // Not supported yet. |
|
} |
|
|
|
switch (field->label()) { |
|
case protobuf::FieldDescriptor::LABEL_REPEATED: |
|
if (field->type() == protobuf::FieldDescriptor::TYPE_MESSAGE) { |
|
cardinality = "r"; |
|
break; |
|
} else { |
|
return; // Not supported yet. |
|
} |
|
case protobuf::FieldDescriptor::LABEL_OPTIONAL: |
|
case protobuf::FieldDescriptor::LABEL_REQUIRED: |
|
if (field->real_containing_oneof()) { |
|
return; // Not supported yet. |
|
} else { |
|
cardinality = "s"; |
|
} |
|
break; |
|
} |
|
|
|
uint16_t expected_tag = (num << 3) | wire_type; |
|
if (num > 15) expected_tag |= 0x100; |
|
MessageLayout::Size offset = layout.GetFieldOffset(field); |
|
uint64_t hasbit_index = 0; // Zero means no hasbits. |
|
|
|
if (layout.HasHasbit(field)) { |
|
hasbit_index = layout.GetHasbitIndex(field); |
|
if (hasbit_index > 31) return; |
|
// thas hasbits mask in the parser occupies bits 16-48 |
|
// in the 64 bit register. |
|
hasbit_index += 16; // account for the shifted hasbits |
|
} |
|
|
|
MessageLayout::Size data; |
|
|
|
data.size32 = ((uint64_t)offset.size32 << 48) | expected_tag; |
|
data.size64 = ((uint64_t)offset.size64 << 48) | expected_tag; |
|
|
|
if (field->type() == protobuf::FieldDescriptor::TYPE_MESSAGE) { |
|
SubmsgArray submsg_array(message); |
|
uint64_t idx = submsg_array.GetIndex(field); |
|
data.size32 |= idx << 16 | hasbit_index << 32; |
|
data.size64 |= idx << 16 | hasbit_index << 32; |
|
} else { |
|
uint64_t hasbit_mask = (1ull << hasbit_index) & -0x10000; |
|
data.size32 |= (uint64_t)hasbit_mask; |
|
data.size64 |= (uint64_t)hasbit_mask; |
|
} |
|
|
|
|
|
if (field->type() == protobuf::FieldDescriptor::TYPE_MESSAGE) { |
|
std::string size_ceil = "max"; |
|
size_t size = SIZE_MAX; |
|
if (field->message_type()->file() == field->file()) { |
|
MessageLayout sub_layout(field->message_type()); |
|
size = sub_layout.message_size().size64 + 8; |
|
} |
|
std::vector<size_t> breaks = {64, 128, 192, 256}; |
|
for (auto brk : breaks) { |
|
if (size <= brk) { |
|
size_ceil = std::to_string(brk); |
|
break; |
|
} |
|
} |
|
ent.first = absl::Substitute("upb_p$0$1_$2bt_max$3b", cardinality, type, |
|
(num > 15) ? "2" : "1", size_ceil); |
|
|
|
} else { |
|
ent.first = absl::Substitute("upb_p$0$1_$2bt", cardinality, type, |
|
(num > 15) ? "2" : "1"); |
|
} |
|
ent.second = data; |
|
} |
|
|
|
std::vector<TableEntry> FastDecodeTable(const protobuf::Descriptor* message, |
|
const MessageLayout& layout) { |
|
int table_size = 1; |
|
for (int i = 0; i < message->field_count(); i++) { |
|
int num = message->field(i)->number(); |
|
while (num >= table_size && num < 32) { |
|
table_size *= 2; |
|
} |
|
} |
|
|
|
std::vector<TableEntry> table; |
|
MessageLayout::Size empty_size; |
|
empty_size.size32 = 0; |
|
empty_size.size64 = 0; |
|
for (int i = 0; i < table_size; i++) { |
|
table.emplace_back(TableEntry{"fastdecode_generic", empty_size}); |
|
TryFillTableEntry(message, layout, i, table.back()); |
|
} |
|
return table; |
|
} |
|
|
|
void WriteSource(const protobuf::FileDescriptor* file, Output& output) { |
|
EmitFileWarning(file, output); |
|
|
|
output( |
|
"#include <stddef.h>\n" |
|
"#include \"upb/msg.h\"\n" |
|
"#include \"$0\"\n", |
|
HeaderFilename(file->name())); |
|
|
|
for (int i = 0; i < file->dependency_count(); i++) { |
|
output("#include \"$0\"\n", HeaderFilename(file->dependency(i)->name())); |
|
} |
|
|
|
output( |
|
"\n" |
|
"#include \"upb/port_def.inc\"\n" |
|
"\n"); |
|
|
|
|
|
for (auto message : SortedMessages(file)) { |
|
std::string msgname = ToCIdent(message->full_name()); |
|
std::string fields_array_ref = "NULL"; |
|
std::string submsgs_array_ref = "NULL"; |
|
MessageLayout layout(message); |
|
SubmsgArray submsg_array(message); |
|
|
|
if (!submsg_array.submsgs().empty()) { |
|
// TODO(haberman): could save a little bit of space by only generating a |
|
// "submsgs" array for every strongly-connected component. |
|
std::string submsgs_array_name = msgname + "_submsgs"; |
|
submsgs_array_ref = "&" + submsgs_array_name + "[0]"; |
|
output("static const upb_msglayout *const $0[$1] = {\n", |
|
submsgs_array_name, submsg_array.submsgs().size()); |
|
|
|
for (auto submsg : submsg_array.submsgs()) { |
|
output(" &$0,\n", MessageInit(submsg)); |
|
} |
|
|
|
output("};\n\n"); |
|
} |
|
|
|
std::vector<const protobuf::FieldDescriptor*> field_number_order = |
|
FieldNumberOrder(message); |
|
if (!field_number_order.empty()) { |
|
std::string fields_array_name = msgname + "__fields"; |
|
fields_array_ref = "&" + fields_array_name + "[0]"; |
|
output("static const upb_msglayout_field $0[$1] = {\n", |
|
fields_array_name, field_number_order.size()); |
|
for (auto field : field_number_order) { |
|
int submsg_index = 0; |
|
std::string presence = "0"; |
|
|
|
if (field->cpp_type() == protobuf::FieldDescriptor::CPPTYPE_MESSAGE) { |
|
submsg_index = submsg_array.GetIndex(field); |
|
} |
|
|
|
if (MessageLayout::HasHasbit(field)) { |
|
int index = layout.GetHasbitIndex(field); |
|
assert(index != 0); |
|
presence = absl::StrCat(index); |
|
} else if (field->real_containing_oneof()) { |
|
MessageLayout::Size case_offset = |
|
layout.GetOneofCaseOffset(field->real_containing_oneof()); |
|
|
|
// We encode as negative to distinguish from hasbits. |
|
case_offset.size32 = ~case_offset.size32; |
|
case_offset.size64 = ~case_offset.size64; |
|
assert(case_offset.size32 < 0); |
|
assert(case_offset.size64 < 0); |
|
presence = GetSizeInit(case_offset); |
|
} |
|
|
|
std::string label; |
|
if (field->is_map()) { |
|
label = "_UPB_LABEL_MAP"; |
|
} else if (field->is_packed()) { |
|
label = "_UPB_LABEL_PACKED"; |
|
} else { |
|
label = absl::StrCat(field->label()); |
|
} |
|
|
|
output(" {$0, $1, $2, $3, $4, $5},\n", |
|
field->number(), |
|
GetSizeInit(layout.GetFieldOffset(field)), |
|
presence, |
|
submsg_index, |
|
TableDescriptorType(field), |
|
label); |
|
} |
|
output("};\n\n"); |
|
} |
|
|
|
std::vector<TableEntry> table = FastDecodeTable(message, layout); |
|
|
|
output("const upb_msglayout $0 = {\n", MessageInit(message)); |
|
output(" $0,\n", submsgs_array_ref); |
|
output(" $0,\n", fields_array_ref); |
|
output(" $0,\n", (table.size() - 1) << 3); |
|
output(" $0, $1, $2,\n", GetSizeInit(layout.message_size()), |
|
field_number_order.size(), |
|
"false" // TODO: extendable |
|
); |
|
output(" {\n"); |
|
for (const auto& ent : table) { |
|
output(" {&$0, $1},\n", ent.first, GetSizeInit(ent.second)); |
|
} |
|
output(" },\n"); |
|
|
|
output("};\n\n"); |
|
} |
|
|
|
output("#include \"upb/port_undef.inc\"\n"); |
|
output("\n"); |
|
} |
|
|
|
void GenerateMessageDefAccessor(const protobuf::Descriptor* d, Output& output) { |
|
output("UPB_INLINE const upb_msgdef *$0_getmsgdef(upb_symtab *s) {\n", |
|
ToCIdent(d->full_name())); |
|
output(" _upb_symtab_loaddefinit(s, &$0);\n", DefInitSymbol(d->file())); |
|
output(" return upb_symtab_lookupmsg(s, \"$0\");\n", d->full_name()); |
|
output("}\n"); |
|
output("\n"); |
|
|
|
for (int i = 0; i < d->nested_type_count(); i++) { |
|
GenerateMessageDefAccessor(d->nested_type(i), output); |
|
} |
|
} |
|
|
|
void WriteDefHeader(const protobuf::FileDescriptor* file, Output& output) { |
|
EmitFileWarning(file, output); |
|
|
|
output( |
|
"#ifndef $0_UPBDEFS_H_\n" |
|
"#define $0_UPBDEFS_H_\n\n" |
|
"#include \"upb/def.h\"\n" |
|
"#include \"upb/port_def.inc\"\n" |
|
"#ifdef __cplusplus\n" |
|
"extern \"C\" {\n" |
|
"#endif\n\n", |
|
ToPreproc(file->name())); |
|
|
|
output("#include \"upb/def.h\"\n"); |
|
output("\n"); |
|
output("#include \"upb/port_def.inc\"\n"); |
|
output("\n"); |
|
|
|
output("extern upb_def_init $0;\n", DefInitSymbol(file)); |
|
output("\n"); |
|
|
|
for (int i = 0; i < file->message_type_count(); i++) { |
|
GenerateMessageDefAccessor(file->message_type(i), output); |
|
} |
|
|
|
output( |
|
"#ifdef __cplusplus\n" |
|
"} /* extern \"C\" */\n" |
|
"#endif\n" |
|
"\n" |
|
"#include \"upb/port_undef.inc\"\n" |
|
"\n" |
|
"#endif /* $0_UPBDEFS_H_ */\n", |
|
ToPreproc(file->name())); |
|
} |
|
|
|
// Escape C++ trigraphs by escaping question marks to \? |
|
std::string EscapeTrigraphs(absl::string_view to_escape) { |
|
return absl::StrReplaceAll(to_escape, {{"?", "\\?"}}); |
|
} |
|
|
|
void WriteDefSource(const protobuf::FileDescriptor* file, Output& output) { |
|
EmitFileWarning(file, output); |
|
|
|
output("#include \"upb/def.h\"\n"); |
|
output("#include \"$0\"\n", DefHeaderFilename(file->name())); |
|
output("\n"); |
|
|
|
for (int i = 0; i < file->dependency_count(); i++) { |
|
output("extern upb_def_init $0;\n", DefInitSymbol(file->dependency(i))); |
|
} |
|
|
|
std::vector<const protobuf::Descriptor*> file_messages = |
|
SortedMessages(file); |
|
|
|
for (auto message : file_messages) { |
|
output("extern const upb_msglayout $0;\n", MessageInit(message)); |
|
} |
|
output("\n"); |
|
|
|
if (!file_messages.empty()) { |
|
output("static const upb_msglayout *layouts[$0] = {\n", file_messages.size()); |
|
for (auto message : file_messages) { |
|
output(" &$0,\n", MessageInit(message)); |
|
} |
|
output("};\n"); |
|
output("\n"); |
|
} |
|
|
|
protobuf::FileDescriptorProto file_proto; |
|
file->CopyTo(&file_proto); |
|
std::string file_data; |
|
file_proto.SerializeToString(&file_data); |
|
|
|
output("static const char descriptor[$0] = {", file_data.size()); |
|
|
|
// C90 only guarantees that strings can be up to 509 characters, and some |
|
// implementations have limits here (for example, MSVC only allows 64k: |
|
// https://docs.microsoft.com/en-us/cpp/error-messages/compiler-errors-1/fatal-error-c1091. |
|
// So we always emit an array instead of a string. |
|
for (size_t i = 0; i < file_data.size();) { |
|
for (size_t j = 0; j < 25 && i < file_data.size(); ++i, ++j) { |
|
output("'$0', ", absl::CEscape(file_data.substr(i, 1))); |
|
} |
|
output("\n"); |
|
} |
|
output("};\n\n"); |
|
|
|
output("static upb_def_init *deps[$0] = {\n", file->dependency_count() + 1); |
|
for (int i = 0; i < file->dependency_count(); i++) { |
|
output(" &$0,\n", DefInitSymbol(file->dependency(i))); |
|
} |
|
output(" NULL\n"); |
|
output("};\n"); |
|
output("\n"); |
|
|
|
output("upb_def_init $0 = {\n", DefInitSymbol(file)); |
|
output(" deps,\n"); |
|
if (file_messages.empty()) { |
|
output(" NULL,\n"); |
|
} else { |
|
output(" layouts,\n"); |
|
} |
|
output(" \"$0\",\n", file->name()); |
|
output(" UPB_STRVIEW_INIT(descriptor, $0)\n", file_data.size()); |
|
output("};\n"); |
|
} |
|
|
|
bool Generator::Generate(const protobuf::FileDescriptor* file, |
|
const std::string& /* parameter */, |
|
protoc::GeneratorContext* context, |
|
std::string* /* error */) const { |
|
Output h_output(context->Open(HeaderFilename(file->name()))); |
|
WriteHeader(file, h_output); |
|
|
|
Output c_output(context->Open(SourceFilename(file->name()))); |
|
WriteSource(file, c_output); |
|
|
|
Output h_def_output(context->Open(DefHeaderFilename(file->name()))); |
|
WriteDefHeader(file, h_def_output); |
|
|
|
Output c_def_output(context->Open(DefSourceFilename(file->name()))); |
|
WriteDefSource(file, c_def_output); |
|
|
|
return true; |
|
} |
|
|
|
std::unique_ptr<google::protobuf::compiler::CodeGenerator> GetGenerator() { |
|
return std::unique_ptr<google::protobuf::compiler::CodeGenerator>( |
|
new Generator()); |
|
} |
|
|
|
} // namespace upbc
|
|
|