parent
a2004150f8
commit
273398ca5f
5 changed files with 49 additions and 429 deletions
@ -1,233 +0,0 @@ |
|||||||
// Copyright (c) 2009-2021, Google LLC
|
|
||||||
// All rights reserved.
|
|
||||||
//
|
|
||||||
// Redistribution and use in source and binary forms, with or without
|
|
||||||
// modification, are permitted provided that the following conditions are met:
|
|
||||||
// * Redistributions of source code must retain the above copyright
|
|
||||||
// notice, this list of conditions and the following disclaimer.
|
|
||||||
// * Redistributions in binary form must reproduce the above copyright
|
|
||||||
// notice, this list of conditions and the following disclaimer in the
|
|
||||||
// documentation and/or other materials provided with the distribution.
|
|
||||||
// * Neither the name of Google LLC nor the
|
|
||||||
// names of its contributors may be used to endorse or promote products
|
|
||||||
// derived from this software without specific prior written permission.
|
|
||||||
//
|
|
||||||
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
||||||
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
||||||
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
||||||
// ARE DISCLAIMED. IN NO EVENT SHALL Google LLC BE LIABLE FOR ANY DIRECT,
|
|
||||||
// INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
|
||||||
// (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
|
||||||
// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
|
|
||||||
// ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
||||||
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
||||||
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
||||||
|
|
||||||
#include "upbc/message_layout.h" |
|
||||||
|
|
||||||
#include "google/protobuf/descriptor.pb.h" |
|
||||||
|
|
||||||
namespace upbc { |
|
||||||
|
|
||||||
namespace protobuf = ::google::protobuf; |
|
||||||
|
|
||||||
static int64_t DivRoundUp(int64_t a, int64_t b) { |
|
||||||
ABSL_ASSERT(a >= 0); |
|
||||||
ABSL_ASSERT(b > 0); |
|
||||||
return (a + b - 1) / b; |
|
||||||
} |
|
||||||
|
|
||||||
MessageLayout::Size MessageLayout::Place( |
|
||||||
MessageLayout::SizeAndAlign size_and_align) { |
|
||||||
Size offset = size_; |
|
||||||
offset.AlignUp(size_and_align.align); |
|
||||||
size_ = offset; |
|
||||||
size_.Add(size_and_align.size); |
|
||||||
ABSL_ASSERT(IsPowerOfTwo(size_and_align.align.size32)); |
|
||||||
ABSL_ASSERT(IsPowerOfTwo(size_and_align.align.size64)); |
|
||||||
maxalign_.MaxFrom(size_and_align.align); |
|
||||||
return offset; |
|
||||||
} |
|
||||||
|
|
||||||
bool MessageLayout::HasHasbit(const protobuf::FieldDescriptor* field) { |
|
||||||
return field->has_presence() && !field->real_containing_oneof() && |
|
||||||
!field->containing_type()->options().map_entry(); |
|
||||||
} |
|
||||||
|
|
||||||
MessageLayout::SizeAndAlign MessageLayout::SizeOf( |
|
||||||
const protobuf::FieldDescriptor* field) { |
|
||||||
if (field->is_repeated()) { |
|
||||||
return {{4, 8}, {4, 8}}; // Pointer to array object.
|
|
||||||
} else { |
|
||||||
return SizeOfUnwrapped(field); |
|
||||||
} |
|
||||||
} |
|
||||||
|
|
||||||
MessageLayout::SizeAndAlign MessageLayout::SizeOfUnwrapped( |
|
||||||
const protobuf::FieldDescriptor* field) { |
|
||||||
switch (field->cpp_type()) { |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_MESSAGE: |
|
||||||
return {{4, 8}, {4, 8}}; // Pointer to message.
|
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_STRING: |
|
||||||
return {{8, 16}, {4, 8}}; // upb_StringView
|
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_BOOL: |
|
||||||
return {{1, 1}, {1, 1}}; |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_FLOAT: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_INT32: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_UINT32: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_ENUM: |
|
||||||
return {{4, 4}, {4, 4}}; |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_INT64: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_UINT64: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_DOUBLE: |
|
||||||
return {{8, 8}, {8, 8}}; |
|
||||||
} |
|
||||||
assert(false); |
|
||||||
return {{-1, -1}, {-1, -1}}; |
|
||||||
} |
|
||||||
|
|
||||||
int64_t MessageLayout::FieldLayoutRank(const protobuf::FieldDescriptor* field) { |
|
||||||
// Order:
|
|
||||||
// 1, 2, 3. primitive fields (8, 4, 1 byte)
|
|
||||||
// 4. string fields
|
|
||||||
// 5. submessage fields
|
|
||||||
// 6. repeated fields
|
|
||||||
//
|
|
||||||
// This has the following nice properties:
|
|
||||||
//
|
|
||||||
// 1. padding alignment is (nearly) minimized.
|
|
||||||
// 2. fields that might have defaults (1-4) are segregated
|
|
||||||
// from fields that are always zero-initialized (5-7).
|
|
||||||
//
|
|
||||||
// We skip oneof fields, because they are emitted in a separate pass.
|
|
||||||
int64_t rank; |
|
||||||
if (field->containing_oneof()) { |
|
||||||
fprintf(stderr, "shouldn't have oneofs here.\n"); |
|
||||||
abort(); |
|
||||||
} else if (field->label() == protobuf::FieldDescriptor::LABEL_REPEATED) { |
|
||||||
rank = 6; |
|
||||||
} else { |
|
||||||
switch (field->cpp_type()) { |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_MESSAGE: |
|
||||||
rank = 5; |
|
||||||
break; |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_STRING: |
|
||||||
rank = 4; |
|
||||||
break; |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_BOOL: |
|
||||||
rank = 3; |
|
||||||
break; |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_FLOAT: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_INT32: |
|
||||||
case protobuf::FieldDescriptor::CPPTYPE_UINT32: |
|
||||||
rank = 2; |
|
||||||
break; |
|
||||||
default: |
|
||||||
rank = 1; |
|
||||||
break; |
|
||||||
} |
|
||||||
} |
|
||||||
|
|
||||||
// Break ties with field number.
|
|
||||||
return (rank << 29) | field->number(); |
|
||||||
} |
|
||||||
|
|
||||||
void MessageLayout::ComputeLayout(const protobuf::Descriptor* descriptor) { |
|
||||||
size_ = Size{0, 0}; |
|
||||||
maxalign_ = Size{8, 8}; |
|
||||||
|
|
||||||
if (descriptor->options().map_entry()) { |
|
||||||
// Map entries aren't actually stored, they are only used during parsing.
|
|
||||||
// For parsing, it helps a lot if all map entry messages have the same
|
|
||||||
// layout.
|
|
||||||
SizeAndAlign size{{8, 16}, {4, 8}}; // upb_StringView
|
|
||||||
field_offsets_[descriptor->FindFieldByNumber(1)] = Place(size); |
|
||||||
field_offsets_[descriptor->FindFieldByNumber(2)] = Place(size); |
|
||||||
} else { |
|
||||||
PlaceNonOneofFields(descriptor); |
|
||||||
PlaceOneofFields(descriptor); |
|
||||||
} |
|
||||||
|
|
||||||
// Align overall size up to max size.
|
|
||||||
size_.AlignUp(maxalign_); |
|
||||||
} |
|
||||||
|
|
||||||
void MessageLayout::PlaceNonOneofFields( |
|
||||||
const protobuf::Descriptor* descriptor) { |
|
||||||
std::vector<const protobuf::FieldDescriptor*> field_order; |
|
||||||
for (int i = 0; i < descriptor->field_count(); i++) { |
|
||||||
const protobuf::FieldDescriptor* field = descriptor->field(i); |
|
||||||
if (!field->containing_oneof()) { |
|
||||||
field_order.push_back(descriptor->field(i)); |
|
||||||
} |
|
||||||
} |
|
||||||
std::sort(field_order.begin(), field_order.end(), |
|
||||||
[](const protobuf::FieldDescriptor* a, |
|
||||||
const protobuf::FieldDescriptor* b) { |
|
||||||
return FieldLayoutRank(a) < FieldLayoutRank(b); |
|
||||||
}); |
|
||||||
|
|
||||||
// Place/count hasbits.
|
|
||||||
hasbit_count_ = 0; |
|
||||||
required_count_ = 0; |
|
||||||
for (auto field : FieldHotnessOrder(descriptor)) { |
|
||||||
if (HasHasbit(field)) { |
|
||||||
// We don't use hasbit 0, so that 0 can indicate "no presence" in the
|
|
||||||
// table. This wastes one hasbit, but we don't worry about it for now.
|
|
||||||
int index = ++hasbit_count_; |
|
||||||
hasbit_indexes_[field] = index; |
|
||||||
if (field->is_required()) { |
|
||||||
if (index > 63) { |
|
||||||
// This could be fixed in the decoder without too much trouble. But
|
|
||||||
// we expect this to be so rare that we don't worry about it for now.
|
|
||||||
std::cerr << "upb does not support messages with more than 63 " |
|
||||||
"required fields: " |
|
||||||
<< field->full_name() << "\n"; |
|
||||||
exit(1); |
|
||||||
} |
|
||||||
required_count_++; |
|
||||||
} |
|
||||||
} |
|
||||||
} |
|
||||||
|
|
||||||
// Place hasbits at the beginning.
|
|
||||||
hasbit_bytes_ = hasbit_count_ ? DivRoundUp(hasbit_count_ + 1, 8) : 0; |
|
||||||
Place(SizeAndAlign{{hasbit_bytes_, hasbit_bytes_}, {1, 1}}); |
|
||||||
|
|
||||||
// Place non-oneof fields.
|
|
||||||
for (auto field : field_order) { |
|
||||||
field_offsets_[field] = Place(SizeOf(field)); |
|
||||||
} |
|
||||||
} |
|
||||||
|
|
||||||
void MessageLayout::PlaceOneofFields(const protobuf::Descriptor* descriptor) { |
|
||||||
std::vector<const protobuf::OneofDescriptor*> oneof_order; |
|
||||||
for (int i = 0; i < descriptor->oneof_decl_count(); i++) { |
|
||||||
oneof_order.push_back(descriptor->oneof_decl(i)); |
|
||||||
} |
|
||||||
std::sort(oneof_order.begin(), oneof_order.end(), |
|
||||||
[](const protobuf::OneofDescriptor* a, |
|
||||||
const protobuf::OneofDescriptor* b) { |
|
||||||
return a->full_name() < b->full_name(); |
|
||||||
}); |
|
||||||
|
|
||||||
for (auto oneof : oneof_order) { |
|
||||||
SizeAndAlign oneof_maxsize{{0, 0}, {0, 0}}; |
|
||||||
// Calculate max size.
|
|
||||||
for (int i = 0; i < oneof->field_count(); i++) { |
|
||||||
oneof_maxsize.MaxFrom(SizeOf(oneof->field(i))); |
|
||||||
} |
|
||||||
|
|
||||||
// Place discriminator enum and data.
|
|
||||||
Size data = Place(oneof_maxsize); |
|
||||||
Size discriminator = Place(SizeAndAlign{{4, 4}, {4, 4}}); |
|
||||||
|
|
||||||
oneof_case_offsets_[oneof] = discriminator; |
|
||||||
|
|
||||||
for (int i = 0; i < oneof->field_count(); i++) { |
|
||||||
field_offsets_[oneof->field(i)] = data; |
|
||||||
} |
|
||||||
} |
|
||||||
} |
|
||||||
|
|
||||||
} // namespace upbc
|
|
@ -1,163 +0,0 @@ |
|||||||
/*
|
|
||||||
* Copyright (c) 2009-2021, Google LLC |
|
||||||
* All rights reserved. |
|
||||||
* |
|
||||||
* Redistribution and use in source and binary forms, with or without |
|
||||||
* modification, are permitted provided that the following conditions are met: |
|
||||||
* * Redistributions of source code must retain the above copyright |
|
||||||
* notice, this list of conditions and the following disclaimer. |
|
||||||
* * Redistributions in binary form must reproduce the above copyright |
|
||||||
* notice, this list of conditions and the following disclaimer in the |
|
||||||
* documentation and/or other materials provided with the distribution. |
|
||||||
* * Neither the name of Google LLC nor the |
|
||||||
* names of its contributors may be used to endorse or promote products |
|
||||||
* derived from this software without specific prior written permission. |
|
||||||
* |
|
||||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
|
||||||
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
|
||||||
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
|
||||||
* ARE DISCLAIMED. IN NO EVENT SHALL Google LLC BE LIABLE FOR ANY DIRECT, |
|
||||||
* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |
|
||||||
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
|
||||||
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |
|
||||||
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
|
||||||
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
|
||||||
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
||||||
*/ |
|
||||||
|
|
||||||
#ifndef UPBC_MESSAGE_LAYOUT_H |
|
||||||
#define UPBC_MESSAGE_LAYOUT_H |
|
||||||
|
|
||||||
#include "absl/base/macros.h" |
|
||||||
#include "absl/container/flat_hash_map.h" |
|
||||||
#include "google/protobuf/descriptor.h" |
|
||||||
#include "upb/upb.hpp" |
|
||||||
#include "upb/mini_table.h" |
|
||||||
|
|
||||||
namespace upbc { |
|
||||||
|
|
||||||
class MessageLayout { |
|
||||||
public: |
|
||||||
struct Size { |
|
||||||
void Add(const Size& other) { |
|
||||||
size32 += other.size32; |
|
||||||
size64 += other.size64; |
|
||||||
} |
|
||||||
|
|
||||||
void MaxFrom(const Size& other) { |
|
||||||
size32 = std::max(size32, other.size32); |
|
||||||
size64 = std::max(size64, other.size64); |
|
||||||
} |
|
||||||
|
|
||||||
void AlignUp(const Size& align) { |
|
||||||
size32 = Align(size32, align.size32); |
|
||||||
size64 = Align(size64, align.size64); |
|
||||||
} |
|
||||||
|
|
||||||
int64_t size32; |
|
||||||
int64_t size64; |
|
||||||
}; |
|
||||||
|
|
||||||
struct SizeAndAlign { |
|
||||||
Size size; |
|
||||||
Size align; |
|
||||||
|
|
||||||
void MaxFrom(const SizeAndAlign& other) { |
|
||||||
size.MaxFrom(other.size); |
|
||||||
align.MaxFrom(other.align); |
|
||||||
} |
|
||||||
}; |
|
||||||
|
|
||||||
MessageLayout(const google::protobuf::Descriptor* descriptor) { |
|
||||||
ComputeLayout(descriptor); |
|
||||||
} |
|
||||||
|
|
||||||
Size GetFieldOffset(const google::protobuf::FieldDescriptor* field) const { |
|
||||||
return GetMapValue(field_offsets_, field); |
|
||||||
} |
|
||||||
|
|
||||||
Size GetOneofCaseOffset( |
|
||||||
const google::protobuf::OneofDescriptor* oneof) const { |
|
||||||
return GetMapValue(oneof_case_offsets_, oneof); |
|
||||||
} |
|
||||||
|
|
||||||
int GetHasbitIndex(const google::protobuf::FieldDescriptor* field) const { |
|
||||||
return GetMapValue(hasbit_indexes_, field); |
|
||||||
} |
|
||||||
|
|
||||||
Size message_size() const { return size_; } |
|
||||||
|
|
||||||
int hasbit_count() const { return hasbit_count_; } |
|
||||||
int hasbit_bytes() const { return hasbit_bytes_; } |
|
||||||
|
|
||||||
// Required fields always have the lowest hasbits.
|
|
||||||
int required_count() const { return required_count_; } |
|
||||||
|
|
||||||
static bool HasHasbit(const google::protobuf::FieldDescriptor* field); |
|
||||||
static SizeAndAlign SizeOfUnwrapped( |
|
||||||
const google::protobuf::FieldDescriptor* field); |
|
||||||
|
|
||||||
private: |
|
||||||
void ComputeLayout(const google::protobuf::Descriptor* descriptor); |
|
||||||
void PlaceNonOneofFields(const google::protobuf::Descriptor* descriptor); |
|
||||||
void PlaceOneofFields(const google::protobuf::Descriptor* descriptor); |
|
||||||
Size Place(SizeAndAlign size_and_align); |
|
||||||
|
|
||||||
template <class K, class V> |
|
||||||
static V GetMapValue(const absl::flat_hash_map<K, V>& map, K key) { |
|
||||||
auto iter = map.find(key); |
|
||||||
if (iter == map.end()) { |
|
||||||
fprintf(stderr, "No value for field.\n"); |
|
||||||
abort(); |
|
||||||
} |
|
||||||
return iter->second; |
|
||||||
} |
|
||||||
|
|
||||||
static bool IsPowerOfTwo(size_t val) { return (val & (val - 1)) == 0; } |
|
||||||
|
|
||||||
static size_t Align(size_t val, size_t align) { |
|
||||||
if (!IsPowerOfTwo(align)) { |
|
||||||
fprintf(stderr, "YO! Align is: %d\n", (int)align); |
|
||||||
} |
|
||||||
ABSL_ASSERT(IsPowerOfTwo(align)); |
|
||||||
return (val + align - 1) & ~(align - 1); |
|
||||||
} |
|
||||||
|
|
||||||
static SizeAndAlign SizeOf(const google::protobuf::FieldDescriptor* field); |
|
||||||
static int64_t FieldLayoutRank( |
|
||||||
const google::protobuf::FieldDescriptor* field); |
|
||||||
|
|
||||||
absl::flat_hash_map<const google::protobuf::FieldDescriptor*, Size> |
|
||||||
field_offsets_; |
|
||||||
absl::flat_hash_map<const google::protobuf::FieldDescriptor*, int> |
|
||||||
hasbit_indexes_; |
|
||||||
absl::flat_hash_map<const google::protobuf::OneofDescriptor*, Size> |
|
||||||
oneof_case_offsets_; |
|
||||||
Size maxalign_; |
|
||||||
Size size_; |
|
||||||
int hasbit_count_; |
|
||||||
int hasbit_bytes_; |
|
||||||
int required_count_ = 0; |
|
||||||
}; |
|
||||||
|
|
||||||
// Returns fields in order of "hotness", eg. how frequently they appear in
|
|
||||||
// serialized payloads. Ideally this will use a profile. When we don't have
|
|
||||||
// that, we assume that fields with smaller numbers are used more frequently.
|
|
||||||
inline std::vector<const google::protobuf::FieldDescriptor*> FieldHotnessOrder( |
|
||||||
const google::protobuf::Descriptor* message) { |
|
||||||
std::vector<const google::protobuf::FieldDescriptor*> fields; |
|
||||||
for (int i = 0; i < message->field_count(); i++) { |
|
||||||
fields.push_back(message->field(i)); |
|
||||||
} |
|
||||||
std::sort(fields.begin(), fields.end(), |
|
||||||
[](const google::protobuf::FieldDescriptor* a, |
|
||||||
const google::protobuf::FieldDescriptor* b) { |
|
||||||
return std::make_pair(!a->is_required(), a->number()) < |
|
||||||
std::make_pair(!b->is_required(), b->number()); |
|
||||||
}); |
|
||||||
return fields; |
|
||||||
} |
|
||||||
|
|
||||||
} // namespace upbc
|
|
||||||
|
|
||||||
#endif // UPBC_MESSAGE_LAYOUT_H
|
|
Loading…
Reference in new issue