Set up editions codegen tests for python

These tests aren't super useful for python because of how little codegen we actually do, but the pyi ones specifically will guard against major editions regressions.

PiperOrigin-RevId: 577495652
pull/14553/head
Mike Kruskal 1 year ago committed by Copybara-Service
parent b2efcdc1c5
commit 57bb1e55f1
  1. 157
      src/google/protobuf/compiler/python/generator.cc
  2. 6
      src/google/protobuf/compiler/python/generator.h
  3. 7
      src/google/protobuf/compiler/python/pyi_generator.cc
  4. 8
      src/google/protobuf/compiler/python/pyi_generator.h

@ -22,6 +22,8 @@
#include "google/protobuf/compiler/python/generator.h" #include "google/protobuf/compiler/python/generator.h"
#include <algorithm> #include <algorithm>
#include <cstddef>
#include <cstdint>
#include <limits> #include <limits>
#include <memory> #include <memory>
#include <string> #include <string>
@ -35,10 +37,12 @@
#include "absl/strings/escaping.h" #include "absl/strings/escaping.h"
#include "absl/strings/str_cat.h" #include "absl/strings/str_cat.h"
#include "absl/strings/str_format.h" #include "absl/strings/str_format.h"
#include "absl/strings/str_join.h"
#include "absl/strings/str_replace.h" #include "absl/strings/str_replace.h"
#include "absl/strings/string_view.h" #include "absl/strings/string_view.h"
#include "absl/strings/strip.h" #include "absl/strings/strip.h"
#include "absl/strings/substitute.h" #include "absl/strings/substitute.h"
#include "google/protobuf/compiler/code_generator.h"
#include "google/protobuf/compiler/python/helpers.h" #include "google/protobuf/compiler/python/helpers.h"
#include "google/protobuf/compiler/python/pyi_generator.h" #include "google/protobuf/compiler/python/pyi_generator.h"
#include "google/protobuf/compiler/retention.h" #include "google/protobuf/compiler/retention.h"
@ -49,6 +53,7 @@
#include "google/protobuf/io/printer.h" #include "google/protobuf/io/printer.h"
#include "google/protobuf/io/strtod.h" #include "google/protobuf/io/strtod.h"
#include "google/protobuf/io/zero_copy_stream.h" #include "google/protobuf/io/zero_copy_stream.h"
#include "google/protobuf/message.h"
namespace google { namespace google {
namespace protobuf { namespace protobuf {
@ -152,21 +157,6 @@ std::string StringifyDefaultValue(const FieldDescriptor& field) {
return ""; return "";
} }
std::string StringifySyntax(FileDescriptorLegacy::Syntax syntax) {
switch (syntax) {
case FileDescriptorLegacy::Syntax::SYNTAX_PROTO2:
return "proto2";
case FileDescriptorLegacy::Syntax::SYNTAX_PROTO3:
return "proto3";
case FileDescriptorLegacy::Syntax::SYNTAX_UNKNOWN:
default:
ABSL_LOG(FATAL)
<< "Unsupported syntax; this generator only supports proto2 "
"and proto3 syntax.";
return "";
}
}
} // namespace } // namespace
Generator::Generator() : file_(nullptr) {} Generator::Generator() : file_(nullptr) {}
@ -194,6 +184,8 @@ GeneratorOptions Generator::ParseParameter(absl::string_view parameter,
options.generate_pyi = true; options.generate_pyi = true;
} else if (option.first == "annotate_code") { } else if (option.first == "annotate_code") {
options.annotate_pyi = true; options.annotate_pyi = true;
} else if (option.first == "experimental_strip_nonfunctional_codegen") {
options.strip_nonfunctional_codegen = true;
} else { } else {
*error = absl::StrCat("Unknown generator option: ", option.first); *error = absl::StrCat("Unknown generator option: ", option.first);
} }
@ -211,8 +203,15 @@ bool Generator::Generate(const FileDescriptor* file,
// Generate pyi typing information // Generate pyi typing information
if (options.generate_pyi) { if (options.generate_pyi) {
python::PyiGenerator pyi_generator; python::PyiGenerator pyi_generator;
std::string pyi_options = options.annotate_pyi ? "annotate_code" : ""; std::vector<std::string> pyi_options;
if (!pyi_generator.Generate(file, pyi_options, context, error)) { if (options.annotate_pyi) {
pyi_options.push_back("annotate_code");
}
if (options.strip_nonfunctional_codegen) {
pyi_options.push_back("experimental_strip_nonfunctional_codegen");
}
if (!pyi_generator.Generate(file, absl::StrJoin(pyi_options, ","), context,
error)) {
return false; return false;
} }
} }
@ -423,7 +422,8 @@ void Generator::PrintFileDescriptor() const {
m["descriptor_name"] = kDescriptorKey; m["descriptor_name"] = kDescriptorKey;
m["name"] = file_->name(); m["name"] = file_->name();
m["package"] = file_->package(); m["package"] = file_->package();
m["syntax"] = StringifySyntax(FileDescriptorLegacy(file_).syntax()); m["syntax"] = std::string(
FileDescriptorLegacy::SyntaxName(FileDescriptorLegacy(file_).syntax()));
m["options"] = OptionsValue( m["options"] = OptionsValue(
StripLocalSourceRetentionOptions(*file_).SerializeAsString()); StripLocalSourceRetentionOptions(*file_).SerializeAsString());
m["serialized_descriptor"] = absl::CHexEscape(file_descriptor_serialized_); m["serialized_descriptor"] = absl::CHexEscape(file_descriptor_serialized_);
@ -677,8 +677,7 @@ void Generator::PrintDescriptor(const Descriptor& message_descriptor) const {
"options_value", OptionsValue(options_string), "extendable", "options_value", OptionsValue(options_string), "extendable",
message_descriptor.extension_range_count() > 0 ? "True" : "False", message_descriptor.extension_range_count() > 0 ? "True" : "False",
"syntax", "syntax",
StringifySyntax( FileDescriptorLegacy::SyntaxName(FileDescriptorLegacy(file_).syntax()));
FileDescriptorLegacy(message_descriptor.file()).syntax()));
printer_->Print(",\n"); printer_->Print(",\n");
// Extension ranges // Extension ranges
@ -1167,7 +1166,7 @@ void Generator::PrintSerializedPbInterval(
const DescriptorProtoT& descriptor_proto, absl::string_view name) const { const DescriptorProtoT& descriptor_proto, absl::string_view name) const {
std::string sp; std::string sp;
descriptor_proto.SerializeToString(&sp); descriptor_proto.SerializeToString(&sp);
int offset = file_descriptor_serialized_.find(sp); size_t offset = file_descriptor_serialized_.find(sp);
ABSL_CHECK_GE(offset, 0); ABSL_CHECK_GE(offset, 0);
printer_->Print( printer_->Print(
@ -1177,26 +1176,34 @@ void Generator::PrintSerializedPbInterval(
absl::StrCat(offset + sp.size())); absl::StrCat(offset + sp.size()));
} }
namespace { template <typename DescriptorT>
void PrintDescriptorOptionsFixingCode(absl::string_view descriptor, bool Generator::PrintDescriptorOptionsFixingCode(
absl::string_view options, const DescriptorT& descriptor, absl::string_view descriptor_str) const {
io::Printer* printer) { std::string options = OptionsValue(
StripLocalSourceRetentionOptions(descriptor).SerializeAsString());
// Reset the _options to None thus DescriptorBase.GetOptions() can // Reset the _options to None thus DescriptorBase.GetOptions() can
// parse _options again after extensions are registered. // parse _options again after extensions are registered.
size_t dot_pos = descriptor.find('.'); size_t dot_pos = descriptor_str.find('.');
std::string descriptor_name; std::string descriptor_name;
if (dot_pos == std::string::npos) { if (dot_pos == std::string::npos) {
descriptor_name = absl::StrCat("_globals['", descriptor, "']"); descriptor_name = absl::StrCat("_globals['", descriptor_str, "']");
} else { } else {
descriptor_name = absl::StrCat("_globals['", descriptor.substr(0, dot_pos), descriptor_name =
"']", descriptor.substr(dot_pos)); absl::StrCat("_globals['", descriptor_str.substr(0, dot_pos), "']",
descriptor_str.substr(dot_pos));
}
if (options == "None") {
return false;
} }
printer->Print(
printer_->Print(
"$descriptor_name$._options = None\n" "$descriptor_name$._options = None\n"
"$descriptor_name$._serialized_options = $serialized_value$\n", "$descriptor_name$._serialized_options = $serialized_value$\n",
"descriptor_name", descriptor_name, "serialized_value", options); "descriptor_name", descriptor_name, "serialized_value", options);
return true;
} }
} // namespace
// Generates the start and end offsets for each entity in the serialized file // Generates the start and end offsets for each entity in the serialized file
// descriptor. The file argument must exactly match what was serialized into // descriptor. The file argument must exactly match what was serialized into
@ -1246,11 +1253,7 @@ void Generator::SetMessagePbInterval(const DescriptorProto& message_proto,
// Prints expressions that set the options field of all descriptors. // Prints expressions that set the options field of all descriptors.
void Generator::FixAllDescriptorOptions() const { void Generator::FixAllDescriptorOptions() const {
// Prints an expression that sets the file descriptor's options. // Prints an expression that sets the file descriptor's options.
std::string file_options = OptionsValue( if (!PrintDescriptorOptionsFixingCode(*file_, kDescriptorKey)) {
StripLocalSourceRetentionOptions(*file_).SerializeAsString());
if (file_options != "None") {
PrintDescriptorOptionsFixingCode(kDescriptorKey, file_options, printer_);
} else {
printer_->Print("DESCRIPTOR._options = None\n"); printer_->Print("DESCRIPTOR._options = None\n");
} }
// Prints expressions that set the options for all top level enums. // Prints expressions that set the options for all top level enums.
@ -1275,35 +1278,23 @@ void Generator::FixAllDescriptorOptions() const {
} }
void Generator::FixOptionsForOneof(const OneofDescriptor& oneof) const { void Generator::FixOptionsForOneof(const OneofDescriptor& oneof) const {
std::string oneof_options = std::string oneof_name = absl::Substitute(
OptionsValue(StripLocalSourceRetentionOptions(oneof).SerializeAsString()); "$0.$1['$2']", ModuleLevelDescriptorName(*oneof.containing_type()),
if (oneof_options != "None") { "oneofs_by_name", oneof.name());
std::string oneof_name = absl::Substitute( PrintDescriptorOptionsFixingCode(oneof, oneof_name);
"$0.$1['$2']", ModuleLevelDescriptorName(*oneof.containing_type()),
"oneofs_by_name", oneof.name());
PrintDescriptorOptionsFixingCode(oneof_name, oneof_options, printer_);
}
} }
// Prints expressions that set the options for an enum descriptor and its // Prints expressions that set the options for an enum descriptor and its
// value descriptors. // value descriptors.
void Generator::FixOptionsForEnum(const EnumDescriptor& enum_descriptor) const { void Generator::FixOptionsForEnum(const EnumDescriptor& enum_descriptor) const {
std::string descriptor_name = ModuleLevelDescriptorName(enum_descriptor); std::string descriptor_name = ModuleLevelDescriptorName(enum_descriptor);
std::string enum_options = OptionsValue( PrintDescriptorOptionsFixingCode(enum_descriptor, descriptor_name);
StripLocalSourceRetentionOptions(enum_descriptor).SerializeAsString());
if (enum_options != "None") {
PrintDescriptorOptionsFixingCode(descriptor_name, enum_options, printer_);
}
for (int i = 0; i < enum_descriptor.value_count(); ++i) { for (int i = 0; i < enum_descriptor.value_count(); ++i) {
const EnumValueDescriptor& value_descriptor = *enum_descriptor.value(i); const EnumValueDescriptor& value_descriptor = *enum_descriptor.value(i);
std::string value_options = OptionsValue( PrintDescriptorOptionsFixingCode(
StripLocalSourceRetentionOptions(value_descriptor).SerializeAsString()); value_descriptor,
if (value_options != "None") { absl::StrFormat("%s.values_by_name[\"%s\"]", descriptor_name.c_str(),
PrintDescriptorOptionsFixingCode( value_descriptor.name().c_str()));
absl::StrFormat("%s.values_by_name[\"%s\"]", descriptor_name.c_str(),
value_descriptor.name().c_str()),
value_options, printer_);
}
} }
} }
@ -1313,46 +1304,33 @@ void Generator::FixOptionsForService(
const ServiceDescriptor& service_descriptor) const { const ServiceDescriptor& service_descriptor) const {
std::string descriptor_name = std::string descriptor_name =
ModuleLevelServiceDescriptorName(service_descriptor); ModuleLevelServiceDescriptorName(service_descriptor);
std::string service_options = OptionsValue( PrintDescriptorOptionsFixingCode(service_descriptor, descriptor_name);
StripLocalSourceRetentionOptions(service_descriptor).SerializeAsString());
if (service_options != "None") {
PrintDescriptorOptionsFixingCode(descriptor_name, service_options,
printer_);
}
for (int i = 0; i < service_descriptor.method_count(); ++i) { for (int i = 0; i < service_descriptor.method_count(); ++i) {
const MethodDescriptor* method = service_descriptor.method(i); const MethodDescriptor* method = service_descriptor.method(i);
std::string method_options = OptionsValue( PrintDescriptorOptionsFixingCode(
StripLocalSourceRetentionOptions(*method).SerializeAsString()); *method, absl::StrCat(descriptor_name, ".methods_by_name['",
if (method_options != "None") { method->name(), "']"));
std::string method_name = absl::StrCat(
descriptor_name, ".methods_by_name['", method->name(), "']");
PrintDescriptorOptionsFixingCode(method_name, method_options, printer_);
}
} }
} }
// Prints expressions that set the options for field descriptors (including // Prints expressions that set the options for field descriptors (including
// extensions). // extensions).
void Generator::FixOptionsForField(const FieldDescriptor& field) const { void Generator::FixOptionsForField(const FieldDescriptor& field) const {
std::string field_options = std::string field_name;
OptionsValue(StripLocalSourceRetentionOptions(field).SerializeAsString()); if (field.is_extension()) {
if (field_options != "None") { if (field.extension_scope() == nullptr) {
std::string field_name; // Top level extensions.
if (field.is_extension()) { field_name = field.name();
if (field.extension_scope() == nullptr) {
// Top level extensions.
field_name = field.name();
} else {
field_name = FieldReferencingExpression(field.extension_scope(), field,
"extensions_by_name");
}
} else { } else {
field_name = FieldReferencingExpression(field.containing_type(), field, field_name = FieldReferencingExpression(field.extension_scope(), field,
"fields_by_name"); "extensions_by_name");
} }
PrintDescriptorOptionsFixingCode(field_name, field_options, printer_); } else {
field_name = FieldReferencingExpression(field.containing_type(), field,
"fields_by_name");
} }
PrintDescriptorOptionsFixingCode(field, field_name);
} }
// Prints expressions that set the options for a message and all its inner // Prints expressions that set the options for a message and all its inner
@ -1381,13 +1359,8 @@ void Generator::FixOptionsForMessage(const Descriptor& descriptor) const {
FixOptionsForField(field); FixOptionsForField(field);
} }
// Message option for this message. // Message option for this message.
std::string message_options = OptionsValue( PrintDescriptorOptionsFixingCode(descriptor,
StripLocalSourceRetentionOptions(descriptor).SerializeAsString()); ModuleLevelDescriptorName(descriptor));
if (message_options != "None") {
std::string descriptor_name = ModuleLevelDescriptorName(descriptor);
PrintDescriptorOptionsFixingCode(descriptor_name, message_options,
printer_);
}
} }
// If a dependency forwards other files through public dependencies, let's // If a dependency forwards other files through public dependencies, let's

@ -12,6 +12,7 @@
#ifndef GOOGLE_PROTOBUF_COMPILER_PYTHON_GENERATOR_H__ #ifndef GOOGLE_PROTOBUF_COMPILER_PYTHON_GENERATOR_H__
#define GOOGLE_PROTOBUF_COMPILER_PYTHON_GENERATOR_H__ #define GOOGLE_PROTOBUF_COMPILER_PYTHON_GENERATOR_H__
#include <cstdint>
#include <string> #include <string>
#include <vector> #include <vector>
@ -49,6 +50,7 @@ struct GeneratorOptions {
bool generate_pyi = false; bool generate_pyi = false;
bool annotate_pyi = false; bool annotate_pyi = false;
bool bootstrap = false; bool bootstrap = false;
bool strip_nonfunctional_codegen = false;
}; };
class PROTOC_EXPORT Generator : public CodeGenerator { class PROTOC_EXPORT Generator : public CodeGenerator {
@ -141,6 +143,10 @@ class PROTOC_EXPORT Generator : public CodeGenerator {
void PrintSerializedPbInterval(const DescriptorProtoT& descriptor_proto, void PrintSerializedPbInterval(const DescriptorProtoT& descriptor_proto,
absl::string_view name) const; absl::string_view name) const;
template <typename DescriptorT>
bool PrintDescriptorOptionsFixingCode(const DescriptorT& descriptor,
absl::string_view descriptor_str) const;
void FixAllDescriptorOptions() const; void FixAllDescriptorOptions() const;
void FixOptionsForField(const FieldDescriptor& field) const; void FixOptionsForField(const FieldDescriptor& field) const;
void FixOptionsForOneof(const OneofDescriptor& oneof) const; void FixOptionsForOneof(const OneofDescriptor& oneof) const;

@ -18,6 +18,7 @@
#include "absl/strings/match.h" #include "absl/strings/match.h"
#include "absl/strings/str_split.h" #include "absl/strings/str_split.h"
#include "absl/strings/string_view.h" #include "absl/strings/string_view.h"
#include "google/protobuf/compiler/code_generator.h"
#include "google/protobuf/compiler/python/helpers.h" #include "google/protobuf/compiler/python/helpers.h"
#include "google/protobuf/descriptor.h" #include "google/protobuf/descriptor.h"
#include "google/protobuf/descriptor.pb.h" #include "google/protobuf/descriptor.pb.h"
@ -169,6 +170,9 @@ void PyiGenerator::PrintImports() const {
bool has_importlib = false; bool has_importlib = false;
for (int i = 0; i < file_->dependency_count(); ++i) { for (int i = 0; i < file_->dependency_count(); ++i) {
const FileDescriptor* dep = file_->dependency(i); const FileDescriptor* dep = file_->dependency(i);
if (strip_nonfunctional_codegen_ && IsKnownFeatureProto(dep->name())) {
continue;
}
PrintImportForDescriptor(*dep, &seen_aliases, &has_importlib); PrintImportForDescriptor(*dep, &seen_aliases, &has_importlib);
for (int j = 0; j < dep->public_dependency_count(); ++j) { for (int j = 0; j < dep->public_dependency_count(); ++j) {
PrintImportForDescriptor(*dep->public_dependency(j), &seen_aliases, PrintImportForDescriptor(*dep->public_dependency(j), &seen_aliases,
@ -570,11 +574,14 @@ bool PyiGenerator::Generate(const FileDescriptor* file,
std::string filename; std::string filename;
bool annotate_code = false; bool annotate_code = false;
strip_nonfunctional_codegen_ = false;
for (const std::pair<std::string, std::string>& option : options) { for (const std::pair<std::string, std::string>& option : options) {
if (option.first == "annotate_code") { if (option.first == "annotate_code") {
annotate_code = true; annotate_code = true;
} else if (absl::EndsWith(option.first, ".pyi")) { } else if (absl::EndsWith(option.first, ".pyi")) {
filename = option.first; filename = option.first;
} else if (option.first == "experimental_strip_nonfunctional_codegen") {
strip_nonfunctional_codegen_ = true;
} else { } else {
*error = absl::StrCat("Unknown generator option: ", option.first); *error = absl::StrCat("Unknown generator option: ", option.first);
return false; return false;

@ -13,6 +13,7 @@
#define GOOGLE_PROTOBUF_COMPILER_PYTHON_PYI_GENERATOR_H__ #define GOOGLE_PROTOBUF_COMPILER_PYTHON_PYI_GENERATOR_H__
#include <string> #include <string>
#include <vector>
#include "absl/container/flat_hash_map.h" #include "absl/container/flat_hash_map.h"
#include "absl/container/flat_hash_set.h" #include "absl/container/flat_hash_set.h"
@ -53,6 +54,12 @@ class PROTOC_EXPORT PyiGenerator : public google::protobuf::compiler::CodeGenera
GeneratorContext* generator_context, GeneratorContext* generator_context,
std::string* error) const override; std::string* error) const override;
Edition GetMinimumEdition() const override { return Edition::EDITION_PROTO2; }
Edition GetMaximumEdition() const override { return Edition::EDITION_2023; }
std::vector<const FieldDescriptor*> GetFeatureExtensions() const override {
return {};
}
private: private:
void PrintImportForDescriptor(const FileDescriptor& desc, void PrintImportForDescriptor(const FileDescriptor& desc,
absl::flat_hash_set<std::string>* seen_aliases, absl::flat_hash_set<std::string>* seen_aliases,
@ -83,6 +90,7 @@ class PROTOC_EXPORT PyiGenerator : public google::protobuf::compiler::CodeGenera
mutable absl::Mutex mutex_; mutable absl::Mutex mutex_;
mutable const FileDescriptor* file_; // Set in Generate(). Under mutex_. mutable const FileDescriptor* file_; // Set in Generate(). Under mutex_.
mutable io::Printer* printer_; // Set in Generate(). Under mutex_. mutable io::Printer* printer_; // Set in Generate(). Under mutex_.
mutable bool strip_nonfunctional_codegen_ = false; // Set in Generate().
// import_map will be a mapping from filename to module alias, e.g. // import_map will be a mapping from filename to module alias, e.g.
// "google3/foo/bar.py" -> "_bar" // "google3/foo/bar.py" -> "_bar"
mutable absl::flat_hash_map<std::string, std::string> import_map_; mutable absl::flat_hash_map<std::string, std::string> import_map_;

Loading…
Cancel
Save