#!/usr/bin/python # # Protocol Buffers - Google's data interchange format # Copyright 2023 Google LLC. All rights reserved. # https://developers.google.com/protocol-buffers/ # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are # met: # # * Redistributions of source code must retain the above copyright # notice, this list of conditions and the following disclaimer. # * Redistributions in binary form must reproduce the above # copyright notice, this list of conditions and the following disclaimer # in the documentation and/or other materials provided with the # distribution. # * Neither the name of Google LLC nor the names of its # contributors may be used to endorse or promote products derived from # this software without specific prior written permission. # # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. import sys import re import os INCLUDE_RE = re.compile('^#include "([^"]*)"') def parse_include(line): match = INCLUDE_RE.match(line) return match.groups()[0] if match else None class Amalgamator: def __init__(self, h_out, c_out): self.include_paths = ["."] self.included = set() self.output_h = open(h_out, "w") self.output_c = open(c_out, "w") self.h_out = h_out.split("/")[-1] def amalgamate(self, h_files, c_files): self.h_files = set(h_files) self.output_c.write("/* Amalgamated source file */\n") self.output_c.write('#include "%s"\n' % (self.h_out)) if self.h_out == "ruby-upb.h": self.output_h.write("// Ruby is still using proto3 enum semantics for proto2\n") self.output_h.write("#define UPB_DISABLE_PROTO2_ENUM_CHECKING\n") self.output_h.write("/* Amalgamated source file */\n") port_def = self._find_include_file("upb/port/def.inc") port_undef = self._find_include_file("upb/port/undef.inc") self._process_file(port_def, self.output_h) self._process_file(port_def, self.output_c) for file in c_files: self._process_file(file, self.output_c) self._process_file(port_undef, self.output_h) self._process_file(port_undef, self.output_c) def _process_file(self, infile_name, outfile): lines = open(infile_name).readlines() has_copyright = lines[0].startswith( "// Protocol Buffers - Google's data interchange format" ) if has_copyright: while not lines[0].startswith( "// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH" " DAMAGE" ) and not lines[0].startswith( "// https://developers.google.com/open-source/licenses/bsd" ): lines.pop(0) lines.pop(0) for line in lines: if not self._process_include(line): outfile.write(line) def _find_include_file(self, name): for h_file in self.h_files: if h_file.endswith(name): return h_file def _process_include(self, line): include = parse_include(line) if not include: return False if not (include.startswith("upb") or include.startswith("google")): return False if include and (include.endswith("port/def.inc") or include.endswith("port/undef.inc")): # Skip, we handle this separately return True if include.endswith("hpp"): # Skip, we don't support the amalgamation from C++. return True elif include in self.included: return True else: # Include this upb header inline. h_file = self._find_include_file(include) if h_file: self.h_files.remove(h_file) self.included.add(include) self._process_file(h_file, self.output_h) return True raise RuntimeError("Couldn't find include: " + include + ", h_files=" + repr(self.h_files)) # ---- main ---- c_out = sys.argv[1] h_out = sys.argv[2] amalgamator = Amalgamator(h_out, c_out) c_files = [] h_files = [] for arg in sys.argv[3:]: arg = arg.strip() if arg.endswith(".h") or arg.endswith(".inc"): h_files.append(arg) else: c_files.append(arg) amalgamator.amalgamate(h_files, c_files)