#!/usr/bin/env python3

# Copyright 2015 gRPC authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Check (and optionally fix) the copyright header of tracked source files.

The expected header is built from the lines of NOTICE.txt, prefixed with the
comment syntax appropriate for each file type. The script exits with status 1
if any checked file is missing the header, and 0 otherwise.
"""

import argparse
import datetime
import os
import re
import subprocess
import sys

# find our home
ROOT = os.path.abspath(os.path.join(os.path.dirname(sys.argv[0]), "../.."))
os.chdir(ROOT)

# parse command line
argp = argparse.ArgumentParser(description="copyright checker")
argp.add_argument(
    "-o", "--output", default="details", choices=["list", "details"]
)
argp.add_argument("-s", "--skips", default=0, action="store_const", const=1)
argp.add_argument("-a", "--ancient", default=0, action="store_const", const=1)
argp.add_argument("--precommit", action="store_true")
argp.add_argument("--fix", action="store_true")
args = argp.parse_args()

# open the license text
with open("NOTICE.txt") as f:
    LICENSE_NOTICE = f.read().splitlines()

# License comment prefix by file type.
# The key is the file extension (or the bare file name for extension-less
# files such as "Makefile"); the value is a regular expression matching the
# comment prefix expected in front of every line of the license text.
LICENSE_PREFIX_RE = {
    ".bat": r"@rem\s*",
    ".c": r"\s*(?://|\*)\s*",
    ".cc": r"\s*(?://|\*)\s*",
    ".h": r"\s*(?://|\*)\s*",
    ".m": r"\s*\*\s*",
    ".mm": r"\s*\*\s*",
    ".php": r"\s*\*\s*",
    ".js": r"\s*\*\s*",
    ".py": r"#\s*",
    ".pyx": r"#\s*",
    ".pxd": r"#\s*",
    ".pxi": r"#\s*",
    ".rb": r"#\s*",
    ".sh": r"#\s*",
    ".proto": r"//\s*",
    ".cs": r"//\s*",
    ".mak": r"#\s*",
    ".bazel": r"#\s*",
    ".bzl": r"#\s*",
    "Makefile": r"#\s*",
    "Dockerfile": r"#\s*",
    "BUILD": r"#\s*",
}

# The key is the file extension, while the value is a tuple of fields
# (header, prefix, footer).
# For example, for javascript multi-line comments, the header will be '/*', the
# prefix will be '*' and the footer will be '*/'.
# If header and footer are irrelevant for a specific file extension, they are
# set to None.
LICENSE_PREFIX_TEXT = {
    ".bat": (None, "@rem", None),
    ".c": (None, "//", None),
    ".cc": (None, "//", None),
    ".h": (None, "//", None),
    ".m": ("/**", " *", " */"),
    ".mm": ("/**", " *", " */"),
    ".php": ("/**", " *", " */"),
    ".js": ("/**", " *", " */"),
    ".py": (None, "#", None),
    ".pyx": (None, "#", None),
    ".pxd": (None, "#", None),
    ".pxi": (None, "#", None),
    ".rb": (None, "#", None),
    ".sh": (None, "#", None),
    ".proto": (None, "//", None),
    ".cs": (None, "//", None),
    ".mak": (None, "#", None),
    ".bazel": (None, "#", None),
    ".bzl": (None, "#", None),
    "Makefile": (None, "#", None),
    "Dockerfile": (None, "#", None),
    "BUILD": (None, "#", None),
}

# Files that are never checked.
_EXEMPT = frozenset(
    (
        # Generated protocol compiler output.
        "examples/python/helloworld/helloworld_pb2.py",
        "examples/python/helloworld/helloworld_pb2_grpc.py",
        "examples/python/multiplex/helloworld_pb2.py",
        "examples/python/multiplex/helloworld_pb2_grpc.py",
        "examples/python/multiplex/route_guide_pb2.py",
        "examples/python/multiplex/route_guide_pb2_grpc.py",
        "examples/python/route_guide/route_guide_pb2.py",
        "examples/python/route_guide/route_guide_pb2_grpc.py",
        # Generated doxygen config file
        "tools/doxygen/Doxyfile.php",
        # An older file originally from outside gRPC.
        "src/php/tests/bootstrap.php",
        # census.proto copied from github
        "tools/grpcz/census.proto",
        # status.proto copied from googleapis
        "src/proto/grpc/status/status.proto",
        # Gradle wrappers used to build for Android
        "examples/android/helloworld/gradlew.bat",
        "src/android/test/interop/gradlew.bat",
        # Designer-generated source
        "examples/csharp/HelloworldXamarin/Droid/Resources/Resource.designer.cs",
        "examples/csharp/HelloworldXamarin/iOS/ViewController.designer.cs",
        # BoringSSL generated header. It has commit version information at the head
        # of the file so we cannot check the license info.
        "src/boringssl/boringssl_prefix_symbols.h",
    )
)

# .cc/.h files under these path prefixes must use a "//"-style header.
_ENFORCE_CPP_STYLE_COMMENT_PATH_PREFIX = (
    "include/grpc++/",
    "include/grpcpp/",
    "src/core/",
    "src/cpp/",
    "test/core/",
    "test/cpp/",
    "fuzztest/",
)

# Suffixes of upb generated code, which is skipped entirely.
_UPB_GENERATED_SUFFIXES = (".upb.h", ".upb.c", ".upbdefs.h", ".upbdefs.c")

# Matches the copyright line of the notice with any year (or year range).
RE_YEAR = (
    r"Copyright (?P<first_year>[0-9]+\-)?(?P<last_year>[0-9]+) ([Tt]he )?gRPC"
    r" [Aa]uthors(\.|)"
)


def _license_body_re(prefix_re):
    """Return a regex matching every notice line preceded by `prefix_re`.

    The copyright line of the notice is matched with RE_YEAR so that any year
    is accepted; every other line must match literally. Lines are joined with
    a regex newline escape.
    """
    return r"\n".join(
        prefix_re
        + (RE_YEAR if re.search(RE_YEAR, line) else re.escape(line))
        for line in LICENSE_NOTICE
    )


# Per file type regex for the complete license header.
RE_LICENSE = {
    key: _license_body_re(prefix_re)
    for key, prefix_re in LICENSE_PREFIX_RE.items()
}

RE_C_STYLE_COMMENT_START = r"^/\*\s*\n"
RE_C_STYLE_COMMENT_OPTIONAL_LINE = r"(?:\s*\*\s*\n)*"
RE_C_STYLE_COMMENT_END = r"\s*\*/"
RE_C_STYLE_COMMENT_LICENSE = (
    RE_C_STYLE_COMMENT_START
    + RE_C_STYLE_COMMENT_OPTIONAL_LINE
    + _license_body_re(r"\s*(?:\*)\s*")
    + r"\n"
    + RE_C_STYLE_COMMENT_OPTIONAL_LINE
    + RE_C_STYLE_COMMENT_END
)
RE_CPP_STYLE_COMMENT_LICENSE = _license_body_re(r"\s*(?://)\s*")

YEAR = datetime.datetime.now().year

LICENSE_YEAR = f"Copyright {YEAR} gRPC authors."


def join_license_text(header, prefix, footer, notice):
    """Render the license notice as a comment block.

    Args:
        header: Line opening the comment block, or None if not needed.
        prefix: Comment prefix put in front of every notice line.
        footer: Line closing the comment block, or None if not needed.
        notice: The notice text as a list of lines. The line matching RE_YEAR
            is replaced by LICENSE_YEAR (i.e. the current year).

    Returns:
        The comment block as a single string terminated by a newline.
    """

    def add_prefix(prefix, line):
        # Don't put whitespace between prefix and empty line to avoid having
        # trailing whitespaces.
        return prefix + ("" if len(line) == 0 else " ") + line

    text = (header + "\n") if header else ""
    text += "\n".join(
        add_prefix(prefix, (LICENSE_YEAR if re.search(RE_YEAR, line) else line))
        for line in notice
    )
    text += "\n"
    if footer:
        text += footer + "\n"
    return text


# Per file type license header text, used when fixing files.
LICENSE_TEXT = {
    key: join_license_text(header, prefix, footer, LICENSE_NOTICE)
    for key, (header, prefix, footer) in LICENSE_PREFIX_TEXT.items()
}

# Shell pipeline producing the list of files to check. Raw strings keep the
# backslashes intended for grep without relying on invalid Python escapes.
if args.precommit:
    FILE_LIST_COMMAND = (
        r"git status -z | grep -Poz '(?<=^[MARC][MARCD ] )[^\s]+'"
    )
else:
    FILE_LIST_COMMAND = (
        "git ls-tree -r --name-only -r HEAD | "
        "grep -v ^third_party/ |"
        r'grep -v "\(ares_config.h\|ares_build.h\)"'
    )


def load(name):
    """Return the full text content of the file `name`."""
    with open(name) as f:
        return f.read()


def save(name, text):
    """Overwrite the file `name` with `text`."""
    with open(name, "w") as f:
        f.write(text)


# Sanity check: the generated regex must match a file known to carry the
# license header.
assert re.search(RE_LICENSE["Makefile"], load("Makefile"))


def log(cond, why, filename):
    """Print `filename` if `cond` is truthy, with `why` in "details" mode."""
    if not cond:
        return
    if args.output == "details":
        print(f"{why}: {filename}")
    else:
        print(filename)


def write_copyright(license_text, file_text, filename):
    """Rewrite `filename` with `license_text` inserted ahead of `file_text`.

    A leading shebang line, if any, is kept as the very first line of the
    file and the license is inserted right after it.
    """
    shebang = ""
    first_line, _, remainder = file_text.partition("\n")
    if first_line.startswith("#!"):
        shebang = first_line + "\n"
        file_text = remainder
    save(filename, shebang + license_text + "\n" + file_text)


def replace_copyright(license_text, file_text, filename):
    """Replace a C-style license header in `file_text` with `license_text`.

    Returns:
        True if a C-style header was found and `filename` was rewritten,
        False if no such header exists (the file is left untouched).
    """
    # Search the text handed in by the caller, not a module-level global.
    m = re.search(RE_C_STYLE_COMMENT_LICENSE, file_text)
    if not m:
        return False
    save(filename, license_text + file_text[m.end() :])
    return True


# scan files, validate the text
ok = True
filename_list = []
try:
    filename_list = (
        subprocess.check_output(FILE_LIST_COMMAND, shell=True)
        .decode()
        .splitlines()
    )
except subprocess.CalledProcessError:
    # The pipeline fails e.g. when grep matches nothing; there is nothing to
    # check in that case.
    sys.exit(0)

for filename in filename_list:
    enforce_cpp_style_comment = False
    if filename in _EXEMPT:
        continue
    # Skip check for upb generated code.
    if filename.endswith(_UPB_GENERATED_SUFFIXES):
        continue
    ext = os.path.splitext(filename)[1]
    base = os.path.basename(filename)
    if filename.startswith(_ENFORCE_CPP_STYLE_COMMENT_PATH_PREFIX) and ext in (
        ".cc",
        ".h",
    ):
        enforce_cpp_style_comment = True
        re_license = RE_CPP_STYLE_COMMENT_LICENSE
        license_text = LICENSE_TEXT[ext]
    elif ext in RE_LICENSE:
        re_license = RE_LICENSE[ext]
        license_text = LICENSE_TEXT[ext]
    elif base in RE_LICENSE:
        re_license = RE_LICENSE[base]
        license_text = LICENSE_TEXT[base]
    else:
        log(args.skips, "skip", filename)
        continue
    try:
        text = load(filename)
    except (OSError, UnicodeError):
        # Best effort: silently skip entries that cannot be read as text
        # (missing files, directories, undecodable content).
        continue
    if re.search(re_license, text):
        continue
    if enforce_cpp_style_comment:
        log(
            1,
            "copyright missing or does not use cpp-style copyright header",
            filename,
        )
        if args.fix:
            # Attempt fix: search for c-style copyright header and replace it
            # with cpp-style copyright header. If that doesn't work
            # (e.g. missing copyright header), write cpp-style copyright header.
            if not replace_copyright(license_text, text, filename):
                write_copyright(license_text, text, filename)
        ok = False
    elif "DO NOT EDIT" not in text:
        # Files marked "DO NOT EDIT" are not required to carry the header.
        if args.fix:
            write_copyright(license_text, text, filename)
            log(1, "copyright missing (fixed)", filename)
        else:
            log(1, "copyright missing", filename)
        ok = False

if not ok and not args.fix:
    print(
        "You may use following command to automatically fix copyright headers:"
    )
    print(" tools/distrib/check_copyright.py --fix")

sys.exit(0 if ok else 1)