protobuf/upb/bazel/amalgamate.py

137 lines
4.7 KiB
Python
Executable File

#!/usr/bin/python
#
# Protocol Buffers - Google's data interchange format
# Copyright 2023 Google LLC. All rights reserved.
# https://developers.google.com/protocol-buffers/
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are
# met:
#
# * Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above
# copyright notice, this list of conditions and the following disclaimer
# in the documentation and/or other materials provided with the
# distribution.
# * Neither the name of Google LLC nor the names of its
# contributors may be used to endorse or promote products derived from
# this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
import sys
import re
import os
# Matches a quoted include directive that begins in the first column of a line;
# the single capture group holds the path between the double quotes.
INCLUDE_RE = re.compile('^#include "([^"]*)"')


def parse_include(line):
    """Return the quoted path of an ``#include "..."`` line.

    Args:
        line: One line of C source text.

    Returns:
        The text between the double quotes when ``line`` starts with
        ``#include "``; otherwise ``None``. Angle-bracket includes and
        directives preceded by whitespace are not matched.
    """
    found = INCLUDE_RE.match(line)
    if found is None:
        return None
    return found.group(1)
class Amalgamator:
    """Concatenates C sources and their headers into one .c/.h output pair.

    Quoted includes whose path starts with ``upb`` or ``google`` are replaced
    by the contents of the matching header (written to the header output) the
    first time they are seen and dropped afterwards. All other lines are
    copied through unchanged.

    The instance owns the two output files. Use it as a context manager or
    call ``close()`` when finished so that they are closed deterministically.
    """

    # First line of the license header that is stripped from every input file.
    _COPYRIGHT_START = "// Protocol Buffers - Google's data interchange format"
    # The header ends at the first line starting with either of these.
    _COPYRIGHT_END = (
        "// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE",
        "// https://developers.google.com/open-source/licenses/bsd",
    )

    def __init__(self, h_out, c_out):
        """Open both output files for writing.

        Args:
            h_out: Path of the amalgamated header to create.
            c_out: Path of the amalgamated C source to create.
        """
        self.include_paths = ["."]
        self.included = set()
        # Defined up front so the lookup helpers work before amalgamate().
        self.h_files = set()
        self.output_h = open(h_out, "w")
        try:
            self.output_c = open(c_out, "w")
        except Exception:
            # Do not leak the first handle when the second open fails.
            self.output_h.close()
            raise
        # Only the file name is used in the generated #include line.
        self.h_out = h_out.split("/")[-1]

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        self.close()

    def close(self):
        """Close both output files. Safe to call more than once."""
        self.output_h.close()
        self.output_c.close()

    def amalgamate(self, h_files, c_files):
        """Write the amalgamated header and source.

        Args:
            h_files: Paths of all headers (``.h`` / ``.inc``) that may be
                inlined.
            c_files: Paths of the C sources to concatenate, in output order.

        Raises:
            RuntimeError: If ``upb/port/def.inc`` or ``upb/port/undef.inc``
                is not among ``h_files``, or if a source includes a
                ``upb``/``google`` header that cannot be found.
        """
        self.h_files = set(h_files)
        # Resolve the port files first so a missing one fails with a clear
        # message instead of a TypeError from open(None).
        port_def = self._require_include_file("upb/port/def.inc")
        port_undef = self._require_include_file("upb/port/undef.inc")

        self.output_c.write("/* Amalgamated source file */\n")
        self.output_c.write('#include "%s"\n' % (self.h_out))
        if self.h_out == "ruby-upb.h":
            self.output_h.write("// Ruby is still using proto3 enum semantics for proto2\n")
            self.output_h.write("#define UPB_DISABLE_CLOSED_ENUM_CHECKING\n")

        self.output_h.write("/* Amalgamated source file */\n")

        # def.inc opens both outputs and undef.inc closes them; includes of
        # these two files inside the inputs are dropped by _process_include.
        self._process_file(port_def, self.output_h)
        self._process_file(port_def, self.output_c)

        for file in c_files:
            self._process_file(file, self.output_c)

        self._process_file(port_undef, self.output_h)
        self._process_file(port_undef, self.output_c)

        # Make the result visible on disk even if the caller never closes us.
        self.output_h.flush()
        self.output_c.flush()

    @classmethod
    def _strip_copyright(cls, lines):
        """Return ``lines`` without a leading license header.

        A header is recognised only when the first line starts with the
        copyright banner; it extends through the first terminator line. When
        there is no banner, or no terminator is found, ``lines`` is returned
        unchanged.
        """
        if not lines or not lines[0].startswith(cls._COPYRIGHT_START):
            return lines
        for index, line in enumerate(lines):
            if line.startswith(cls._COPYRIGHT_END):
                return lines[index + 1:]
        return lines

    def _process_file(self, infile_name, outfile):
        """Copy one input file to ``outfile``, inlining recognised includes.

        Args:
            infile_name: Path of the file to read.
            outfile: Writable text file that receives the non-include lines.
        """
        with open(infile_name) as infile:
            lines = infile.readlines()

        for line in self._strip_copyright(lines):
            if not self._process_include(line):
                outfile.write(line)

    def _find_include_file(self, name):
        """Return the known header whose path ends with ``name``, or ``None``.

        Matches on a path-component boundary are preferred over plain suffix
        matches, and ties are broken by shortest-then-lexicographic order so
        the result does not depend on set iteration order.
        """
        boundary = "/" + name
        exact = []
        loose = []
        for h_file in self.h_files:
            if h_file == name or h_file.endswith(boundary):
                exact.append(h_file)
            elif h_file.endswith(name):
                loose.append(h_file)
        candidates = exact or loose
        if not candidates:
            return None
        return min(candidates, key=lambda path: (len(path), path))

    def _require_include_file(self, name):
        """Like ``_find_include_file`` but raise RuntimeError when missing."""
        h_file = self._find_include_file(name)
        if h_file is None:
            raise RuntimeError(
                "Couldn't find include: " + name
                + ", h_files=" + repr(sorted(self.h_files))
            )
        return h_file

    def _process_include(self, line):
        """Handle ``line`` if it is an include that must not be copied as-is.

        Returns:
            ``True`` when the line was consumed (inlined or deliberately
            dropped) and must not be written to the output; ``False`` when
            the caller should copy the line through.

        Raises:
            RuntimeError: If the include is a ``upb``/``google`` header that
                is not present in the known header set.
        """
        include = parse_include(line)
        if not include:
            return False
        if not include.startswith(("upb", "google")):
            return False
        if include.endswith(("port/def.inc", "port/undef.inc")):
            # Skip, we handle this separately
            return True
        if include.endswith("hpp"):
            # Skip, we don't support the amalgamation from C++.
            return True
        if include in self.included:
            return True

        # Include this upb header inline.
        h_file = self._require_include_file(include)
        self.h_files.remove(h_file)
        self.included.add(include)
        self._process_file(h_file, self.output_h)
        return True
# ---- main ----
# Usage: amalgamate.py C_OUT H_OUT [INPUT ...]
# Inputs ending in ".h" or ".inc" are treated as headers available for
# inlining; every other input is treated as a C source to concatenate.
if len(sys.argv) < 3:
    # Fail with a usage message rather than a bare IndexError.
    sys.exit("usage: %s C_OUT H_OUT [INPUT ...]" % sys.argv[0])

c_out = sys.argv[1]
h_out = sys.argv[2]
c_files = []
h_files = []

for arg in sys.argv[3:]:
    arg = arg.strip()
    if arg.endswith((".h", ".inc")):
        h_files.append(arg)
    else:
        c_files.append(arg)

amalgamator = Amalgamator(h_out, c_out)
try:
    amalgamator.amalgamate(h_files, c_files)
finally:
    # Close the outputs explicitly so buffered data is written out and the
    # handles are released even when amalgamation fails part-way.
    amalgamator.output_h.close()
    amalgamator.output_c.close()