upb/bazel/amalgamate.py - third_party/github/protocolbuffers/protobuf - Git at Google

 #!/usr/bin/python
 #
 # Protocol Buffers - Google's data interchange format
 # Copyright 2023 Google LLC.  All rights reserved.
 # https://developers.google.com/protocol-buffers/
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google LLC nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 import sys
 import re
 import os

 # Matches a quoted include directive that begins in the first column and
 # captures the text between the double quotes.
 INCLUDE_RE = re.compile('^#include "([^"]*)"')


 def parse_include(line):
   """Returns the quoted path of an `#include "..."` line, or None.

   The directive has to start at the very beginning of `line`; angle-bracket
   includes and every other kind of line yield None.
   """
   found = INCLUDE_RE.match(line)
   if found is None:
     return None
   return found.group(1)

 class Amalgamator:
   """Concatenates upb C sources and headers into one .c and one .h file.

   Source lines are copied to the outputs unchanged, except that quoted
   `#include` lines whose path starts with "upb" or "google" are either
   dropped or replaced by the contents of the matching header. Inlined
   headers are always written to the header output, at most once per include
   path.

   The output files are opened by the constructor. Call close(), or use the
   instance as a context manager, to release them.
   """

   # First line of the license comment that may open an input file.
   _LICENSE_FIRST_LINE = "// Protocol Buffers - Google's data interchange format"
   # The license comment ends at the first line starting with one of these.
   _LICENSE_LAST_LINES = (
       "// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE",
       "// https://developers.google.com/open-source/licenses/bsd",
   )

   def __init__(self, h_out, c_out):
     """Opens both output files for writing.

     Args:
       h_out: Path of the amalgamated header to create.
       c_out: Path of the amalgamated C source to create.
     """
     self.include_paths = ["."]
     self.included = set()
     self.output_h = open(h_out, "w")
     try:
       self.output_c = open(c_out, "w")
     except Exception:
       # Don't leak the header handle when the second open fails.
       self.output_h.close()
       raise
     # Only the file name is kept: it is what the C output #includes.
     self.h_out = h_out.split("/")[-1]

   def __enter__(self):
     return self

   def __exit__(self, exc_type, exc_value, traceback):
     self.close()
     return False

   def close(self):
     """Closes both output files; calling it again is harmless."""
     try:
       self.output_h.close()
     finally:
       self.output_c.close()

   def amalgamate(self, h_files, c_files):
     """Writes the amalgamated header and source to the output files.

     Args:
       h_files: Paths of the header files that includes may resolve to.
       c_files: Paths of the C sources to concatenate, in output order.

     Raises:
       RuntimeError: If upb/port/def.inc or upb/port/undef.inc is not among
         h_files, or if a upb/google include cannot be resolved.
     """
     self.h_files = set(h_files)
     self.output_c.write("/* Amalgamated source file */\n")
     self.output_c.write('#include "%s"\n' % (self.h_out))
     if self.h_out == "ruby-upb.h":
       self.output_h.write("// Ruby is still using proto3 enum semantics for proto2\n")
       self.output_h.write("#define UPB_DISABLE_CLOSED_ENUM_CHECKING\n")

     self.output_h.write("/* Amalgamated source file */\n")

     # Fail with a readable error instead of passing None to open().
     port_def = self._require_include_file("upb/port/def.inc")
     port_undef = self._require_include_file("upb/port/undef.inc")

     # Both outputs are bracketed by the port definitions: def.inc first,
     # undef.inc last.
     self._process_file(port_def, self.output_h)
     self._process_file(port_def, self.output_c)

     for file in c_files:
       self._process_file(file, self.output_c)

     self._process_file(port_undef, self.output_h)
     self._process_file(port_undef, self.output_c)

     # Make the result visible on disk even if close() is never called.
     self.output_h.flush()
     self.output_c.flush()

   def _process_file(self, infile_name, outfile):
     """Copies one input file to `outfile`, handling its include lines.

     A leading license comment is stripped first. Lines consumed by
     _process_include() are not copied. An empty input file contributes
     nothing.
     """
     with open(infile_name) as infile:
       lines = infile.readlines()

     for line in self._strip_license_header(lines):
       if not self._process_include(line):
         outfile.write(line)

   @classmethod
   def _strip_license_header(cls, lines):
     """Returns `lines` without a leading license comment.

     The comment is recognised by its first line and runs through the first
     line that starts with one of the known closing lines. If `lines` is
     empty, does not start with the license, or the license is never closed,
     `lines` is returned unchanged.
     """
     if not lines or not lines[0].startswith(cls._LICENSE_FIRST_LINE):
       return lines
     for index, line in enumerate(lines):
       if line.startswith(cls._LICENSE_LAST_LINES):
         return lines[index + 1:]
     # Unterminated header: keep everything rather than dropping the file.
     return lines

   def _find_include_file(self, name):
     """Returns the not-yet-inlined header whose path ends with `name`.

     When several paths match, the shortest one wins (ties broken
     alphabetically) so the choice does not depend on set iteration order.
     Returns None when nothing matches.
     """
     candidates = [path for path in self.h_files if path.endswith(name)]
     if not candidates:
       return None
     return min(candidates, key=lambda path: (len(path), path))

   def _require_include_file(self, name):
     """Like _find_include_file(), but raises RuntimeError on no match."""
     h_file = self._find_include_file(name)
     if not h_file:
       raise RuntimeError("Couldn't find include: " + name + ", h_files=" + repr(self.h_files))
     return h_file

   def _process_include(self, line):
     """Handles `line` if it is an include this tool takes care of.

     Returns:
       True if the line was consumed (dropped, or replaced by the inlined
       header) and must not be copied; False if the caller should copy it.

     Raises:
       RuntimeError: If a upb/google include matches no known header.
     """
     include = parse_include(line)
     if not include:
       return False
     if not include.startswith(("upb", "google")):
       # Not ours (e.g. a system or third-party header): leave it in place.
       return False
     if include.endswith(("port/def.inc", "port/undef.inc")):
       # Skip, we handle this separately
       return True
     if include.endswith("hpp"):
       # Skip, we don't support the amalgamation from C++.
       return True
     if re.search(r"stage\d/", include):
       # Includes under a stageN/ directory are dropped, not inlined.
       return True
     if include in self.included:
       # Already inlined earlier; emitting it again would duplicate it.
       return True

     # Include this upb header inline.
     h_file = self._require_include_file(include)
     self.h_files.remove(h_file)
     self.included.add(include)
     self._process_file(h_file, self.output_h)
     return True

 # ---- main ----

 # Command line: <c_out> <h_out> [input files...].  Inputs ending in .h or
 # .inc are treated as headers; everything else is treated as a C source.
 if len(sys.argv) < 3:
   # Report the expected arguments instead of failing with an IndexError.
   sys.exit("usage: %s C_OUT H_OUT [INPUT_FILE ...]" % sys.argv[0])

 c_out = sys.argv[1]
 h_out = sys.argv[2]
 amalgamator = Amalgamator(h_out, c_out)
 c_files = []
 h_files = []

 for arg in sys.argv[3:]:
   arg = arg.strip()
   if arg.endswith((".h", ".inc")):
     h_files.append(arg)
   else:
     c_files.append(arg)

 try:
   amalgamator.amalgamate(h_files, c_files)
 finally:
   # Close explicitly so the outputs are complete on disk before exit,
   # including when amalgamation fails part-way.
   amalgamator.output_h.close()
   amalgamator.output_c.close()
	#!/usr/bin/python
	#
	# Protocol Buffers - Google's data interchange format
	# Copyright 2023 Google LLC. All rights reserved.
	# https://developers.google.com/protocol-buffers/
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google LLC nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	import sys
	import re
	import os

	# Matches a quoted include directive that begins in the first column and
	# captures the text between the double quotes.
	INCLUDE_RE = re.compile('^#include "([^"]*)"')


	def parse_include(line):
	  """Returns the quoted path of an `#include "..."` line, or None.

	  The directive has to start at the very beginning of `line`; angle-bracket
	  includes and every other kind of line yield None.
	  """
	  found = INCLUDE_RE.match(line)
	  if found is None:
	    return None
	  return found.group(1)

	class Amalgamator:
	  """Concatenates upb C sources and headers into one .c and one .h file.

	  Source lines are copied to the outputs unchanged, except that quoted
	  `#include` lines whose path starts with "upb" or "google" are either
	  dropped or replaced by the contents of the matching header. Inlined
	  headers are always written to the header output, at most once per include
	  path.

	  The output files are opened by the constructor. Call close(), or use the
	  instance as a context manager, to release them.
	  """

	  # First line of the license comment that may open an input file.
	  _LICENSE_FIRST_LINE = "// Protocol Buffers - Google's data interchange format"
	  # The license comment ends at the first line starting with one of these.
	  _LICENSE_LAST_LINES = (
	      "// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE",
	      "// https://developers.google.com/open-source/licenses/bsd",
	  )

	  def __init__(self, h_out, c_out):
	    """Opens both output files for writing.

	    Args:
	      h_out: Path of the amalgamated header to create.
	      c_out: Path of the amalgamated C source to create.
	    """
	    self.include_paths = ["."]
	    self.included = set()
	    self.output_h = open(h_out, "w")
	    try:
	      self.output_c = open(c_out, "w")
	    except Exception:
	      # Don't leak the header handle when the second open fails.
	      self.output_h.close()
	      raise
	    # Only the file name is kept: it is what the C output #includes.
	    self.h_out = h_out.split("/")[-1]

	  def __enter__(self):
	    return self

	  def __exit__(self, exc_type, exc_value, traceback):
	    self.close()
	    return False

	  def close(self):
	    """Closes both output files; calling it again is harmless."""
	    try:
	      self.output_h.close()
	    finally:
	      self.output_c.close()

	  def amalgamate(self, h_files, c_files):
	    """Writes the amalgamated header and source to the output files.

	    Args:
	      h_files: Paths of the header files that includes may resolve to.
	      c_files: Paths of the C sources to concatenate, in output order.

	    Raises:
	      RuntimeError: If upb/port/def.inc or upb/port/undef.inc is not among
	        h_files, or if a upb/google include cannot be resolved.
	    """
	    self.h_files = set(h_files)
	    self.output_c.write("/* Amalgamated source file */\n")
	    self.output_c.write('#include "%s"\n' % (self.h_out))
	    if self.h_out == "ruby-upb.h":
	      self.output_h.write("// Ruby is still using proto3 enum semantics for proto2\n")
	      self.output_h.write("#define UPB_DISABLE_CLOSED_ENUM_CHECKING\n")

	    self.output_h.write("/* Amalgamated source file */\n")

	    # Fail with a readable error instead of passing None to open().
	    port_def = self._require_include_file("upb/port/def.inc")
	    port_undef = self._require_include_file("upb/port/undef.inc")

	    # Both outputs are bracketed by the port definitions: def.inc first,
	    # undef.inc last.
	    self._process_file(port_def, self.output_h)
	    self._process_file(port_def, self.output_c)

	    for file in c_files:
	      self._process_file(file, self.output_c)

	    self._process_file(port_undef, self.output_h)
	    self._process_file(port_undef, self.output_c)

	    # Make the result visible on disk even if close() is never called.
	    self.output_h.flush()
	    self.output_c.flush()

	  def _process_file(self, infile_name, outfile):
	    """Copies one input file to `outfile`, handling its include lines.

	    A leading license comment is stripped first. Lines consumed by
	    _process_include() are not copied. An empty input file contributes
	    nothing.
	    """
	    with open(infile_name) as infile:
	      lines = infile.readlines()

	    for line in self._strip_license_header(lines):
	      if not self._process_include(line):
	        outfile.write(line)

	  @classmethod
	  def _strip_license_header(cls, lines):
	    """Returns `lines` without a leading license comment.

	    The comment is recognised by its first line and runs through the first
	    line that starts with one of the known closing lines. If `lines` is
	    empty, does not start with the license, or the license is never closed,
	    `lines` is returned unchanged.
	    """
	    if not lines or not lines[0].startswith(cls._LICENSE_FIRST_LINE):
	      return lines
	    for index, line in enumerate(lines):
	      if line.startswith(cls._LICENSE_LAST_LINES):
	        return lines[index + 1:]
	    # Unterminated header: keep everything rather than dropping the file.
	    return lines

	  def _find_include_file(self, name):
	    """Returns the not-yet-inlined header whose path ends with `name`.

	    When several paths match, the shortest one wins (ties broken
	    alphabetically) so the choice does not depend on set iteration order.
	    Returns None when nothing matches.
	    """
	    candidates = [path for path in self.h_files if path.endswith(name)]
	    if not candidates:
	      return None
	    return min(candidates, key=lambda path: (len(path), path))

	  def _require_include_file(self, name):
	    """Like _find_include_file(), but raises RuntimeError on no match."""
	    h_file = self._find_include_file(name)
	    if not h_file:
	      raise RuntimeError("Couldn't find include: " + name + ", h_files=" + repr(self.h_files))
	    return h_file

	  def _process_include(self, line):
	    """Handles `line` if it is an include this tool takes care of.

	    Returns:
	      True if the line was consumed (dropped, or replaced by the inlined
	      header) and must not be copied; False if the caller should copy it.

	    Raises:
	      RuntimeError: If a upb/google include matches no known header.
	    """
	    include = parse_include(line)
	    if not include:
	      return False
	    if not include.startswith(("upb", "google")):
	      # Not ours (e.g. a system or third-party header): leave it in place.
	      return False
	    if include.endswith(("port/def.inc", "port/undef.inc")):
	      # Skip, we handle this separately
	      return True
	    if include.endswith("hpp"):
	      # Skip, we don't support the amalgamation from C++.
	      return True
	    if re.search(r"stage\d/", include):
	      # Includes under a stageN/ directory are dropped, not inlined.
	      return True
	    if include in self.included:
	      # Already inlined earlier; emitting it again would duplicate it.
	      return True

	    # Include this upb header inline.
	    h_file = self._require_include_file(include)
	    self.h_files.remove(h_file)
	    self.included.add(include)
	    self._process_file(h_file, self.output_h)
	    return True

	# ---- main ----

	# Command line: <c_out> <h_out> [input files...].  Inputs ending in .h or
	# .inc are treated as headers; everything else is treated as a C source.
	if len(sys.argv) < 3:
	  # Report the expected arguments instead of failing with an IndexError.
	  sys.exit("usage: %s C_OUT H_OUT [INPUT_FILE ...]" % sys.argv[0])

	c_out = sys.argv[1]
	h_out = sys.argv[2]
	amalgamator = Amalgamator(h_out, c_out)
	c_files = []
	h_files = []

	for arg in sys.argv[3:]:
	  arg = arg.strip()
	  if arg.endswith((".h", ".inc")):
	    h_files.append(arg)
	  else:
	    c_files.append(arg)

	try:
	  amalgamator.amalgamate(h_files, c_files)
	finally:
	  # Close explicitly so the outputs are complete on disk before exit,
	  # including when amalgamation fails part-way.
	  amalgamator.output_h.close()
	  amalgamator.output_c.close()