python/private/local_runtime_repo.bzl - third_party/github/bazelbuild/rules_python - Git at Google

 # Copyright 2024 The Bazel Authors. All rights reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #    http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.

 """Create a repository for a locally installed Python runtime."""

 load(":enum.bzl", "enum")
 load(":repo_utils.bzl", "REPO_DEBUG_ENV_VAR", "repo_utils")

 # buildifier: disable=name-conventions
 _OnFailure = enum(
     SKIP = "skip",
     WARN = "warn",
     FAIL = "fail",
 )

 _TOOLCHAIN_IMPL_TEMPLATE = """\
 # Generated by python/private/local_runtime_repo.bzl

 load("@rules_python//python/private:local_runtime_repo_setup.bzl", "define_local_runtime_toolchain_impl")

 define_local_runtime_toolchain_impl(
     name = "local_runtime",
     major = "{major}",
     minor = "{minor}",
     micro = "{micro}",
     interpreter_path = "{interpreter_path}",
     interface_library = {interface_library},
     libraries = {libraries},
     implementation_name = "{implementation_name}",
     os = "{os}",
 )
 """

 def _norm_path(path):
     """Returns a path using '/' separators and no trailing slash."""
     path = path.replace("\\", "/")
     if path[-1] == "/":
         path = path[:-1]
     return path

 def _symlink_first_library(rctx, logger, libraries):
     """Symlinks the shared libraries into the lib/ directory.

     Args:
         rctx: A repository_ctx object
         logger: A repo_utils.logger object
         libraries: A list of static library paths to potentially symlink.
     Returns:
         A single library path linked by the action.
     """
     linked = None
     for target in libraries:
         origin = rctx.path(target)
         if not origin.exists:
             # The reported names don't always exist; it depends on the particulars
             # of the runtime installation.
             continue
         if target.endswith("/Python"):
             linked = "lib/{}.dylib".format(origin.basename)
         else:
             linked = "lib/{}".format(origin.basename)
         logger.debug("Symlinking {} to {}".format(origin, linked))
         repo_utils.watch(rctx, origin)
         rctx.symlink(origin, linked)
         break

     return linked

 def _local_runtime_repo_impl(rctx):
     logger = repo_utils.logger(rctx)
     on_failure = rctx.attr.on_failure

     def _emit_log(msg):
         if on_failure == "fail":
             logger.fail(msg)
         elif on_failure == "warn":
             logger.warn(msg)
         else:
             logger.debug(msg)

     result = _resolve_interpreter_path(rctx)
     if not result.resolved_path:
         _emit_log(lambda: "interpreter not found: {}".format(result.describe_failure()))

         # else, on_failure must be skip
         rctx.file("BUILD.bazel", _expand_incompatible_template())
         return
     else:
         interpreter_path = result.resolved_path

     logger.info(lambda: "resolved interpreter {} to {}".format(rctx.attr.interpreter_path, interpreter_path))

     exec_result = repo_utils.execute_unchecked(
         rctx,
         op = "local_runtime_repo.GetPythonInfo({})".format(rctx.name),
         arguments = [
             interpreter_path,
             rctx.path(rctx.attr._get_local_runtime_info),
         ],
         quiet = True,
         logger = logger,
     )
     if exec_result.return_code != 0:
         _emit_log(lambda: "GetPythonInfo failed: {}".format(exec_result.describe_failure()))

         # else, on_failure must be skip
         rctx.file("BUILD.bazel", _expand_incompatible_template())
         return

     info = json.decode(exec_result.stdout)
     logger.info(lambda: _format_get_info_result(info))

     # We use base_executable because we want the path within a Python
     # installation directory ("PYTHONHOME"). The problems with sys.executable
     # are:
     # * If we're in an activated venv, then we don't want the venv's
     #   `bin/python3` path to be used -- it isn't an actual Python installation.
     # * If sys.executable is a wrapper (e.g. pyenv), then (1) it may not be
     #   located within an actual Python installation directory, and (2) it
     #   can interfer with Python recognizing when it's within a venv.
     #
     # In some cases, it may be a symlink (usually e.g. `python3->python3.12`),
     # but we don't realpath() it to respect what it has decided is the
     # appropriate path.
     interpreter_path = info["base_executable"]

     # NOTE: Keep in sync with recursive glob in define_local_runtime_toolchain_impl
     include_path = rctx.path(info["include"])

     # The reported include path may not exist, and watching a non-existant
     # path is an error. Silently skip, since includes are only necessary
     # if C extensions are built.
     if include_path.exists and include_path.is_dir:
         repo_utils.watch_tree(rctx, include_path)
     else:
         pass

     # The cc_library.includes values have to be non-absolute paths, otherwise
     # the toolchain will give an error. Work around this error by making them
     # appear as part of this repo.
     rctx.symlink(include_path, "include")

     rctx.report_progress("Symlinking external Python shared libraries")
     interface_library = _symlink_first_library(rctx, logger, info["interface_libraries"])
     shared_library = _symlink_first_library(rctx, logger, info["dynamic_libraries"])
     static_library = _symlink_first_library(rctx, logger, info["static_libraries"])

     libraries = []
     if shared_library:
         libraries.append(shared_library)
     elif static_library:
         libraries.append(static_library)
     else:
         logger.warn("No external python libraries found.")

     build_bazel = _TOOLCHAIN_IMPL_TEMPLATE.format(
         major = info["major"],
         minor = info["minor"],
         micro = info["micro"],
         interpreter_path = _norm_path(interpreter_path),
         interface_library = repr(interface_library),
         libraries = repr(libraries),
         implementation_name = info["implementation_name"],
         os = "@platforms//os:{}".format(repo_utils.get_platforms_os_name(rctx)),
     )
     logger.debug(lambda: "BUILD.bazel\n{}".format(build_bazel))

     rctx.file("WORKSPACE", "")
     rctx.file("MODULE.bazel", "")
     rctx.file("REPO.bazel", "")
     rctx.file("BUILD.bazel", build_bazel)

 local_runtime_repo = repository_rule(
     implementation = _local_runtime_repo_impl,
     doc = """
 Use a locally installed Python runtime as a toolchain implementation.

 Note this uses the runtime as a *platform runtime*. A platform runtime means
 means targets don't include the runtime itself as part of their runfiles or
 inputs. Instead, users must assure that where the targets run have the runtime
 pre-installed or otherwise available.

 This results in lighter weight binaries (in particular, Bazel doesn't have to
 create thousands of files for every `py_test`), at the risk of having to rely on
 a system having the necessary Python installed.
 """,
     attrs = {
         "interpreter_path": attr.string(
             doc = """
 An absolute path or program name on the `PATH` env var.

 Values with slashes are assumed to be the path to a program. Otherwise, it is
 treated as something to search for on `PATH`

 Note that, when a plain program name is used, the path to the interpreter is
 resolved at repository evalution time, not runtime of any resulting binaries.
 """,
             default = "python3",
         ),
         "on_failure": attr.string(
             default = _OnFailure.SKIP,
             values = sorted(_OnFailure.__members__.values()),
             doc = """
 How to handle errors when trying to automatically determine settings.

 * `skip` will silently skip creating a runtime. Instead, a non-functional
   runtime will be generated and marked as incompatible so it cannot be used.
   This is best if a local runtime is known not to work or be available
   in certain cases and that's OK. e.g., one use windows paths when there
   are people running on linux.
 * `warn` will print a warning message. This is useful when you expect
   a runtime to be available, but are OK with it missing and falling back
   to some other runtime.
 * `fail` will result in a failure. This is only recommended if you must
   ensure the runtime is available.
 """,
         ),
         "_get_local_runtime_info": attr.label(
             allow_single_file = True,
             default = "//python/private:get_local_runtime_info.py",
         ),
         "_rule_name": attr.string(default = "local_runtime_repo"),
     },
     environ = ["PATH", REPO_DEBUG_ENV_VAR],
 )

 def _expand_incompatible_template():
     return _TOOLCHAIN_IMPL_TEMPLATE.format(
         interpreter_path = "/incompatible",
         implementation_name = "incompatible",
         interface_library = "None",
         libraries = "[]",
         major = "0",
         minor = "0",
         micro = "0",
         os = "@platforms//:incompatible",
     )

 def _resolve_interpreter_path(rctx):
     """Find the absolute path for an interpreter.

     Args:
         rctx: A repository_ctx object

     Returns:
         `struct` with the following fields:
         * `resolved_path`: `path` object of a path that exists
         * `describe_failure`: `Callable | None`. If a path that doesn't exist,
           returns a description of why it couldn't be resolved
         A path object or None. The path may not exist.
     """
     if "/" not in rctx.attr.interpreter_path and "\\" not in rctx.attr.interpreter_path:
         # Provide a bit nicer integration with pyenv: recalculate the runtime if the
         # user changes the python version using e.g. `pyenv shell`
         repo_utils.getenv(rctx, "PYENV_VERSION")
         result = repo_utils.which_unchecked(rctx, rctx.attr.interpreter_path)
         resolved_path = result.binary
         describe_failure = result.describe_failure
     else:
         repo_utils.watch(rctx, rctx.attr.interpreter_path)
         resolved_path = rctx.path(rctx.attr.interpreter_path)
         if not resolved_path.exists:
             describe_failure = lambda: "Path not found: {}".format(repr(rctx.attr.interpreter_path))
         else:
             describe_failure = None

     return struct(
         resolved_path = resolved_path,
         describe_failure = describe_failure,
     )

 def _format_get_info_result(info):
     lines = ["GetPythonInfo result:"]
     for key, value in sorted(info.items()):
         lines.append("  {}: {}".format(key, value if value != "" else "<empty string>"))
     return "\n".join(lines)
	# Copyright 2024 The Bazel Authors. All rights reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	"""Create a repository for a locally installed Python runtime."""

	load(":enum.bzl", "enum")
	load(":repo_utils.bzl", "REPO_DEBUG_ENV_VAR", "repo_utils")

	# buildifier: disable=name-conventions
	_OnFailure = enum(
	SKIP = "skip",
	WARN = "warn",
	FAIL = "fail",
	)

	_TOOLCHAIN_IMPL_TEMPLATE = """\
	# Generated by python/private/local_runtime_repo.bzl

	load("@rules_python//python/private:local_runtime_repo_setup.bzl", "define_local_runtime_toolchain_impl")

	define_local_runtime_toolchain_impl(
	name = "local_runtime",
	major = "{major}",
	minor = "{minor}",
	micro = "{micro}",
	interpreter_path = "{interpreter_path}",
	interface_library = {interface_library},
	libraries = {libraries},
	implementation_name = "{implementation_name}",
	os = "{os}",
	)
	"""

	def _norm_path(path):
	"""Returns a path using '/' separators and no trailing slash."""
	path = path.replace("\\", "/")
	if path[-1] == "/":
	path = path[:-1]
	return path

	def _symlink_first_library(rctx, logger, libraries):
	"""Symlinks the shared libraries into the lib/ directory.

	Args:
	rctx: A repository_ctx object
	logger: A repo_utils.logger object
	libraries: A list of static library paths to potentially symlink.
	Returns:
	A single library path linked by the action.
	"""
	linked = None
	for target in libraries:
	origin = rctx.path(target)
	if not origin.exists:
	# The reported names don't always exist; it depends on the particulars
	# of the runtime installation.
	continue
	if target.endswith("/Python"):
	linked = "lib/{}.dylib".format(origin.basename)
	else:
	linked = "lib/{}".format(origin.basename)
	logger.debug("Symlinking {} to {}".format(origin, linked))
	repo_utils.watch(rctx, origin)
	rctx.symlink(origin, linked)
	break

	return linked

	def _local_runtime_repo_impl(rctx):
	logger = repo_utils.logger(rctx)
	on_failure = rctx.attr.on_failure

	def _emit_log(msg):
	if on_failure == "fail":
	logger.fail(msg)
	elif on_failure == "warn":
	logger.warn(msg)
	else:
	logger.debug(msg)

	result = _resolve_interpreter_path(rctx)
	if not result.resolved_path:
	_emit_log(lambda: "interpreter not found: {}".format(result.describe_failure()))

	# else, on_failure must be skip
	rctx.file("BUILD.bazel", _expand_incompatible_template())
	return
	else:
	interpreter_path = result.resolved_path

	logger.info(lambda: "resolved interpreter {} to {}".format(rctx.attr.interpreter_path, interpreter_path))

	exec_result = repo_utils.execute_unchecked(
	rctx,
	op = "local_runtime_repo.GetPythonInfo({})".format(rctx.name),
	arguments = [
	interpreter_path,
	rctx.path(rctx.attr._get_local_runtime_info),
	],
	quiet = True,
	logger = logger,
	)
	if exec_result.return_code != 0:
	_emit_log(lambda: "GetPythonInfo failed: {}".format(exec_result.describe_failure()))

	# else, on_failure must be skip
	rctx.file("BUILD.bazel", _expand_incompatible_template())
	return

	info = json.decode(exec_result.stdout)
	logger.info(lambda: _format_get_info_result(info))

	# We use base_executable because we want the path within a Python
	# installation directory ("PYTHONHOME"). The problems with sys.executable
	# are:
	# * If we're in an activated venv, then we don't want the venv's
	# `bin/python3` path to be used -- it isn't an actual Python installation.
	# * If sys.executable is a wrapper (e.g. pyenv), then (1) it may not be
	# located within an actual Python installation directory, and (2) it
	# can interfer with Python recognizing when it's within a venv.
	#
	# In some cases, it may be a symlink (usually e.g. `python3->python3.12`),
	# but we don't realpath() it to respect what it has decided is the
	# appropriate path.
	interpreter_path = info["base_executable"]

	# NOTE: Keep in sync with recursive glob in define_local_runtime_toolchain_impl
	include_path = rctx.path(info["include"])

	# The reported include path may not exist, and watching a non-existant
	# path is an error. Silently skip, since includes are only necessary
	# if C extensions are built.
	if include_path.exists and include_path.is_dir:
	repo_utils.watch_tree(rctx, include_path)
	else:
	pass

	# The cc_library.includes values have to be non-absolute paths, otherwise
	# the toolchain will give an error. Work around this error by making them
	# appear as part of this repo.
	rctx.symlink(include_path, "include")

	rctx.report_progress("Symlinking external Python shared libraries")
	interface_library = _symlink_first_library(rctx, logger, info["interface_libraries"])
	shared_library = _symlink_first_library(rctx, logger, info["dynamic_libraries"])
	static_library = _symlink_first_library(rctx, logger, info["static_libraries"])

	libraries = []
	if shared_library:
	libraries.append(shared_library)
	elif static_library:
	libraries.append(static_library)
	else:
	logger.warn("No external python libraries found.")

	build_bazel = _TOOLCHAIN_IMPL_TEMPLATE.format(
	major = info["major"],
	minor = info["minor"],
	micro = info["micro"],
	interpreter_path = _norm_path(interpreter_path),
	interface_library = repr(interface_library),
	libraries = repr(libraries),
	implementation_name = info["implementation_name"],
	os = "@platforms//os:{}".format(repo_utils.get_platforms_os_name(rctx)),
	)
	logger.debug(lambda: "BUILD.bazel\n{}".format(build_bazel))

	rctx.file("WORKSPACE", "")
	rctx.file("MODULE.bazel", "")
	rctx.file("REPO.bazel", "")
	rctx.file("BUILD.bazel", build_bazel)

	local_runtime_repo = repository_rule(
	implementation = _local_runtime_repo_impl,
	doc = """
	Use a locally installed Python runtime as a toolchain implementation.

	Note this uses the runtime as a platform runtime. A platform runtime means
	means targets don't include the runtime itself as part of their runfiles or
	inputs. Instead, users must assure that where the targets run have the runtime
	pre-installed or otherwise available.

	This results in lighter weight binaries (in particular, Bazel doesn't have to
	create thousands of files for every `py_test`), at the risk of having to rely on
	a system having the necessary Python installed.
	""",
	attrs = {
	"interpreter_path": attr.string(
	doc = """
	An absolute path or program name on the `PATH` env var.

	Values with slashes are assumed to be the path to a program. Otherwise, it is
	treated as something to search for on `PATH`

	Note that, when a plain program name is used, the path to the interpreter is
	resolved at repository evalution time, not runtime of any resulting binaries.
	""",
	default = "python3",
	),
	"on_failure": attr.string(
	default = _OnFailure.SKIP,
	values = sorted(_OnFailure.__members__.values()),
	doc = """
	How to handle errors when trying to automatically determine settings.

	* `skip` will silently skip creating a runtime. Instead, a non-functional
	runtime will be generated and marked as incompatible so it cannot be used.
	This is best if a local runtime is known not to work or be available
	in certain cases and that's OK. e.g., one use windows paths when there
	are people running on linux.
	* `warn` will print a warning message. This is useful when you expect
	a runtime to be available, but are OK with it missing and falling back
	to some other runtime.
	* `fail` will result in a failure. This is only recommended if you must
	ensure the runtime is available.
	""",
	),
	"_get_local_runtime_info": attr.label(
	allow_single_file = True,
	default = "//python/private:get_local_runtime_info.py",
	),
	"_rule_name": attr.string(default = "local_runtime_repo"),
	},
	environ = ["PATH", REPO_DEBUG_ENV_VAR],
	)

	def _expand_incompatible_template():
	return _TOOLCHAIN_IMPL_TEMPLATE.format(
	interpreter_path = "/incompatible",
	implementation_name = "incompatible",
	interface_library = "None",
	libraries = "[]",
	major = "0",
	minor = "0",
	micro = "0",
	os = "@platforms//:incompatible",
	)

	def _resolve_interpreter_path(rctx):
	"""Find the absolute path for an interpreter.

	Args:
	rctx: A repository_ctx object

	Returns:
	`struct` with the following fields:
	* `resolved_path`: `path` object of a path that exists
	* `describe_failure`: `Callable \| None`. If a path that doesn't exist,
	returns a description of why it couldn't be resolved
	A path object or None. The path may not exist.
	"""
	if "/" not in rctx.attr.interpreter_path and "\\" not in rctx.attr.interpreter_path:
	# Provide a bit nicer integration with pyenv: recalculate the runtime if the
	# user changes the python version using e.g. `pyenv shell`
	repo_utils.getenv(rctx, "PYENV_VERSION")
	result = repo_utils.which_unchecked(rctx, rctx.attr.interpreter_path)
	resolved_path = result.binary
	describe_failure = result.describe_failure
	else:
	repo_utils.watch(rctx, rctx.attr.interpreter_path)
	resolved_path = rctx.path(rctx.attr.interpreter_path)
	if not resolved_path.exists:
	describe_failure = lambda: "Path not found: {}".format(repr(rctx.attr.interpreter_path))
	else:
	describe_failure = None

	return struct(
	resolved_path = resolved_path,
	describe_failure = describe_failure,
	)

	def _format_get_info_result(info):
	lines = ["GetPythonInfo result:"]
	for key, value in sorted(info.items()):
	lines.append(" {}: {}".format(key, value if value != "" else "<empty string>"))
	return "\n".join(lines)