blob: 1998e4fb3391ea43320e216ad8aa7d2ed0c338fc [file] [log] [blame]
# Copyright 2024 The Bazel Authors. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
A file that houses private functions used in the `bzlmod` extension with the same name.
"""
# Just list them here and me super conservative
_KNOWN_EXTS = [
# Note, the following source in pip has more extensions
# https://github.com/pypa/pip/blob/3c5a189141a965f21a473e46c3107e689eb9f79f/src/pip/_vendor/distlib/locators.py#L90
#
# ".tar.bz2",
# ".tar",
# ".tgz",
# ".tbz",
#
# But we support only the following, used in 'packaging'
# https://github.com/pypa/pip/blob/3c5a189141a965f21a473e46c3107e689eb9f79f/src/pip/_vendor/packaging/utils.py#L137
".whl",
".tar.gz",
".zip",
]
def index_sources(line):
"""Get PyPI sources from a requirements.txt line.
We interpret the spec described in
https://pip.pypa.io/en/stable/reference/requirement-specifiers/#requirement-specifiers
Args:
line(str): The requirements.txt entry.
Returns:
A struct with shas attribute containing:
* `shas` - list[str]; shas to download from pypi_index.
* `version` - str; version of the package.
* `marker` - str; the marker expression, as per PEP508 spec.
* `requirement` - str; a requirement line without the marker. This can
be given to `pip` to install a package.
* `url` - str; URL if the requirement specifies a direct URL, empty string otherwise.
"""
line = line.replace("\\", " ")
head, _, maybe_hashes = line.partition(";")
_, _, version = head.partition("==")
version = version.partition(" ")[0].strip()
marker, _, _ = maybe_hashes.partition("--hash=")
maybe_hashes = maybe_hashes or line
shas = [
sha.strip()
for sha in maybe_hashes.split("--hash=sha256:")[1:]
]
marker = marker.strip()
if head == line:
requirement = line.partition("--hash=")[0].strip()
else:
requirement = head.strip()
requirement_line = "{} {}".format(
requirement,
" ".join(["--hash=sha256:{}".format(sha) for sha in shas]),
).strip()
url = ""
filename = ""
if "@" in head:
maybe_requirement, _, url_and_rest = requirement.partition("@")
url = url_and_rest.strip().partition(" ")[0].strip()
url, _, sha256 = url.partition("#sha256=")
if sha256:
shas.append(sha256)
_, _, filename = url.rpartition("/")
# Replace URL encoded characters and luckily there is only one case
filename = filename.replace("%2B", "+")
is_known_ext = False
for ext in _KNOWN_EXTS:
if filename.endswith(ext):
is_known_ext = True
break
requirement = requirement_line
if filename.endswith(".whl"):
requirement = maybe_requirement.strip()
elif not is_known_ext:
# could not detect filename from the URL
filename = ""
return struct(
requirement = requirement,
requirement_line = requirement_line,
version = version,
shas = sorted(shas),
marker = marker,
url = url,
filename = filename,
)