Skip to content

Commit

Permalink
Add support for remote_files for http_archive
Browse files Browse the repository at this point in the history
This issue adds support necessary to tackle
bazelbuild/bazel-central-registry#1566

Add two new attributes to http_archive: remote_file_urls and
remote_file_integrity.

The purpose of these two attributes is to allow files to effectively be
overlaid ontop of an http_archive. The goal of such functionality would
be useful for BCR since the BUILD & WORKSPACE files need no longer be
stored as patch files.

This means we could probably deprecate `build_file` since that could be
referenced as a file:// url in the remote_file_urls attribute.

Co-authored-by: Mark Williams <mark.r.williams@google.com>
  • Loading branch information
fzakaria and Mark Williams committed Apr 26, 2024
1 parent 7e862eb commit 2899c6e
Show file tree
Hide file tree
Showing 4 changed files with 196 additions and 0 deletions.
11 changes: 11 additions & 0 deletions src/test/shell/bazel/BUILD
Original file line number Diff line number Diff line change
Expand Up @@ -803,6 +803,17 @@ sh_test(
shard_count = 3,
)

sh_test(
name = "external_remote_file_test",
size = "small",
srcs = ["external_remote_file_test.sh"],
data = [
":test-deps",
"@bazel_tools//tools/bash/runfiles",
],
# shard_count = 3,
)

sh_test(
name = "external_path_test",
size = "medium",
Expand Down
142 changes: 142 additions & 0 deletions src/test/shell/bazel/external_remote_file_test.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,142 @@
#!/bin/bash
#
# Copyright 2017 The Bazel Authors. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Tests the patching functionality of external repositories.

set -euo pipefail
# --- begin runfiles.bash initialization ---
if [[ ! -d "${RUNFILES_DIR:-/dev/null}" && ! -f "${RUNFILES_MANIFEST_FILE:-/dev/null}" ]]; then
if [[ -f "$0.runfiles_manifest" ]]; then
export RUNFILES_MANIFEST_FILE="$0.runfiles_manifest"
elif [[ -f "$0.runfiles/MANIFEST" ]]; then
export RUNFILES_MANIFEST_FILE="$0.runfiles/MANIFEST"
elif [[ -f "$0.runfiles/bazel_tools/tools/bash/runfiles/runfiles.bash" ]]; then
export RUNFILES_DIR="$0.runfiles"
fi
fi
if [[ -f "${RUNFILES_DIR:-/dev/null}/bazel_tools/tools/bash/runfiles/runfiles.bash" ]]; then
source "${RUNFILES_DIR}/bazel_tools/tools/bash/runfiles/runfiles.bash"
elif [[ -f "${RUNFILES_MANIFEST_FILE:-/dev/null}" ]]; then
source "$(grep -m1 "^bazel_tools/tools/bash/runfiles/runfiles.bash " \
"$RUNFILES_MANIFEST_FILE" | cut -d ' ' -f 2-)"
else
echo >&2 "ERROR: cannot find @bazel_tools//tools/bash/runfiles:runfiles.bash"
exit 1
fi
# --- end runfiles.bash initialization ---

source "$(rlocation "io_bazel/src/test/shell/integration_test_setup.sh")" \
|| { echo "integration_test_setup.sh not found!" >&2; exit 1; }

# `uname` returns the current platform, e.g "MSYS_NT-10.0" or "Linux".
# `tr` converts all upper case letters to lower case.
# `case` matches the result if the `uname | tr` expression to string prefixes
# that use the same wildcards as names do in Bash, i.e. "msys*" matches strings
# starting with "msys", and "*" matches everything (it's the default case).
case "$(uname -s | tr [:upper:] [:lower:])" in
msys*)
# As of 2019-01-15, Bazel on Windows only supports MSYS Bash.
declare -r is_windows=true
;;
*)
declare -r is_windows=false
;;
esac

if "$is_windows"; then
# Disable MSYS path conversion that converts path-looking command arguments to
# Windows paths (even if they arguments are not in fact paths).
export MSYS_NO_PATHCONV=1
export MSYS2_ARG_CONV_EXCL="*"
fi


if $is_windows; then
export MSYS_NO_PATHCONV=1
export MSYS2_ARG_CONV_EXCL="*"
fi

set_up() {
WRKDIR=$(mktemp -d "${TEST_TMPDIR}/testXXXXXX")
cd "${WRKDIR}"
write_default_lockfile "MODULE.bazel.lock"
# create an archive file with files interesting for patching
mkdir hello_world-0.1.2
cat > hello_world-0.1.2/hello_world.c <<'EOF'
#include <stdio.h>
int main() {
printf("Hello, world!\n");
return 0;
}
EOF
zip hello_world.zip hello_world-0.1.2/*
rm -rf hello_world-0.1.2
}

function get_extrepourl() {
if $is_windows; then
echo "file:///$(cygpath -m $1)"
else
echo "file://$1"
fi
}


test_overlay_remote_file_with_integrity() {
EXTREPODIR=`pwd`
EXTREPOURL="$(get_extrepourl ${EXTREPODIR})"

# Generate the remote files to overlay
# this could be like the Bazel Central Repository
# Generate the remote patch file
cat > BUILD.bazel <<'EOF'
load("@rules_cc//cc:defs.bzl", "cc_binary")
cc_binary(
name = "hello_world",
srcs = ["hello_world.c"],
)
EOF
touch WORKSPACE

# Test that the patches attribute of http_archive is honored
mkdir main
cd main
cat > WORKSPACE <<EOF
load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
http_archive(
name="hello_world",
strip_prefix="hello_world-0.1.2",
urls=["${EXTREPOURL}/hello_world.zip"],
remote_file_urls={
"WORKSPACE": ["${EXTREPOURL}/WORKSPACE"],
"BUILD.bazel": ["${EXTREPOURL}/BUILD.bazel"],
},
remote_file_integrity={
"WORKSPACE": "sha256-47DEQpj8HBSa+/TImW+5JCeuQeRkm5NMpJWZG3hSuFU=",
"BUILD.bazel": "sha256-0bs+dwSOzHTbNAgDS02I3giLAZu2/NLn7BJWwQGN/Pk=",
},
)
EOF
write_default_lockfile "MODULE.bazel.lock"

# TODO(fzakaria): I found this command to fail since it tries to spawn sandbox
# within a sandbox. I'm not sure how the other tests that build cc_binary get
# around this.
bazel build @hello_world//:hello_world --spawn_strategy=local
}

run_suite "external remote file tests"
19 changes: 19 additions & 0 deletions tools/build_defs/repo/http.bzl
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,7 @@ load(
":utils.bzl",
"get_auth",
"patch",
"remote_files",
"update_attrs",
"workspace_and_buildfile",
)
Expand Down Expand Up @@ -139,6 +140,8 @@ def _http_archive_impl(ctx):
auth = get_auth(ctx, all_urls)

download_info = ctx.download_and_extract(
# TODO(fzakaria): all_urls here has the remote_patch URL which is incorrect
# I believe this to be a file
all_urls,
ctx.attr.add_prefix,
ctx.attr.sha256,
Expand All @@ -149,6 +152,8 @@ def _http_archive_impl(ctx):
integrity = ctx.attr.integrity,
)
workspace_and_buildfile(ctx)

remote_files(ctx, auth = auth)
patch(ctx, auth = auth)

return _update_integrity_attr(ctx, _http_archive_attrs, download_info)
Expand Down Expand Up @@ -304,6 +309,20 @@ following: `"zip"`, `"jar"`, `"war"`, `"aar"`, `"tar"`, `"tar.gz"`, `"tgz"`,
"patch command line tool if `patch_tool` attribute is specified or there are " +
"arguments other than `-p` in `patch_args` attribute.",
),
"remote_file_urls": attr.string_list_dict(
default = {},
doc =
"A list of URLs to files that are to be downloaded and made available to be used as " +
"overlaid files. This is useful when you want to add WORKSPACE or BUILD.bazel files " +
"atop an existing repository. The files are downloaded before applying " +
"the patches in the `patches` attribute.",
),
"remote_file_integrity": attr.string_dict(
default = {},
doc =
"A map of file URL to its integrity value. These URLs should map to the files in " +
"the `remote_file_urls` attribute.",
),
"remote_patches": attr.string_dict(
default = {},
doc =
Expand Down
24 changes: 24 additions & 0 deletions tools/build_defs/repo/utils.bzl
Original file line number Diff line number Diff line change
Expand Up @@ -91,6 +91,30 @@ def _download_patch(ctx, patch_url, integrity, auth):
)
return patch_path

def remote_files(ctx, auth = None):
"""Utility function for downloading remote files.
This rule is intended to be used in the implementation function of
a repository rule. It assumes the parameters `remote_file_urls` and
`remote_file_integrity` to be present in `ctx.attr`.
Args:
ctx: The repository context of the repository rule calling this utility
function.
auth: An optional dict specifying authentication information for some of the URLs.
"""
for path, remote_file_urls in ctx.attr.remote_file_urls.items():
# integrity is optional but really recommended
integrity = ctx.attr.remote_file_integrity.get(path)

ctx.download(
remote_file_urls,
path,
canonical_id = ctx.attr.canonical_id,
auth = auth,
integrity = integrity,
)

def patch(ctx, patches = None, patch_cmds = None, patch_cmds_win = None, patch_tool = None, patch_args = None, auth = None):
"""Implementation of patching an already extracted repository.
Expand Down

0 comments on commit 2899c6e

Please sign in to comment.