| From d20698e4802b801807d0474f1d1d003b13c78277 Mon Sep 17 00:00:00 2001 |
| From: Tim Windelschmidt <tim@monogon.tech> |
| Date: Fri, 12 Jan 2024 15:44:41 +0100 |
| Subject: [PATCH] Improve reproducibility |
| |
| Fixes a few issues with rules_rust/rustc reproducibility when the same code is |
| being built in slightly different BuildConfigurations. |
| |
| Even if BuildConfigurations differ only by insignificant (to rules_rust) |
| configuration flags, the resulting output directory will be different (keyed by |
| an 'ST-hash' which is generated from the configuration). |
| |
| Unfortunately, rust/rules_rust really likes to embed bazel-out/<dir>/bin paths |
| into the binaries by default, thus embedding the ST-hash, thus leading to |
| different bit-for-bit binaries when built across two slightly different |
| configs. |
| |
| We fix this by doing two changes: |
| |
| 1. We override the codegen metadata hash suffix to not depend on the ST-hash |
| directory name. Otherwise, built rlibs will have a numeric .XXX suffix that |
| changes depending on the ST-hash. We have to do this separately for prost |
| codegen, too. |
| 2. We add a remap path option to rustc that replaces bazel-out/<dir>/bin/ with |
| bin/. |
| --- |
| proto/prost/private/prost.bzl | 4 +++- |
| proto/protobuf/proto.bzl | 2 +- |
| rust/private/clippy.bzl | 2 +- |
| rust/private/rust.bzl | 6 +++--- |
| rust/private/rustc.bzl | 4 ++++ |
| rust/private/utils.bzl | 7 +++++-- |
| 6 files changed, 17 insertions(+), 8 deletions(-) |
| |
| diff --git a/proto/prost/private/prost.bzl b/proto/prost/private/prost.bzl |
| index e3e5e382..b91123f3 100644 |
| --- a/proto/prost/private/prost.bzl |
| +++ b/proto/prost/private/prost.bzl |
| @@ -125,7 +125,9 @@ def _compile_rust(ctx, attr, crate_name, src, deps, edition): |
| A DepVariantInfo provider. |
| """ |
| toolchain = ctx.toolchains["@rules_rust//rust:toolchain_type"] |
| - output_hash = repr(hash(src.path + ".prost")) |
| + src_path = src.path.replace(ctx.bin_dir.path, 'bin') |
| + print(src.path, src_path) |
| + output_hash = repr(hash(src_path + ".prost")) |
| |
| lib_name = "{prefix}{name}-{lib_hash}{extension}".format( |
| prefix = "lib", |
| diff --git a/proto/protobuf/proto.bzl b/proto/protobuf/proto.bzl |
| index 7b254305..d61a1cbc 100644 |
| --- a/proto/protobuf/proto.bzl |
| +++ b/proto/protobuf/proto.bzl |
| @@ -187,7 +187,7 @@ def _rust_proto_compile(protos, descriptor_sets, imports, crate_name, ctx, is_gr |
| srcs.append(lib_rs) |
| |
| # And simulate rust_library behavior |
| - output_hash = determine_output_hash(lib_rs, ctx.label) |
| + output_hash = determine_output_hash(ctx.bin_dir, lib_rs, ctx.label) |
| rust_lib = ctx.actions.declare_file("%s/lib%s-%s.rlib" % ( |
| output_dir, |
| crate_name, |
| diff --git a/rust/private/clippy.bzl b/rust/private/clippy.bzl |
| index 9fd9842c..54a0547c 100644 |
| --- a/rust/private/clippy.bzl |
| +++ b/rust/private/clippy.bzl |
| @@ -120,7 +120,7 @@ def _clippy_aspect_impl(target, ctx): |
| dep_info = dep_info, |
| linkstamp_outs = linkstamp_outs, |
| ambiguous_libs = ambiguous_libs, |
| - output_hash = determine_output_hash(crate_info.root, ctx.label), |
| + output_hash = determine_output_hash(ctx.bin_dir, crate_info.root, ctx.label), |
| rust_flags = [], |
| out_dir = out_dir, |
| build_env_files = build_env_files, |
| diff --git a/rust/private/rust.bzl b/rust/private/rust.bzl |
| index 7727febb..217f1059 100644 |
| --- a/rust/private/rust.bzl |
| +++ b/rust/private/rust.bzl |
| @@ -159,7 +159,7 @@ def _rust_library_common(ctx, crate_type): |
| if crate_type in ["cdylib", "staticlib"]: |
| output_hash = None |
| else: |
| - output_hash = determine_output_hash(crate_root, ctx.label) |
| + output_hash = determine_output_hash(ctx.bin_dir, crate_root, ctx.label) |
| |
| rust_lib_name = determine_lib_name( |
| crate_name, |
| @@ -310,7 +310,7 @@ def _rust_test_impl(ctx): |
| # Target is building the crate in `test` config |
| crate = ctx.attr.crate[rust_common.crate_info] if rust_common.crate_info in ctx.attr.crate else ctx.attr.crate[rust_common.test_crate_info].crate |
| |
| - output_hash = determine_output_hash(crate.root, ctx.label) |
| + output_hash = determine_output_hash(ctx.bin_dir, crate.root, ctx.label) |
| output = ctx.actions.declare_file( |
| "test-%s/%s%s" % ( |
| output_hash, |
| @@ -369,7 +369,7 @@ def _rust_test_impl(ctx): |
| crate_root = crate_root_src(ctx.attr.name, ctx.files.srcs, crate_root_type) |
| srcs, crate_root = transform_sources(ctx, ctx.files.srcs, crate_root) |
| |
| - output_hash = determine_output_hash(crate_root, ctx.label) |
| + output_hash = determine_output_hash(ctx.bin_dir, crate_root, ctx.label) |
| output = ctx.actions.declare_file( |
| "test-%s/%s%s" % ( |
| output_hash, |
| diff --git a/rust/private/rustc.bzl b/rust/private/rustc.bzl |
| index ef3479e5..06c94574 100644 |
| --- a/rust/private/rustc.bzl |
| +++ b/rust/private/rustc.bzl |
| @@ -966,6 +966,10 @@ def construct_arguments( |
| if remap_path_prefix != None: |
| rustc_flags.add("--remap-path-prefix=${{pwd}}={}".format(remap_path_prefix)) |
| |
| + # Replace unstable bindir path (based on ST-hash which is in turn based on |
| + # build configuration) with a stable bin/ path. |
| + rustc_flags.add("--remap-path-prefix={}=bin".format(ctx.bin_dir.path)) |
| + |
| if emit: |
| rustc_flags.add_joined(emit_with_paths, format_joined = "--emit=%s", join_with = ",") |
| if error_format != "json": |
| diff --git a/rust/private/utils.bzl b/rust/private/utils.bzl |
| index 4e9b4b79..82317359 100644 |
| --- a/rust/private/utils.bzl |
| +++ b/rust/private/utils.bzl |
| @@ -182,7 +182,7 @@ def abs(value): |
| return -value |
| return value |
| |
| -def determine_output_hash(crate_root, label): |
| +def determine_output_hash(bin_dir, crate_root, label): |
| """Generates a hash of the crate root file's path. |
| |
| Args: |
| @@ -193,8 +193,11 @@ def determine_output_hash(crate_root, label): |
| str: A string representation of the hash. |
| """ |
| |
| + # Remove any unstable BuildConfiguration derived dir fragments to unify |
| + # hashes between different configs. |
| + crate_root_path = crate_root.path.replace(bin_dir.path, 'bin') |
| # Take the absolute value of hash() since it could be negative. |
| - h = abs(hash(crate_root.path) + hash(repr(label))) |
| + h = abs(hash(crate_root_path) + hash(repr(label))) |
| return repr(h) |
| |
| def get_preferred_artifact(library_to_link, use_pic): |
| -- |
| 2.42.0 |
| |