Skip to content

Commit

Permalink
Achieve perfect reproducibility for dev setups
Browse files Browse the repository at this point in the history
This commit changes the default C++ toolchain to the custom nix-backed
clang toolchain.

- Update custom stdenv to use Clang/LLVM 18
- Regenerate LRE toolchains.
- Remove obsolete zig_cc toolchain
- Expand LRE CI to build C++ parts of NativeLink remotely in K8s and the
  rest of rules_rust locally.

Fixes TraceMachina#694
Closes TraceMachina#477
  • Loading branch information
aaronmondal committed Apr 23, 2024
1 parent f79b59b commit 2739656
Show file tree
Hide file tree
Showing 19 changed files with 2,865 additions and 2,859 deletions.
32 changes: 14 additions & 18 deletions .bazelrc
Original file line number Diff line number Diff line change
Expand Up @@ -75,24 +75,6 @@ build:windows --enable_runfiles
# toolchains are resolved before the rust toolchains.
build --extra_toolchains=@rust_toolchains//:all

# Option to test the zig toolchain on Linux. Prefer the default `linux`
# toolchain which builds cc targets roughly twice as fast.
#
# WARNING:
#
# We're using an incredibly old target glibc here. Builds created with this
# toolchain have maximum compatibility (theoretically down to Ubuntu 18), but
# miss out on half a decade of optimizations. Don't use this for production
# builds if you're running a non-ancient OS and care about performance.
#
# TODO(aaronmondal): Migrate to a statically linked musl as soon as rules_rust
# supports it. This way we get to keep (or even improve)
# backwards compatibility without sacrificing performance.
build:linux_zig --host_platform=@zig_sdk//platform:linux_amd64
build:linux_zig --extra_toolchains=@zig_sdk//libc_aware/toolchain:linux_amd64_gnu.2.28
build:linux_zig --repo_env=BAZEL_DO_NOT_DETECT_CPP_TOOLCHAIN=1


# Local Remote Execution.
build:lre --extra_execution_platforms=@local-remote-execution//generated-cc/config:platform
build:lre --extra_toolchains=@local-remote-execution//generated-cc/config:cc-toolchain"
Expand All @@ -105,5 +87,19 @@ build:lre --repo_env=BAZEL_DO_NOT_DETECT_CPP_TOOLCHAIN=1
# is resolved.
build:lre --define=EXECUTOR=remote

# rules_rust doesn't properly work with remote execution.
#
# Note(aaronmondal): It's technically possible to run this build in some remote
# execution images, such as ubuntu-based images. Those images only pretend to be
# reproducible (think /usr/bin/clang which could be any version of clang). This
# disables anything that doesn't "properly" execute remotely.
common:lre --strategy=Rustc=local
common:lre --strategy=CargoBuildScriptRun=local
common:lre --strategy=Rustfmt=local
common:lre --strategy=Clippy=local
common:lre --strategy=TestRunner=local
common:lre --strategy=Rustdoc=local
common:lre --strategy=Genrule=local # Genrules break remotely as well.

# Allow user-side customization.
try-import %workspace%/.bazelrc.user
20 changes: 20 additions & 0 deletions .github/workflows/lre.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -42,6 +42,15 @@ jobs:
--verbose_failures \
@local-remote-execution//examples:hello_lre"
- name: Build NativeLink with LRE.
run: >
nix develop --impure --command
bash -c "bazel test \
--config=lre \
--verbose_failures \
..."
remote:
strategy:
fail-fast: false
Expand Down Expand Up @@ -109,3 +118,14 @@ jobs:
--remote_executor=grpc://$scheduler_ip:50052 \
--verbose_failures \
@local-remote-execution//examples:hello_lre"
- name: Build NativeLink with LRE.
run: >
nix develop --impure --command
bash -c "bazel test \
--config=lre \
--remote_instance_name=main \
--remote_cache=grpc://$cache_ip:50051 \
--remote_executor=grpc://$scheduler_ip:50052 \
--verbose_failures \
..."
4 changes: 2 additions & 2 deletions .github/workflows/main.yml
Original file line number Diff line number Diff line change
Expand Up @@ -58,15 +58,15 @@ jobs:
cd ../../ && \
docker run --rm --net=host -w /root/nativelink -v $PWD:/root/nativelink trace_machina/nativelink:builder sh -c ' \
bazel clean && \
bazel test --config=linux_zig //... \
bazel test //... \
--remote_instance_name=main \
--remote_cache=grpc://127.0.0.1:50051 \
--remote_executor=grpc://127.0.0.1:50052 \
--remote_default_exec_properties=cpu_count=1 \
' && \
docker run --rm --net=host -w /root/nativelink -v $PWD:/root/nativelink trace_machina/nativelink:builder sh -c ' \
bazel clean && \
bazel test --config=linux_zig //... \
bazel test //... \
--remote_instance_name=main \
--remote_cache=grpc://127.0.0.1:50051 \
--remote_executor=grpc://127.0.0.1:50052 \
Expand Down
34 changes: 0 additions & 34 deletions .github/workflows/native-bazel.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -69,37 +69,3 @@ jobs:
exit 1
fi
shell: bash

zig-cc-unit-tests:
strategy:
fail-fast: false
matrix:
os: [ubuntu-20.04, ubuntu-22.04]
name: zig-cc ${{ matrix.os }}
runs-on: ${{ matrix.os }}
steps:

- name: Checkout
uses: >- # v4.1.1
actions/checkout@b4ffde65f46336ab88eb53be808477a3936bae11
- name: Setup Bazelisk
uses: >- # v0.8.1
bazel-contrib/setup-bazel@b388b84bb637e50cdae241d0f255670d4bd79f29
with:
bazelisk-cache: true

- name: Mount bazel cache
uses: >- # v4.0.1
actions/cache@ab5e6d0c87105b4c9c2047343972218f562e4319
with:
path: |
~/.cache/bazel
key: |
${{ matrix.os }}-bazel-legacy-${{ hashFiles('.bazelversion', '.bazelrc', 'WORKSPACE.bazel', 'MODULE.bazel') }}
restore-keys: |
${{ matrix.os }}-bazel-legacy-
- name: Run Bazel tests
run: |
bazel test --config=linux_zig //... --verbose_failures
2 changes: 1 addition & 1 deletion .github/workflows/nix.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ jobs:
run: |
if [ "$RUNNER_OS" == "Linux" ]; then
nix develop --impure --command \
bash -c "bazel test --config=linux_zig ... --verbose_failures"
bash -c "bazel test ... --verbose_failures"
elif [ "$RUNNER_OS" == "macOS" ]; then
nix develop --impure --command \
bash -c "bazel test //... --verbose_failures"
Expand Down
10 changes: 1 addition & 9 deletions MODULE.bazel
Original file line number Diff line number Diff line change
Expand Up @@ -18,14 +18,6 @@ python.toolchain(
)
use_repo(python, python = "python_versions")

bazel_dep(name = "hermetic_cc_toolchain", version = "3.0.1")

zig_toolchains = use_extension(
"@hermetic_cc_toolchain//toolchain:ext.bzl",
"toolchains",
)
use_repo(zig_toolchains, "zig_sdk")

bazel_dep(name = "rules_rust", version = "0.42.1")

rust = use_extension("@rules_rust//rust:extensions.bzl", "rust")
Expand Down Expand Up @@ -72,7 +64,7 @@ crate.from_cargo(
)
use_repo(crate, "crates")

bazel_dep(name = "protobuf", version = "23.1")
bazel_dep(name = "protobuf", version = "26.0")

# Local remote execution.
bazel_dep(name = "local-remote-execution", version = "0.0.0")
Expand Down
24 changes: 12 additions & 12 deletions flake.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

102 changes: 53 additions & 49 deletions flake.nix
Original file line number Diff line number Diff line change
Expand Up @@ -73,8 +73,6 @@

customStdenv = import ./tools/llvmStdenv.nix {inherit pkgs;};

# TODO(aaronmondal): This doesn't work with rules_rust yet.
# Tracked in https://github.com/TraceMachina/nativelink/issues/477.
customClang = pkgs.callPackage ./tools/customClang.nix {
inherit pkgs;
stdenv = customStdenv;
Expand Down Expand Up @@ -154,10 +152,17 @@
};
};
in rec {
_module.args.pkgs = import self.inputs.nixpkgs {
inherit system;
overlays = [(import rust-overlay)];
};
_module.args.pkgs = let
nixpkgs-patched = (import self.inputs.nixpkgs {inherit system;}).applyPatches {
name = "nixpkgs-patched";
src = self.inputs.nixpkgs;
patches = [./tools/nixpkgs_link_libunwind_and_libcxx.diff];
};
in
import nixpkgs-patched {
inherit system;
overlays = [(import rust-overlay)];
};
apps = {
default = {
type = "app";
Expand Down Expand Up @@ -206,49 +211,48 @@
# });
};
pre-commit.settings = {inherit hooks;};
devShells.default = pkgs.mkShell {
nativeBuildInputs =
[
# Development tooling goes here.
stable-rust-native.default
pkgs.pre-commit
pkgs.bazel_7
pkgs.awscli2
pkgs.skopeo
pkgs.dive
pkgs.cosign
pkgs.kubectl
pkgs.kubernetes-helm
pkgs.cilium-cli
pkgs.yarn
pkgs.vale
pkgs.trivy
pkgs.docker-client
pkgs.kind
pkgs.tektoncd-cli
(pkgs.pulumi.withPackages (ps: [ps.pulumi-language-go]))
pkgs.go

# Additional tools from within our development environment.
local-image-test
generate-toolchains
customClang
native-cli
]
++ maybeDarwinDeps;
shellHook = ''
# Generate the .pre-commit-config.yaml symlink when entering the
# development shell.
${config.pre-commit.installationScript}
# The Bazel and Cargo builds in nix require a Clang toolchain.
# TODO(aaronmondal): The Bazel build currently uses the
# irreproducible host C++ toolchain. Provide
# this toolchain via nix for bitwise identical
# binaries across machines.
export CC=clang
'';
};
devShells.default =
pkgs.mkShell.override {
stdenv = customStdenv;
} {
nativeBuildInputs =
[
# Development tooling goes here.
stable-rust-native.default
pkgs.pre-commit
pkgs.bazel_7
pkgs.awscli2
pkgs.skopeo
pkgs.dive
pkgs.cosign
pkgs.kubectl
pkgs.kubernetes-helm
pkgs.cilium-cli
pkgs.yarn
pkgs.vale
pkgs.trivy
pkgs.docker-client
pkgs.kind
pkgs.tektoncd-cli
(pkgs.pulumi.withPackages (ps: [ps.pulumi-language-go]))
pkgs.go

# Additional tools from within our development environment.
local-image-test
generate-toolchains
customClang
native-cli
]
++ maybeDarwinDeps;
shellHook = ''
# Generate the .pre-commit-config.yaml symlink when entering the
# development shell.
${config.pre-commit.installationScript}
# The Bazel and Cargo builds in nix require a Clang toolchain.
export CC=customClang
'';
};
};
};
}
Loading

0 comments on commit 2739656

Please sign in to comment.