Skip to content

Commit dd9a970

Browse files
PGO for LLVM builds on x86_64-unknown-linux-gnu in CI
This shows up to 5% less instruction counts on multiple benchmarks, and up to 19% wins on the -j1 wall times for rustc self-compilation. We can afford to spend the extra cycles building LLVM essentially once more for the x86_64-unknown-linux-gnu CI build today. The builder finishes in around 50 minutes on average, and this adds just 10 more minutes. Given the sizeable improvements in compiler performance, this is definitely worth it.
1 parent c0490a2 commit dd9a970

File tree

6 files changed

+84
-52
lines changed

6 files changed

+84
-52
lines changed

src/bootstrap/config.rs

+4
Original file line numberDiff line numberDiff line change
@@ -143,6 +143,8 @@ pub struct Config {
143143
pub rust_new_symbol_mangling: bool,
144144
pub rust_profile_use: Option<String>,
145145
pub rust_profile_generate: Option<String>,
146+
pub llvm_profile_use: Option<String>,
147+
pub llvm_profile_generate: bool,
146148

147149
pub build: TargetSelection,
148150
pub hosts: Vec<TargetSelection>,
@@ -605,6 +607,8 @@ impl Config {
605607
if let Some(value) = flags.deny_warnings {
606608
config.deny_warnings = value;
607609
}
610+
config.llvm_profile_use = flags.llvm_profile_use;
611+
config.llvm_profile_generate = flags.llvm_profile_generate;
608612

609613
if config.dry_run {
610614
let dir = config.out.join("tmp-dry-run");

src/bootstrap/flags.rs

+18-2
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,13 @@ pub struct Flags {
7171

7272
pub rust_profile_use: Option<String>,
7373
pub rust_profile_generate: Option<String>,
74+
75+
pub llvm_profile_use: Option<String>,
76+
// LLVM doesn't support a custom location for generating profile
77+
// information.
78+
//
79+
// llvm_out/build/profiles/ is the location this writes to.
80+
pub llvm_profile_generate: bool,
7481
}
7582

7683
pub enum Subcommand {
@@ -225,8 +232,15 @@ To learn more about a subcommand, run `./x.py <subcommand> -h`",
225232
VALUE overrides the skip-rebuild option in config.toml.",
226233
"VALUE",
227234
);
228-
opts.optopt("", "rust-profile-generate", "generate PGO profile with rustc build", "FORMAT");
229-
opts.optopt("", "rust-profile-use", "use PGO profile for rustc build", "FORMAT");
235+
opts.optopt(
236+
"",
237+
"rust-profile-generate",
238+
"generate PGO profile with rustc build",
239+
"PROFILE",
240+
);
241+
opts.optopt("", "rust-profile-use", "use PGO profile for rustc build", "PROFILE");
242+
opts.optflag("", "llvm-profile-generate", "generate PGO profile with llvm built for rustc");
243+
opts.optopt("", "llvm-profile-use", "use PGO profile for llvm build", "PROFILE");
230244

231245
// We can't use getopt to parse the options until we have completed specifying which
232246
// options are valid, but under the current implementation, some options are conditional on
@@ -685,6 +699,8 @@ Arguments:
685699
.expect("`color` should be `always`, `never`, or `auto`"),
686700
rust_profile_use: matches.opt_str("rust-profile-use"),
687701
rust_profile_generate: matches.opt_str("rust-profile-generate"),
702+
llvm_profile_use: matches.opt_str("llvm-profile-use"),
703+
llvm_profile_generate: matches.opt_present("llvm-profile-generate"),
688704
}
689705
}
690706
}

src/bootstrap/native.rs

+8
Original file line numberDiff line numberDiff line change
@@ -188,6 +188,14 @@ impl Step for Llvm {
188188
.define("LLVM_TARGET_ARCH", target_native.split('-').next().unwrap())
189189
.define("LLVM_DEFAULT_TARGET_TRIPLE", target_native);
190190

191+
if builder.config.llvm_profile_generate {
192+
cfg.define("LLVM_BUILD_INSTRUMENTED", "IR");
193+
cfg.define("LLVM_BUILD_RUNTIME", "No");
194+
}
195+
if let Some(path) = builder.config.llvm_profile_use.as_ref() {
196+
cfg.define("LLVM_PROFDATA_FILE", &path);
197+
}
198+
191199
if target != "aarch64-apple-darwin" && !target.contains("windows") {
192200
cfg.define("LLVM_ENABLE_ZLIB", "ON");
193201
} else {

src/ci/docker/host-x86_64/dist-x86_64-linux/Dockerfile

+6
Original file line numberDiff line numberDiff line change
@@ -82,6 +82,12 @@ COPY host-x86_64/dist-x86_64-linux/build-clang.sh /tmp/
8282
RUN ./build-clang.sh
8383
ENV CC=clang CXX=clang++
8484

85+
ENV PERF_COMMIT 1e19fc4c6168d2f7596e512f42f358f245d8f09d
86+
RUN curl -LS -o perf.zip https://github.com/rust-lang/rustc-perf/archive/$PERF_COMMIT.zip && \
87+
unzip perf.zip && \
88+
mv rustc-perf-$PERF_COMMIT rustc-perf && \
89+
rm perf.zip
90+
8591
COPY scripts/sccache.sh /scripts/
8692
RUN sh /scripts/sccache.sh
8793

src/ci/docker/host-x86_64/dist-x86_64-linux/build-clang.sh

+2-1
Original file line numberDiff line numberDiff line change
@@ -26,8 +26,9 @@ hide_output \
2626
-DCMAKE_CXX_COMPILER=/rustroot/bin/g++ \
2727
-DCMAKE_BUILD_TYPE=Release \
2828
-DCMAKE_INSTALL_PREFIX=/rustroot \
29+
-DCOMPILER_RT_BUILD_SANITIZERS=OFF \
2930
-DLLVM_TARGETS_TO_BUILD=X86 \
30-
-DLLVM_ENABLE_PROJECTS="clang;lld" \
31+
-DLLVM_ENABLE_PROJECTS="clang;lld;compiler-rt" \
3132
-DC_INCLUDE_DIRS="$INC"
3233

3334
hide_output make -j$(nproc)

src/ci/pgo.sh

+46-49
Original file line numberDiff line numberDiff line change
@@ -5,61 +5,58 @@ set -euxo pipefail
55
rm -rf /tmp/rustc-pgo
66

77
python3 ../x.py build --target=$PGO_HOST --host=$PGO_HOST \
8-
--stage 2 library/std --rust-profile-generate=/tmp/rustc-pgo
8+
--stage 2 library/std \
9+
--rust-profile-generate=/tmp/rustc-pgo \
10+
--llvm-profile-generate
911

12+
# Profile libcore compilation in opt-level=0 and opt-level=3
1013
RUSTC_BOOTSTRAP=1 ./build/$PGO_HOST/stage2/bin/rustc --edition=2018 \
1114
--crate-type=lib ../library/core/src/lib.rs
12-
13-
# Download and build a single-file stress test benchmark on perf.rust-lang.org.
14-
function pgo_perf_benchmark {
15-
local PERF=1e19fc4c6168d2f7596e512f42f358f245d8f09d
16-
local github_prefix=https://raw.githubusercontent.com/rust-lang/rustc-perf/$PERF
17-
local name=$1
18-
local edition=$2
19-
curl -o /tmp/$name.rs $github_prefix/collector/benchmarks/$name/src/lib.rs
20-
21-
RUSTC_BOOTSTRAP=1 ./build/$PGO_HOST/stage2/bin/rustc --edition=$edition \
22-
--crate-type=lib /tmp/$name.rs
23-
}
24-
25-
pgo_perf_benchmark externs 2018
26-
pgo_perf_benchmark ctfe-stress-4 2018
27-
pgo_perf_benchmark inflate 2015
28-
29-
cp -pri ../src/tools/cargo /tmp/cargo
30-
31-
# The Cargo repository does not have a Cargo.lock in it, as it relies on the
32-
# lockfile already present in the rust-lang/rust monorepo. This decision breaks
33-
# down when Cargo is built outside the monorepo though (like in this case),
34-
# resulting in a build without any dependency locking.
35-
#
36-
# To ensure Cargo is built with locked dependencies even during PGO profiling
37-
# the following command copies the monorepo's lockfile into the Cargo temporary
38-
# directory. Cargo will *not* keep that lockfile intact, as it will remove all
39-
# the dependencies Cargo itself doesn't rely on. Still, it will prevent
40-
# building Cargo with arbitrary dependency versions.
41-
#
42-
# See #81378 for the bug that prompted adding this.
43-
cp -p ../Cargo.lock /tmp/cargo
44-
45-
# Build cargo (with some flags)
46-
function pgo_cargo {
47-
RUSTC=./build/$PGO_HOST/stage2/bin/rustc \
48-
./build/$PGO_HOST/stage0/bin/cargo $@ \
49-
--manifest-path /tmp/cargo/Cargo.toml
50-
}
51-
52-
# Build a couple different variants of Cargo
53-
CARGO_INCREMENTAL=1 pgo_cargo check
54-
echo 'pub fn barbarbar() {}' >> /tmp/cargo/src/cargo/lib.rs
55-
CARGO_INCREMENTAL=1 pgo_cargo check
56-
touch /tmp/cargo/src/cargo/lib.rs
57-
CARGO_INCREMENTAL=1 pgo_cargo check
58-
pgo_cargo build --release
15+
RUSTC_BOOTSTRAP=1 ./build/$PGO_HOST/stage2/bin/rustc --edition=2018 \
16+
--crate-type=lib -Copt-level=3 ../library/core/src/lib.rs
17+
18+
cp -r /tmp/rustc-perf ./
19+
chown -R $(whoami): ./rustc-perf
20+
cd rustc-perf
21+
22+
RUST_LOG=collector=debug \
23+
RUSTC=/checkout/obj/build/$PGO_HOST/stage0/bin/rustc \
24+
RUSTC_BOOTSTRAP=1 \
25+
/checkout/obj/build/$PGO_HOST/stage0/bin/cargo build -p collector
26+
27+
# benchmark using profile_local with eprintln, which essentially just means
28+
# don't actually benchmark -- just make sure we run rustc a bunch of times.
29+
RUST_LOG=collector=debug \
30+
RUSTC=/checkout/obj/build/$PGO_HOST/stage0/bin/rustc \
31+
RUSTC_BOOTSTRAP=1 \
32+
/checkout/obj/build/$PGO_HOST/stage0/bin/cargo run -p collector --bin collector -- \
33+
profile_local \
34+
eprintln \
35+
/checkout/obj/build/$PGO_HOST/stage2/bin/rustc \
36+
Test \
37+
--builds Check,Debug,Opt \
38+
--cargo /checkout/obj/build/$PGO_HOST/stage0/bin/cargo \
39+
--runs All \
40+
--include externs,ctfe-stress-4,inflate,cargo,token-stream-stress,match-stress-enum
41+
42+
cd /checkout/obj
5943

6044
# Merge the profile data we gathered
6145
./build/$PGO_HOST/llvm/bin/llvm-profdata \
6246
merge -o /tmp/rustc-pgo.profdata /tmp/rustc-pgo
6347

48+
# Merge the profile data we gathered for LLVM
49+
# Note that this uses the profdata from the clang we used to build LLVM,
50+
# which likely has a different version than our in-tree clang.
51+
/rustroot/bin/llvm-profdata \
52+
merge -o /tmp/llvm-pgo.profdata ./build/$PGO_HOST/llvm/build/profiles
53+
54+
# Rustbuild currently doesn't support rebuilding LLVM when PGO options
55+
# change (or any other llvm-related options); so just clear out the relevant
56+
# directories ourselves.
57+
rm -r ./build/$PGO_HOST/llvm ./build/$PGO_HOST/lld
58+
6459
# This produces the actual final set of artifacts.
65-
$@ --rust-profile-use=/tmp/rustc-pgo.profdata
60+
$@ \
61+
--rust-profile-use=/tmp/rustc-pgo.profdata \
62+
--llvm-profile-use=/tmp/llvm-pgo.profdata

0 commit comments

Comments
 (0)