Skip to content

Commit 09b1254

Browse files
authored
Rollup merge of rust-lang#109124 - ferrocene:pa-compression-mode, r=Mark-Simulacrum
Add `dist.compression-profile` option to control compression speed PR rust-lang#108534 reduced the size of compressed archives, but (as expected) it also resulted in way longer compression times and memory usage during compression. It's desirable to keep status quo (smaller archives but more CI usage), but it should also be configurable so that downstream users don't have to waste that much time on CI. As a data point, this resulted in doubling the time of Ferrocene's dist jobs, and required us to increase the RAM allocation for one of such jobs. This PR adds a new `config.toml` setting, `dist.compression-profile`. The values can be: * `fast`: equivalent to the gzip and xz preset of "1" * `balanced`: equivalent to the gzip and xz preset of "6" (the CLI defaults as far as I'm aware) * `best`: equivalent to the gzip present of "9", and our custom xz profile The default has also been moved back to `balanced`, to try and avoid the compression time regression for downstream users. I don't feel too strongly on the default, and I'm open to changing it. Also, for the `best` profile the XZ settings do not match the "9" preset used by the CLI, and it might be confusing. Should we create a `custom-rustc-ci`/`ultra` profile for that? r? ``@Mark-Simulacrum``
2 parents e79b182 + 0177176 commit 09b1254

File tree

9 files changed

+127
-47
lines changed

9 files changed

+127
-47
lines changed

config.example.toml

+6
Original file line numberDiff line numberDiff line change
@@ -806,3 +806,9 @@ changelog-seen = 2
806806
#
807807
# This list must be non-empty.
808808
#compression-formats = ["gz", "xz"]
809+
810+
# How much time should be spent compressing the tarballs. The better the
811+
# compression profile, the longer compression will take.
812+
#
813+
# Available options: fast, balanced, best
814+
#compression-profile = "fast"

src/bootstrap/config.rs

+4
Original file line numberDiff line numberDiff line change
@@ -191,6 +191,7 @@ pub struct Config {
191191
pub dist_sign_folder: Option<PathBuf>,
192192
pub dist_upload_addr: Option<String>,
193193
pub dist_compression_formats: Option<Vec<String>>,
194+
pub dist_compression_profile: String,
194195
pub dist_include_mingw_linker: bool,
195196

196197
// libstd features
@@ -703,6 +704,7 @@ define_config! {
703704
src_tarball: Option<bool> = "src-tarball",
704705
missing_tools: Option<bool> = "missing-tools",
705706
compression_formats: Option<Vec<String>> = "compression-formats",
707+
compression_profile: Option<String> = "compression-profile",
706708
include_mingw_linker: Option<bool> = "include-mingw-linker",
707709
}
708710
}
@@ -821,6 +823,7 @@ impl Config {
821823
config.deny_warnings = true;
822824
config.bindir = "bin".into();
823825
config.dist_include_mingw_linker = true;
826+
config.dist_compression_profile = "fast".into();
824827

825828
// set by build.rs
826829
config.build = TargetSelection::from_user(&env!("BUILD_TRIPLE"));
@@ -1308,6 +1311,7 @@ impl Config {
13081311
config.dist_sign_folder = t.sign_folder.map(PathBuf::from);
13091312
config.dist_upload_addr = t.upload_addr;
13101313
config.dist_compression_formats = t.compression_formats;
1314+
set(&mut config.dist_compression_profile, t.compression_profile);
13111315
set(&mut config.rust_dist_src, t.src_tarball);
13121316
set(&mut config.missing_tools, t.missing_tools);
13131317
set(&mut config.dist_include_mingw_linker, t.include_mingw_linker)

src/bootstrap/defaults/config.user.toml

+4
Original file line numberDiff line numberDiff line change
@@ -11,3 +11,7 @@ extended = true
1111
[llvm]
1212
# Most users installing from source want to build all parts of the project from source, not just rustc itself.
1313
download-ci-llvm = false
14+
15+
[dist]
16+
# Use better compression when preparing tarballs.
17+
compression-profile = "balanced"

src/bootstrap/tarball.rs

+1
Original file line numberDiff line numberDiff line change
@@ -318,6 +318,7 @@ impl<'a> Tarball<'a> {
318318
assert!(!formats.is_empty(), "dist.compression-formats can't be empty");
319319
cmd.arg("--compression-formats").arg(formats.join(","));
320320
}
321+
cmd.args(&["--compression-profile", &self.builder.config.dist_compression_profile]);
321322
self.builder.run(&mut cmd);
322323

323324
// Ensure there are no symbolic links in the tarball. In particular,

src/ci/run.sh

+1
Original file line numberDiff line numberDiff line change
@@ -58,6 +58,7 @@ RUST_CONFIGURE_ARGS="$RUST_CONFIGURE_ARGS --disable-manage-submodules"
5858
RUST_CONFIGURE_ARGS="$RUST_CONFIGURE_ARGS --enable-locked-deps"
5959
RUST_CONFIGURE_ARGS="$RUST_CONFIGURE_ARGS --enable-cargo-native-static"
6060
RUST_CONFIGURE_ARGS="$RUST_CONFIGURE_ARGS --set rust.codegen-units-std=1"
61+
RUST_CONFIGURE_ARGS="$RUST_CONFIGURE_ARGS --set dist.compression-profile=best"
6162

6263
# Only produce xz tarballs on CI. gz tarballs will be generated by the release
6364
# process by recompressing the existing xz ones. This decreases the storage

src/tools/rust-installer/src/combiner.rs

+6-1
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
use super::Scripter;
22
use super::Tarballer;
33
use crate::{
4-
compression::{CompressionFormat, CompressionFormats},
4+
compression::{CompressionFormat, CompressionFormats, CompressionProfile},
55
util::*,
66
};
77
use anyhow::{bail, Context, Result};
@@ -48,6 +48,10 @@ actor! {
4848
#[clap(value_name = "DIR")]
4949
output_dir: String = "./dist",
5050

51+
/// The profile used to compress the tarball.
52+
#[clap(value_name = "FORMAT", default_value_t)]
53+
compression_profile: CompressionProfile,
54+
5155
/// The formats used to compress the tarball
5256
#[clap(value_name = "FORMAT", default_value_t)]
5357
compression_formats: CompressionFormats,
@@ -153,6 +157,7 @@ impl Combiner {
153157
.work_dir(self.work_dir)
154158
.input(self.package_name)
155159
.output(path_to_str(&output)?.into())
160+
.compression_profile(self.compression_profile)
156161
.compression_formats(self.compression_formats.clone());
157162
tarballer.run()?;
158163

src/tools/rust-installer/src/compression.rs

+93-43
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,37 @@ use rayon::prelude::*;
44
use std::{convert::TryFrom, fmt, io::Read, io::Write, path::Path, str::FromStr};
55
use xz2::{read::XzDecoder, write::XzEncoder};
66

7+
#[derive(Default, Debug, Copy, Clone)]
8+
pub enum CompressionProfile {
9+
Fast,
10+
#[default]
11+
Balanced,
12+
Best,
13+
}
14+
15+
impl FromStr for CompressionProfile {
16+
type Err = Error;
17+
18+
fn from_str(input: &str) -> Result<Self, Error> {
19+
Ok(match input {
20+
"fast" => Self::Fast,
21+
"balanced" => Self::Balanced,
22+
"best" => Self::Best,
23+
other => anyhow::bail!("invalid compression profile: {other}"),
24+
})
25+
}
26+
}
27+
28+
impl fmt::Display for CompressionProfile {
29+
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
30+
match self {
31+
CompressionProfile::Fast => f.write_str("fast"),
32+
CompressionProfile::Balanced => f.write_str("balanced"),
33+
CompressionProfile::Best => f.write_str("best"),
34+
}
35+
}
36+
}
37+
738
#[derive(Debug, Copy, Clone)]
839
pub enum CompressionFormat {
940
Gz,
@@ -26,7 +57,11 @@ impl CompressionFormat {
2657
}
2758
}
2859

29-
pub(crate) fn encode(&self, path: impl AsRef<Path>) -> Result<Box<dyn Encoder>, Error> {
60+
pub(crate) fn encode(
61+
&self,
62+
path: impl AsRef<Path>,
63+
profile: CompressionProfile,
64+
) -> Result<Box<dyn Encoder>, Error> {
3065
let mut os = path.as_ref().as_os_str().to_os_string();
3166
os.push(format!(".{}", self.extension()));
3267
let path = Path::new(&os);
@@ -37,49 +72,64 @@ impl CompressionFormat {
3772
let file = crate::util::create_new_file(path)?;
3873

3974
Ok(match self {
40-
CompressionFormat::Gz => Box::new(GzEncoder::new(file, flate2::Compression::best())),
75+
CompressionFormat::Gz => Box::new(GzEncoder::new(
76+
file,
77+
match profile {
78+
CompressionProfile::Fast => flate2::Compression::fast(),
79+
CompressionProfile::Balanced => flate2::Compression::new(6),
80+
CompressionProfile::Best => flate2::Compression::best(),
81+
},
82+
)),
4183
CompressionFormat::Xz => {
42-
let mut filters = xz2::stream::Filters::new();
43-
// the preset is overridden by the other options so it doesn't matter
44-
let mut lzma_ops = xz2::stream::LzmaOptions::new_preset(9).unwrap();
45-
// This sets the overall dictionary size, which is also how much memory (baseline)
46-
// is needed for decompression.
47-
lzma_ops.dict_size(64 * 1024 * 1024);
48-
// Use the best match finder for compression ratio.
49-
lzma_ops.match_finder(xz2::stream::MatchFinder::BinaryTree4);
50-
lzma_ops.mode(xz2::stream::Mode::Normal);
51-
// Set nice len to the maximum for best compression ratio
52-
lzma_ops.nice_len(273);
53-
// Set depth to a reasonable value, 0 means auto, 1000 is somwhat high but gives
54-
// good results.
55-
lzma_ops.depth(1000);
56-
// 2 is the default and does well for most files
57-
lzma_ops.position_bits(2);
58-
// 0 is the default and does well for most files
59-
lzma_ops.literal_position_bits(0);
60-
// 3 is the default and does well for most files
61-
lzma_ops.literal_context_bits(3);
62-
63-
filters.lzma2(&lzma_ops);
64-
65-
let mut builder = xz2::stream::MtStreamBuilder::new();
66-
builder.filters(filters);
67-
68-
// On 32-bit platforms limit ourselves to 3 threads, otherwise we exceed memory
69-
// usage this process can take. In the future we'll likely only do super-fast
70-
// compression in CI and move this heavyweight processing to promote-release (which
71-
// is always 64-bit and can run on big-memory machines) but for now this lets us
72-
// move forward.
73-
if std::mem::size_of::<usize>() == 4 {
74-
builder.threads(3);
75-
} else {
76-
builder.threads(6);
77-
}
78-
79-
let compressor = XzEncoder::new_stream(
80-
std::io::BufWriter::new(file),
81-
builder.encoder().unwrap(),
82-
);
84+
let encoder = match profile {
85+
CompressionProfile::Fast => {
86+
xz2::stream::MtStreamBuilder::new().threads(6).preset(1).encoder().unwrap()
87+
}
88+
CompressionProfile::Balanced => {
89+
xz2::stream::MtStreamBuilder::new().threads(6).preset(6).encoder().unwrap()
90+
}
91+
CompressionProfile::Best => {
92+
let mut filters = xz2::stream::Filters::new();
93+
// the preset is overridden by the other options so it doesn't matter
94+
let mut lzma_ops = xz2::stream::LzmaOptions::new_preset(9).unwrap();
95+
// This sets the overall dictionary size, which is also how much memory (baseline)
96+
// is needed for decompression.
97+
lzma_ops.dict_size(64 * 1024 * 1024);
98+
// Use the best match finder for compression ratio.
99+
lzma_ops.match_finder(xz2::stream::MatchFinder::BinaryTree4);
100+
lzma_ops.mode(xz2::stream::Mode::Normal);
101+
// Set nice len to the maximum for best compression ratio
102+
lzma_ops.nice_len(273);
103+
// Set depth to a reasonable value, 0 means auto, 1000 is somwhat high but gives
104+
// good results.
105+
lzma_ops.depth(1000);
106+
// 2 is the default and does well for most files
107+
lzma_ops.position_bits(2);
108+
// 0 is the default and does well for most files
109+
lzma_ops.literal_position_bits(0);
110+
// 3 is the default and does well for most files
111+
lzma_ops.literal_context_bits(3);
112+
113+
filters.lzma2(&lzma_ops);
114+
115+
let mut builder = xz2::stream::MtStreamBuilder::new();
116+
builder.filters(filters);
117+
118+
// On 32-bit platforms limit ourselves to 3 threads, otherwise we exceed memory
119+
// usage this process can take. In the future we'll likely only do super-fast
120+
// compression in CI and move this heavyweight processing to promote-release (which
121+
// is always 64-bit and can run on big-memory machines) but for now this lets us
122+
// move forward.
123+
if std::mem::size_of::<usize>() == 4 {
124+
builder.threads(3);
125+
} else {
126+
builder.threads(6);
127+
}
128+
builder.encoder().unwrap()
129+
}
130+
};
131+
132+
let compressor = XzEncoder::new_stream(std::io::BufWriter::new(file), encoder);
83133
Box::new(compressor)
84134
}
85135
})

src/tools/rust-installer/src/generator.rs

+6-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
use super::Scripter;
22
use super::Tarballer;
3-
use crate::compression::CompressionFormats;
3+
use crate::compression::{CompressionFormats, CompressionProfile};
44
use crate::util::*;
55
use anyhow::{bail, format_err, Context, Result};
66
use std::collections::BTreeSet;
@@ -54,6 +54,10 @@ actor! {
5454
#[clap(value_name = "DIR")]
5555
output_dir: String = "./dist",
5656

57+
/// The profile used to compress the tarball.
58+
#[clap(value_name = "FORMAT", default_value_t)]
59+
compression_profile: CompressionProfile,
60+
5761
/// The formats used to compress the tarball
5862
#[clap(value_name = "FORMAT", default_value_t)]
5963
compression_formats: CompressionFormats,
@@ -113,6 +117,7 @@ impl Generator {
113117
.work_dir(self.work_dir)
114118
.input(self.package_name)
115119
.output(path_to_str(&output)?.into())
120+
.compression_profile(self.compression_profile)
116121
.compression_formats(self.compression_formats.clone());
117122
tarballer.run()?;
118123

src/tools/rust-installer/src/tarballer.rs

+6-2
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ use tar::{Builder, Header};
66
use walkdir::WalkDir;
77

88
use crate::{
9-
compression::{CombinedEncoder, CompressionFormats},
9+
compression::{CombinedEncoder, CompressionFormats, CompressionProfile},
1010
util::*,
1111
};
1212

@@ -25,6 +25,10 @@ actor! {
2525
#[clap(value_name = "DIR")]
2626
work_dir: String = "./workdir",
2727

28+
/// The profile used to compress the tarball.
29+
#[clap(value_name = "FORMAT", default_value_t)]
30+
compression_profile: CompressionProfile,
31+
2832
/// The formats used to compress the tarball.
2933
#[clap(value_name = "FORMAT", default_value_t)]
3034
compression_formats: CompressionFormats,
@@ -38,7 +42,7 @@ impl Tarballer {
3842
let encoder = CombinedEncoder::new(
3943
self.compression_formats
4044
.iter()
41-
.map(|f| f.encode(&tarball_name))
45+
.map(|f| f.encode(&tarball_name, self.compression_profile))
4246
.collect::<Result<Vec<_>>>()?,
4347
);
4448

0 commit comments

Comments
 (0)