Skip to content

Commit 6d676d0

Browse files
committed
bootstrap: use internment instead of hand-rolled interning
1 parent 6689597 commit 6d676d0

File tree

4 files changed

+57
-203
lines changed

4 files changed

+57
-203
lines changed

src/bootstrap/Cargo.lock

+39
Original file line number | Diff line number | Diff line change
@@ -11,6 +11,12 @@ dependencies = [
1111
"memchr",
1212
]
1313

14+
[[package]]
15+
name = "allocator-api2"
16+
version = "0.2.19"
17+
source = "registry+https://github.com/rust-lang/crates.io-index"
18+
checksum = "611cc2ae7d2e242c457e4be7f97036b8ad9ca152b499f53faf99b1ed8fc2553f"
19+
1420
[[package]]
1521
name = "anstyle"
1622
version = "1.0.8"
@@ -44,6 +50,7 @@ dependencies = [
4450
"fd-lock",
4551
"home",
4652
"ignore",
53+
"internment",
4754
"junction",
4855
"libc",
4956
"object",
@@ -219,6 +226,12 @@ dependencies = [
219226
"crypto-common",
220227
]
221228

229+
[[package]]
230+
name = "equivalent"
231+
version = "1.0.1"
232+
source = "registry+https://github.com/rust-lang/crates.io-index"
233+
checksum = "5443807d6dff69373d433ab9ef5378ad8df50ca6298caf15de6e52e24aaf54d5"
234+
222235
[[package]]
223236
name = "errno"
224237
version = "0.3.9"
@@ -252,6 +265,12 @@ dependencies = [
252265
"windows-sys 0.59.0",
253266
]
254267

268+
[[package]]
269+
name = "foldhash"
270+
version = "0.1.3"
271+
source = "registry+https://github.com/rust-lang/crates.io-index"
272+
checksum = "f81ec6369c545a7d40e4589b5597581fa1c441fe1cce96dd1de43159910a36a2"
273+
255274
[[package]]
256275
name = "generic-array"
257276
version = "0.14.7"
@@ -275,6 +294,17 @@ dependencies = [
275294
"regex-syntax",
276295
]
277296

297+
[[package]]
298+
name = "hashbrown"
299+
version = "0.15.1"
300+
source = "registry+https://github.com/rust-lang/crates.io-index"
301+
checksum = "3a9bfc1af68b1726ea47d3d5109de126281def866b33970e10fbab11b5dafab3"
302+
dependencies = [
303+
"allocator-api2",
304+
"equivalent",
305+
"foldhash",
306+
]
307+
278308
[[package]]
279309
name = "heck"
280310
version = "0.5.0"
@@ -306,6 +336,15 @@ dependencies = [
306336
"winapi-util",
307337
]
308338

339+
[[package]]
340+
name = "internment"
341+
version = "0.8.6"
342+
source = "registry+https://github.com/rust-lang/crates.io-index"
343+
checksum = "636d4b0f6a39fd684effe2a73f5310df16a3fa7954c26d36833e98f44d1977a2"
344+
dependencies = [
345+
"hashbrown",
346+
]
347+
309348
[[package]]
310349
name = "itoa"
311350
version = "1.0.11"

src/bootstrap/Cargo.toml

+1
Original file line number | Diff line number | Diff line change
@@ -45,6 +45,7 @@ clap = { version = "4.4", default-features = false, features = ["std", "usage",
4545
clap_complete = "4.4"
4646
fd-lock = "4.0"
4747
home = "0.5"
48+
internment = "0.8.5"
4849
ignore = "0.4"
4950
libc = "0.2"
5051
object = { version = "0.36.3", default-features = false, features = ["archive", "coff", "read_core", "unaligned"] }

src/bootstrap/src/core/config/config.rs

+16-14
Original file line number | Diff line number | Diff line change
@@ -24,7 +24,7 @@ use crate::core::build_steps::llvm;
2424
pub use crate::core::config::flags::Subcommand;
2525
use crate::core::config::flags::{Color, Flags, Warnings};
2626
use crate::core::download::is_download_ci_available;
27-
use crate::utils::cache::{INTERNER, Interned};
27+
use crate::utils::cache::Interned;
2828
use crate::utils::channel::{self, GitInfo};
2929
use crate::utils::helpers::{self, exe, output, t};
3030

@@ -465,15 +465,21 @@ impl std::str::FromStr for RustcLto {
465465
}
466466
}
467467

468-
#[derive(Copy, Clone, Default, PartialEq, Eq, PartialOrd, Ord, Hash)]
468+
#[derive(Copy, Clone, PartialEq, Eq, PartialOrd, Ord, Hash)]
469469
// N.B.: This type is used everywhere, and the entire codebase relies on it being Copy.
470470
// Making it !Copy is highly nontrivial!
471471
pub struct TargetSelection {
472-
pub triple: Interned<String>,
473-
file: Option<Interned<String>>,
472+
pub triple: Interned<str>,
473+
file: Option<Interned<str>>,
474474
synthetic: bool,
475475
}
476476

477+
impl Default for TargetSelection {
478+
fn default() -> Self {
479+
Self { triple: "".into(), file: Default::default(), synthetic: Default::default() }
480+
}
481+
}
482+
477483
/// Newtype over `Vec<TargetSelection>` so we can implement custom parsing logic
478484
#[derive(Clone, Default, PartialEq, Eq, PartialOrd, Ord, Hash, Debug)]
479485
pub struct TargetSelectionList(Vec<TargetSelection>);
@@ -500,18 +506,14 @@ impl TargetSelection {
500506
(selection, None)
501507
};
502508

503-
let triple = INTERNER.intern_str(triple);
504-
let file = file.map(|f| INTERNER.intern_str(f));
509+
let triple: Interned<str> = triple.into();
510+
let file: Option<Interned<str>> = file.map(|f| f.into());
505511

506512
Self { triple, file, synthetic: false }
507513
}
508514

509515
pub fn create_synthetic(triple: &str, file: &str) -> Self {
510-
Self {
511-
triple: INTERNER.intern_str(triple),
512-
file: Some(INTERNER.intern_str(file)),
513-
synthetic: true,
514-
}
516+
Self { triple: triple.into(), file: Some(file.into()), synthetic: true }
515517
}
516518

517519
pub fn rustc_target_arg(&self) -> &str {
@@ -571,15 +573,15 @@ impl fmt::Debug for TargetSelection {
571573

572574
impl PartialEq<&str> for TargetSelection {
573575
fn eq(&self, other: &&str) -> bool {
574-
self.triple == *other
576+
&*self.triple == *other
575577
}
576578
}
577579

578580
// Targets are often used as directory names throughout bootstrap.
579581
// This impl makes it more ergonomic to use them as such.
580582
impl AsRef<Path> for TargetSelection {
581583
fn as_ref(&self) -> &Path {
582-
self.triple.as_ref()
584+
(*self.triple).as_ref()
583585
}
584586
}
585587

@@ -2119,7 +2121,7 @@ impl Config {
21192121
// thus, disabled
21202122
// - similarly, lld will not be built nor used by default when explicitly asked not to, e.g.
21212123
// when the config sets `rust.lld = false`
2122-
if config.build.triple == "x86_64-unknown-linux-gnu"
2124+
if &*config.build.triple == "x86_64-unknown-linux-gnu"
21232125
&& config.hosts == [config.build]
21242126
&& (config.channel == "dev" || config.channel == "nightly")
21252127
{

src/bootstrap/src/utils/cache.rs

+1-189
Original file line number | Diff line number | Diff line change
@@ -1,198 +1,10 @@
11
use std::any::{Any, TypeId};
2-
use std::borrow::Borrow;
32
use std::cell::RefCell;
4-
use std::cmp::Ordering;
53
use std::collections::HashMap;
6-
use std::hash::{Hash, Hasher};
7-
use std::marker::PhantomData;
8-
use std::ops::Deref;
9-
use std::path::PathBuf;
10-
use std::sync::{LazyLock, Mutex};
11-
use std::{fmt, mem};
124

135
use crate::core::builder::Step;
146

15-
pub struct Interned<T>(usize, PhantomData<*const T>);
16-
17-
impl<T: Internable + Default> Default for Interned<T> {
18-
fn default() -> Self {
19-
T::default().intern()
20-
}
21-
}
22-
23-
impl<T> Copy for Interned<T> {}
24-
impl<T> Clone for Interned<T> {
25-
fn clone(&self) -> Interned<T> {
26-
*self
27-
}
28-
}
29-
30-
impl<T> PartialEq for Interned<T> {
31-
fn eq(&self, other: &Self) -> bool {
32-
self.0 == other.0
33-
}
34-
}
35-
impl<T> Eq for Interned<T> {}
36-
37-
impl PartialEq<str> for Interned<String> {
38-
fn eq(&self, other: &str) -> bool {
39-
*self == other
40-
}
41-
}
42-
impl PartialEq<&str> for Interned<String> {
43-
fn eq(&self, other: &&str) -> bool {
44-
**self == **other
45-
}
46-
}
47-
impl<T> PartialEq<&Interned<T>> for Interned<T> {
48-
fn eq(&self, other: &&Self) -> bool {
49-
self.0 == other.0
50-
}
51-
}
52-
impl<T> PartialEq<Interned<T>> for &Interned<T> {
53-
fn eq(&self, other: &Interned<T>) -> bool {
54-
self.0 == other.0
55-
}
56-
}
57-
58-
unsafe impl<T> Send for Interned<T> {}
59-
unsafe impl<T> Sync for Interned<T> {}
60-
61-
impl fmt::Display for Interned<String> {
62-
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
63-
let s: &str = self;
64-
f.write_str(s)
65-
}
66-
}
67-
68-
impl<T, U: ?Sized + fmt::Debug> fmt::Debug for Interned<T>
69-
where
70-
Self: Deref<Target = U>,
71-
{
72-
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
73-
let s: &U = self;
74-
f.write_fmt(format_args!("{s:?}"))
75-
}
76-
}
77-
78-
impl<T: Internable + Hash> Hash for Interned<T> {
79-
fn hash<H: Hasher>(&self, state: &mut H) {
80-
let l = T::intern_cache().lock().unwrap();
81-
l.get(*self).hash(state)
82-
}
83-
}
84-
85-
impl<T: Internable + Deref> Deref for Interned<T> {
86-
type Target = T::Target;
87-
fn deref(&self) -> &Self::Target {
88-
let l = T::intern_cache().lock().unwrap();
89-
unsafe { mem::transmute::<&Self::Target, &Self::Target>(l.get(*self)) }
90-
}
91-
}
92-
93-
impl<T: Internable + AsRef<U>, U: ?Sized> AsRef<U> for Interned<T> {
94-
fn as_ref(&self) -> &U {
95-
let l = T::intern_cache().lock().unwrap();
96-
unsafe { mem::transmute::<&U, &U>(l.get(*self).as_ref()) }
97-
}
98-
}
99-
100-
impl<T: Internable + PartialOrd> PartialOrd for Interned<T> {
101-
fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
102-
let l = T::intern_cache().lock().unwrap();
103-
l.get(*self).partial_cmp(l.get(*other))
104-
}
105-
}
106-
107-
impl<T: Internable + Ord> Ord for Interned<T> {
108-
fn cmp(&self, other: &Self) -> Ordering {
109-
let l = T::intern_cache().lock().unwrap();
110-
l.get(*self).cmp(l.get(*other))
111-
}
112-
}
113-
114-
struct TyIntern<T: Clone + Eq> {
115-
items: Vec<T>,
116-
set: HashMap<T, Interned<T>>,
117-
}
118-
119-
impl<T: Hash + Clone + Eq> Default for TyIntern<T> {
120-
fn default() -> Self {
121-
TyIntern { items: Vec::new(), set: Default::default() }
122-
}
123-
}
124-
125-
impl<T: Hash + Clone + Eq> TyIntern<T> {
126-
fn intern_borrow<B>(&mut self, item: &B) -> Interned<T>
127-
where
128-
B: Eq + Hash + ToOwned<Owned = T> + ?Sized,
129-
T: Borrow<B>,
130-
{
131-
if let Some(i) = self.set.get(item) {
132-
return *i;
133-
}
134-
let item = item.to_owned();
135-
let interned = Interned(self.items.len(), PhantomData::<*const T>);
136-
self.set.insert(item.clone(), interned);
137-
self.items.push(item);
138-
interned
139-
}
140-
141-
fn intern(&mut self, item: T) -> Interned<T> {
142-
if let Some(i) = self.set.get(&item) {
143-
return *i;
144-
}
145-
let interned = Interned(self.items.len(), PhantomData::<*const T>);
146-
self.set.insert(item.clone(), interned);
147-
self.items.push(item);
148-
interned
149-
}
150-
151-
fn get(&self, i: Interned<T>) -> &T {
152-
&self.items[i.0]
153-
}
154-
}
155-
156-
#[derive(Default)]
157-
pub struct Interner {
158-
strs: Mutex<TyIntern<String>>,
159-
paths: Mutex<TyIntern<PathBuf>>,
160-
lists: Mutex<TyIntern<Vec<String>>>,
161-
}
162-
163-
trait Internable: Clone + Eq + Hash + 'static {
164-
fn intern_cache() -> &'static Mutex<TyIntern<Self>>;
165-
166-
fn intern(self) -> Interned<Self> {
167-
Self::intern_cache().lock().unwrap().intern(self)
168-
}
169-
}
170-
171-
impl Internable for String {
172-
fn intern_cache() -> &'static Mutex<TyIntern<Self>> {
173-
&INTERNER.strs
174-
}
175-
}
176-
177-
impl Internable for PathBuf {
178-
fn intern_cache() -> &'static Mutex<TyIntern<Self>> {
179-
&INTERNER.paths
180-
}
181-
}
182-
183-
impl Internable for Vec<String> {
184-
fn intern_cache() -> &'static Mutex<TyIntern<Self>> {
185-
&INTERNER.lists
186-
}
187-
}
188-
189-
impl Interner {
190-
pub fn intern_str(&self, s: &str) -> Interned<String> {
191-
self.strs.lock().unwrap().intern_borrow(s)
192-
}
193-
}
194-
195-
pub static INTERNER: LazyLock<Interner> = LazyLock::new(Interner::default);
7+
pub type Interned<T> = internment::Intern<T>;
1968

1979
/// This is essentially a `HashMap` which allows storing any type in its input and
19810
/// any type in its output. It is a write-once cache; values are never evicted,

0 commit comments

Comments
 (0)