Skip to content

Commit

Permalink
Merge matklad#233
Browse files Browse the repository at this point in the history
233: Make `unsync::Lazy<T, F>` covariant in `F` r=matklad a=danielhenrymantilla

"Continuation" from matklad#230, which partially handles matklad#167.

  - Incidentally, this also makes `unsync::Lazy` smaller in size in most cases, since `T` and `F` are now sharing the same `union` storage.

The `sync` can basically use the same logic (my PR paves the way for such a follow-up PR), only the whole thing would need to be moved to each of the possible `imp`lementations of `sync::OnceCell`, and special care to synchronization semantics will be in order, which I prefer to let somebody else do.

Co-authored-by: Daniel Henry-Mantilla <daniel.henry.mantilla@gmail.com>
  • Loading branch information
bors[bot] and danielhenrymantilla authored Jun 3, 2023
2 parents 8f39b77 + 179b2a9 commit e3b2260
Show file tree
Hide file tree
Showing 2 changed files with 174 additions and 23 deletions.
133 changes: 110 additions & 23 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -716,15 +716,52 @@ pub mod unsync {
/// // 92
/// ```
pub struct Lazy<T, F = fn() -> T> {
cell: OnceCell<T>,
init: Cell<Option<F>>,
state: Cell<State>,
data: Data<T, F>,
}

/// Discriminant of the union.
#[derive(Debug, Clone, Copy)]
enum State {
/// `.init` has not been taken yet.
Uninit,
/// `.init` has been *taken*, but the call has not completed (panic?), so there is no `.value` either.
Poisoned,
/// `.value` has been set.
Value,
}

// One of the rare cases `#[repr(C)]` is not needed for an union ("externally tagged `enum`" pattern)
union Data<T, F> {
/// Idea: we don't need *mutation* to dispose of `F`, we can just let it be there, inert, behind a MD.
///
/// This makes it so we remain covariant in `F`.
init: mem::ManuallyDrop<F>,
value: mem::ManuallyDrop<UnsafeCell<T>>,
}

impl<T, F> Drop for Lazy<T, F> {
fn drop(&mut self) {
match self.state.get_mut() {
State::Value => unsafe { mem::ManuallyDrop::drop(&mut self.data.value) },
State::Uninit => unsafe { mem::ManuallyDrop::drop(&mut self.data.init) },
State::Poisoned => {}
}
}
}

impl<T, F: RefUnwindSafe> RefUnwindSafe for Lazy<T, F> where OnceCell<T>: RefUnwindSafe {}

impl<T: fmt::Debug, F> fmt::Debug for Lazy<T, F> {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
f.debug_struct("Lazy").field("cell", &self.cell).field("init", &"..").finish()
match self.state.get() {
// `Lazy("some value")`
State::Value => {
f.debug_tuple("Lazy").field(unsafe { &*self.data.value.get() }).finish()
}
// `Uninit`, or `Poisoned`
state => state.fmt(f),
}
}
}

Expand All @@ -744,18 +781,28 @@ pub mod unsync {
/// # }
/// ```
pub const fn new(init: F) -> Lazy<T, F> {
Lazy { cell: OnceCell::new(), init: Cell::new(Some(init)) }
Lazy {
state: Cell::new(State::Uninit),
data: Data { init: mem::ManuallyDrop::new(init) },
}
}

/// Consumes this `Lazy` returning the stored value.
///
/// Returns `Ok(value)` if `Lazy` is initialized and `Err(f)` otherwise.
pub fn into_value(this: Lazy<T, F>) -> Result<T, F> {
let cell = this.cell;
let init = this.init;
cell.into_inner().ok_or_else(|| {
init.take().unwrap_or_else(|| panic!("Lazy instance has previously been poisoned"))
})
// Safety: beyond the typical "check discriminant before accessing corresponding union variant",
// we have to be careful not to run `this`' `impl Drop` glue as we extract its fields,
// hence the initial extra layer of `ManuallyDrop`.
// Once that's done nothing is owned anymore, so we are free to `ManuallyDrop::take` what we want.
let mut this = mem::ManuallyDrop::new(this);
match this.state.get_mut() {
State::Value => {
Ok(unsafe { mem::ManuallyDrop::take(&mut this.data.value) }.into_inner())
}
State::Uninit => Err(unsafe { mem::ManuallyDrop::take(&mut this.data.init) }),
State::Poisoned => panic!("Lazy instance has previously been poisoned"),
}
}
}

Expand All @@ -775,10 +822,37 @@ pub mod unsync {
/// assert_eq!(&*lazy, &92);
/// ```
pub fn force(this: &Lazy<T, F>) -> &T {
this.cell.get_or_init(|| match this.init.take() {
Some(f) => f(),
None => panic!("Lazy instance has previously been poisoned"),
})
match this.state.get() {
State::Value => unsafe { &*this.data.value.get() },
State::Uninit => {
// Safety: `<*const _>::read(&*...)` is the by-ref counterpart of `ManuallyDrop::take`.
// We are allowed to `take` the `F` once we have taken its `State::Uninit` discriminant.
// We cannot put `State::Value` in its stead yet in case `init()` panics.
// Hence the `Poisoned` / "empty `Lazy`" state.
let init = unsafe {
this.state.set(State::Poisoned);
<*const F>::read(&*this.data.init)
};
let value = init();
unsafe {
// Safety: here we need to tread with caution, since we need to "pick a union variant"
// without accidentally asserting that the `ManuallyDrop<... T ...>` is init since it still isn't.
// Hence `ptr::addr_of!`.
let ptr: *const mem::ManuallyDrop<UnsafeCell<T>> =
core::ptr::addr_of!(this.data.value);
// There is no raw accessor on `ManuallyDrop`, but it's a `transparent` wrapper so we can
// just `.cast()` that layer away.
let ptr: *const UnsafeCell<T> = ptr.cast();
// To handle the `UnsafeCell` layer, no need for casts, there is a dedicated API.
let ptr: *mut T = UnsafeCell::raw_get(ptr);
// Once we've gotten the pointer, the rest is easy: set the value and discriminants accordingly.
ptr.write(value);
this.state.set(State::Value);
&*ptr
}
}
State::Poisoned => panic!("Lazy instance has previously been poisoned"),
}
}

/// Forces the evaluation of this lazy value and returns a mutable reference to
Expand All @@ -796,14 +870,25 @@ pub mod unsync {
/// assert_eq!(*lazy, 92);
/// ```
pub fn force_mut(this: &mut Lazy<T, F>) -> &mut T {
if this.cell.get_mut().is_none() {
let value = match this.init.get_mut().take() {
Some(f) => f(),
None => panic!("Lazy instance has previously been poisoned"),
};
this.cell = OnceCell::with_value(value);
let state = this.state.get_mut();
match state {
State::Value => unsafe { (*this.data.value).get_mut() },
State::Uninit => {
// Safety: same reasoning as with `force`, except simpler since we can use `&mut` accesses.
// (so we do not need to worry about any `UnsafeCell` shenanigans)
let init = unsafe {
*state = State::Poisoned;
mem::ManuallyDrop::take(&mut this.data.init)
};
let value = mem::ManuallyDrop::new(init().into());
unsafe {
core::ptr::addr_of_mut!(this.data.value).write(value);
*state = State::Value;
(*this.data.value).get_mut()
}
}
State::Poisoned => panic!("Lazy instance has previously been poisoned"),
}
this.cell.get_mut().unwrap_or_else(|| unreachable!())
}

/// Gets the reference to the result of this lazy value if
Expand All @@ -820,7 +905,7 @@ pub mod unsync {
/// assert_eq!(Lazy::get(&lazy), Some(&92));
/// ```
pub fn get(this: &Lazy<T, F>) -> Option<&T> {
this.cell.get()
matches!(this.state.get(), State::Value).then(|| unsafe { &*this.data.value.get() })
}

/// Gets the mutable reference to the result of this lazy value if
Expand All @@ -837,7 +922,8 @@ pub mod unsync {
/// assert_eq!(Lazy::get_mut(&mut lazy), Some(&mut 92));
/// ```
pub fn get_mut(this: &mut Lazy<T, F>) -> Option<&mut T> {
this.cell.get_mut()
matches!(this.state.get_mut(), State::Value)
.then(|| unsafe { (*this.data.value).get_mut() })
}
}

Expand Down Expand Up @@ -1290,7 +1376,8 @@ pub mod sync {
let cell = this.cell;
let init = this.init;
cell.into_inner().ok_or_else(|| {
init.take().unwrap_or_else(|| panic!("Lazy instance has previously been poisoned"))
init.into_inner()
.unwrap_or_else(|| panic!("Lazy instance has previously been poisoned"))
})
}
}
Expand Down
64 changes: 64 additions & 0 deletions tests/it.rs
Original file line number Diff line number Diff line change
@@ -1,3 +1,53 @@
/// Put here any code relying on duck-typed `Lazy` and `OnceCell`, oblivious to
/// their exact `sync` or `unsync` nature.
macro_rules! tests_for_both {
() => {
#[test]
fn lazy_does_drop() {
type Counter = std::rc::Rc<()>;

let (counter, [c1, c2, c3]) = {
let c = Counter::new(());
(Counter::downgrade(&c), [(); 3].map(|()| c.clone()))
};
assert_eq!(counter.strong_count(), 3);

let lazy_1 = Lazy::<Counter, _>::new(|| c1);
assert_eq!(counter.strong_count(), 3);
drop(lazy_1);
assert_eq!(
counter.strong_count(),
2,
"dropping a `Lazy::Uninit` drops the `init` closure"
);

let lazy_2 = Lazy::<Counter, _>::new(|| c2);
Lazy::force(&lazy_2);
assert_eq!(
counter.strong_count(),
2,
"from `Lazy::Uninit` to `Lazy::Value` drops `init` but owns `value`"
);
drop(lazy_2);
assert_eq!(counter.strong_count(), 1, "dropping a `Lazy::Value` drops its `value`");

let lazy_3 = Lazy::<Counter, _>::new(|| {
None::<()>.unwrap();
c3
});
assert_eq!(counter.strong_count(), 1);
let _ = std::panic::catch_unwind(|| Lazy::force(&lazy_3)).expect_err("it panicked");
assert_eq!(
counter.strong_count(),
0,
"`init` closure is properly dropped despite panicking"
);
drop(lazy_3);
assert_eq!(counter.strong_count(), 0, "what is dead may never die 🧟");
}
};
}

mod unsync {
use core::{
cell::Cell,
Expand All @@ -6,6 +56,8 @@ mod unsync {

use once_cell::unsync::{Lazy, OnceCell};

tests_for_both!();

#[test]
fn once_cell() {
let c = OnceCell::new();
Expand Down Expand Up @@ -247,6 +299,16 @@ mod unsync {
cell.set(&s).unwrap();
}
}

#[test]
fn assert_lazy_is_covariant_in_the_ctor() {
#[allow(dead_code)]
type AnyLazy<'f, T> = Lazy<T, Box<dyn 'f + FnOnce() -> T>>;

fn _for<'short, T>(it: *const (AnyLazy<'static, T>,)) -> *const (AnyLazy<'short, T>,) {
it
}
}
}

#[cfg(any(feature = "std", feature = "critical-section"))]
Expand All @@ -263,6 +325,8 @@ mod sync {

use once_cell::sync::{Lazy, OnceCell};

tests_for_both!();

#[test]
fn once_cell() {
let c = OnceCell::new();
Expand Down

0 comments on commit e3b2260

Please sign in to comment.