From dabc0887532aefa90ae439295d530bdc814febd8 Mon Sep 17 00:00:00 2001 From: Anders Kaseorg Date: Tue, 20 Dec 2022 14:52:59 -0800 Subject: [PATCH 1/5] Remove unnecessary Cell from GcState.boxes_start Signed-off-by: Anders Kaseorg --- gc/src/gc.rs | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/gc/src/gc.rs b/gc/src/gc.rs index 0b30b1c..fc15067 100644 --- a/gc/src/gc.rs +++ b/gc/src/gc.rs @@ -6,7 +6,7 @@ use std::ptr::{self, NonNull}; struct GcState { stats: GcStats, config: GcConfig, - boxes_start: Cell>>>, + boxes_start: Option>>, } impl Drop for GcState { @@ -43,7 +43,7 @@ pub fn finalizer_safe() -> bool { thread_local!(static GC_STATE: RefCell = RefCell::new(GcState { stats: GcStats::default(), config: GcConfig::default(), - boxes_start: Cell::new(None), + boxes_start: None, })); const MARK_MASK: usize = 1 << (usize::BITS - 1); @@ -138,8 +138,7 @@ impl GcBox { data: value, })); - st.boxes_start - .set(Some(unsafe { NonNull::new_unchecked(gcbox) })); + st.boxes_start = Some(unsafe { NonNull::new_unchecked(gcbox) }); // We allocated some bytes! Let's record it st.stats.bytes_allocated += mem::size_of::>(); @@ -240,14 +239,15 @@ fn collect_garbage(st: &mut GcState) { st.stats.collections_performed += 1; unsafe { - let unmarked = mark(&st.boxes_start); + let head = Cell::from_mut(&mut st.boxes_start); + let unmarked = mark(head); if unmarked.is_empty() { return; } for node in &unmarked { Trace::finalize_glue(&(*node.this.as_ptr()).data); } - mark(&st.boxes_start); + mark(head); sweep(unmarked, &mut st.stats.bytes_allocated); } } From d93d72b3769c34278ba1e753511bcfe8fd530dd1 Mon Sep 17 00:00:00 2001 From: Anders Kaseorg Date: Tue, 20 Dec 2022 15:02:37 -0800 Subject: [PATCH 2/5] Use NonNull::as_ref Signed-off-by: Anders Kaseorg --- gc/src/gc.rs | 16 ++++++++-------- gc/src/lib.rs | 4 ++-- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/gc/src/gc.rs b/gc/src/gc.rs index fc15067..7adc38b 100644 --- a/gc/src/gc.rs +++ b/gc/src/gc.rs @@ -198,11 +198,11 @@ fn collect_garbage(st: &mut GcState) { // Walk the tree, tracing and marking the nodes let mut mark_head = head.get(); while let Some(node) = mark_head { - if (*node.as_ptr()).header.roots() > 0 { - (*node.as_ptr()).trace_inner(); + if node.as_ref().header.roots() > 0 { + node.as_ref().trace_inner(); } - mark_head = (*node.as_ptr()).header.next.get(); + mark_head = node.as_ref().header.next.get(); } // Collect a vector of all of the nodes which were not marked, @@ -210,15 +210,15 @@ fn collect_garbage(st: &mut GcState) { let mut unmarked = Vec::new(); let mut unmark_head = head; while let Some(node) = unmark_head.get() { - if (*node.as_ptr()).header.is_marked() { - (*node.as_ptr()).header.unmark(); + if node.as_ref().header.is_marked() { + node.as_ref().header.unmark(); } else { unmarked.push(Unmarked { incoming: unmark_head, this: node, }); } - unmark_head = &(*node.as_ptr()).header.next; + unmark_head = &node.as_ref().header.next; } unmarked } @@ -226,7 +226,7 @@ fn collect_garbage(st: &mut GcState) { unsafe fn sweep(finalized: Vec>, bytes_allocated: &mut usize) { let _guard = DropGuard::new(); for node in finalized.into_iter().rev() { - if (*node.this.as_ptr()).header.is_marked() { + if node.this.as_ref().header.is_marked() { continue; } let incoming = node.incoming; @@ -245,7 +245,7 @@ fn collect_garbage(st: &mut GcState) { return; } for node in &unmarked { - Trace::finalize_glue(&(*node.this.as_ptr()).data); + Trace::finalize_glue(&node.this.as_ref().data); } mark(head); sweep(unmarked, &mut st.stats.bytes_allocated); diff --git a/gc/src/lib.rs b/gc/src/lib.rs index 6babcf5..73f34be 100644 --- a/gc/src/lib.rs +++ b/gc/src/lib.rs @@ -80,9 +80,9 @@ impl Gc { // When we create a Gc, all pointers which have been moved to the // heap no longer need to be rooted, so we unroot them. - (*ptr.as_ptr()).value().unroot(); + ptr.as_ref().value().unroot(); let gc = Gc { - ptr_root: Cell::new(NonNull::new_unchecked(ptr.as_ptr())), + ptr_root: Cell::new(ptr), marker: PhantomData, }; gc.set_root(); From 189a876c3d49fb12f56afd5324629a03f1cd1e8e Mon Sep 17 00:00:00 2001 From: Anders Kaseorg Date: Tue, 20 Dec 2022 14:23:06 -0800 Subject: [PATCH 3/5] Factor out insert_gcbox helper Signed-off-by: Anders Kaseorg --- gc/src/gc.rs | 73 ++++++++++++++++++++++++++++++---------------------- 1 file changed, 42 insertions(+), 31 deletions(-) diff --git a/gc/src/gc.rs b/gc/src/gc.rs index 7adc38b..7d72dbc 100644 --- a/gc/src/gc.rs +++ b/gc/src/gc.rs @@ -57,10 +57,10 @@ pub(crate) struct GcBoxHeader { impl GcBoxHeader { #[inline] - pub fn new(next: Option>>) -> Self { + pub fn new() -> Self { GcBoxHeader { roots: Cell::new(1), // unmarked and roots count = 1 - next: Cell::new(next), + next: Cell::new(None), } } @@ -111,42 +111,53 @@ pub(crate) struct GcBox { impl GcBox { /// Allocates a garbage collected `GcBox` on the heap, - /// and appends it to the thread-local `GcBox` chain. + /// and appends it to the thread-local `GcBox` chain. This might + /// trigger a collection. /// /// A `GcBox` allocated this way starts its life rooted. pub(crate) fn new(value: T) -> NonNull { - GC_STATE.with(|st| { - let mut st = st.borrow_mut(); - - // XXX We should probably be more clever about collecting - if st.stats.bytes_allocated > st.config.threshold { - collect_garbage(&mut st); - - if st.stats.bytes_allocated as f64 - > st.config.threshold as f64 * st.config.used_space_ratio - { - // we didn't collect enough, so increase the - // threshold for next time, to avoid thrashing the - // collector too much/behaving quadratically. - st.config.threshold = - (st.stats.bytes_allocated as f64 / st.config.used_space_ratio) as usize; - } - } + let gcbox = NonNull::from(Box::leak(Box::new(GcBox { + header: GcBoxHeader::new(), + data: value, + }))); + unsafe { insert_gcbox(gcbox) }; + gcbox + } +} - let gcbox = Box::into_raw(Box::new(GcBox { - header: GcBoxHeader::new(st.boxes_start.take()), - data: value, - })); +/// Add a new `GcBox` to the current thread's `GcBox` chain. This +/// might trigger a collection first if enough bytes have been +/// allocated since the previous collection. +/// +/// # Safety +/// +/// `gcbox` must point to a valid `GcBox` that is not yet in a `GcBox` +/// chain. +unsafe fn insert_gcbox(gcbox: NonNull>) { + GC_STATE.with(|st| { + let mut st = st.borrow_mut(); - st.boxes_start = Some(unsafe { NonNull::new_unchecked(gcbox) }); + // XXX We should probably be more clever about collecting + if st.stats.bytes_allocated > st.config.threshold { + collect_garbage(&mut st); + + if st.stats.bytes_allocated as f64 + > st.config.threshold as f64 * st.config.used_space_ratio + { + // we didn't collect enough, so increase the + // threshold for next time, to avoid thrashing the + // collector too much/behaving quadratically. + st.config.threshold = + (st.stats.bytes_allocated as f64 / st.config.used_space_ratio) as usize; + } + } - // We allocated some bytes! Let's record it - st.stats.bytes_allocated += mem::size_of::>(); + let next = st.boxes_start.replace(gcbox); + gcbox.as_ref().header.next.set(next); - // Return the pointer to the newly allocated data - unsafe { NonNull::new_unchecked(gcbox) } - }) - } + // We allocated some bytes! Let's record it + st.stats.bytes_allocated += mem::size_of_val::>(gcbox.as_ref()); + }); } impl GcBox { From 5d6a7a11ee0fb7d21c3aa57e9e038533f7415dc3 Mon Sep 17 00:00:00 2001 From: Anders Kaseorg Date: Tue, 20 Dec 2022 14:27:10 -0800 Subject: [PATCH 4/5] Factor out from_gcbox helper Signed-off-by: Anders Kaseorg --- gc/src/lib.rs | 36 ++++++++++++++++++++++-------------- 1 file changed, 22 insertions(+), 14 deletions(-) diff --git a/gc/src/lib.rs b/gc/src/lib.rs index 73f34be..19e09a5 100644 --- a/gc/src/lib.rs +++ b/gc/src/lib.rs @@ -72,22 +72,30 @@ impl Gc { /// assert_eq!(*five, 5); /// ``` pub fn new(value: T) -> Self { - assert!(mem::align_of::>() > 1); + unsafe { Gc::from_gcbox(GcBox::new(value)) } + } +} - unsafe { - // Allocate the memory for the object - let ptr = GcBox::new(value); +impl Gc { + /// Constructs a `Gc` that points to a new `GcBox`. + /// + /// # Safety + /// + /// `ptr` must point to a valid `GcBox` on the thread-local + /// `GcBox` chain. + #[inline] + unsafe fn from_gcbox(ptr: NonNull>) -> Gc { + assert!(mem::align_of_val::>(ptr.as_ref()) > 1); - // When we create a Gc, all pointers which have been moved to the - // heap no longer need to be rooted, so we unroot them. - ptr.as_ref().value().unroot(); - let gc = Gc { - ptr_root: Cell::new(ptr), - marker: PhantomData, - }; - gc.set_root(); - gc - } + // When we create a Gc, all pointers which have been moved to the + // heap no longer need to be rooted, so we unroot them. + ptr.as_ref().value().unroot(); + let gc = Gc { + ptr_root: Cell::new(ptr), + marker: PhantomData, + }; + gc.set_root(); + gc } } From 743271ea8cabcf542aab05ac05b2cf520a6a2a2e Mon Sep 17 00:00:00 2001 From: Anders Kaseorg Date: Tue, 20 Dec 2022 15:09:45 -0800 Subject: [PATCH 5/5] Implement From> for Gc This is especially useful on nightly, where it works for unsized trait objects. Signed-off-by: Anders Kaseorg --- gc/src/gc.rs | 59 +++++++++++++++++++++++++++++++++++++++++++- gc/src/lib.rs | 13 ++++++++++ gc/tests/from_box.rs | 20 +++++++++++++++ 3 files changed, 91 insertions(+), 1 deletion(-) create mode 100644 gc/tests/from_box.rs diff --git a/gc/src/gc.rs b/gc/src/gc.rs index 7d72dbc..58cb3c2 100644 --- a/gc/src/gc.rs +++ b/gc/src/gc.rs @@ -1,8 +1,13 @@ +use crate::set_data_ptr; use crate::trace::Trace; +use std::alloc::{alloc, dealloc, Layout}; use std::cell::{Cell, RefCell}; use std::mem; use std::ptr::{self, NonNull}; +#[cfg(feature = "nightly")] +use std::marker::Unsize; + struct GcState { stats: GcStats, config: GcConfig, @@ -103,7 +108,7 @@ impl GcBoxHeader { } } -#[repr(C)] // to justify the layout computation in Gc::from_raw +#[repr(C)] // to justify the layout computations in GcBox::from_box, Gc::from_raw pub(crate) struct GcBox { header: GcBoxHeader, data: T, @@ -125,6 +130,58 @@ impl GcBox { } } +impl< + #[cfg(not(feature = "nightly"))] T: Trace, + #[cfg(feature = "nightly")] T: Trace + Unsize + ?Sized, + > GcBox +{ + /// Consumes a `Box`, moving the value inside into a new `GcBox` + /// on the heap. Adds the new `GcBox` to the thread-local `GcBox` + /// chain. This might trigger a collection. + /// + /// A `GcBox` allocated this way starts its life rooted. + pub(crate) fn from_box(value: Box) -> NonNull { + let header_layout = Layout::new::(); + let value_layout = Layout::for_value::(&*value); + // This relies on GcBox being #[repr(C)]. + let gcbox_layout = header_layout.extend(value_layout).unwrap().0.pad_to_align(); + + unsafe { + // Allocate the GcBox in a way that's compatible with Box, + // since the collector will deallocate it via + // Box::from_raw. + let gcbox_addr = alloc(gcbox_layout); + + // Since we're not allowed to move the value out of an + // active Box, and we will need to deallocate the Box + // without calling the destructor, convert it to a raw + // pointer first. + let value = Box::into_raw(value); + + // Create a pointer with the metadata of value and the + // address and provenance of the GcBox. + let gcbox = set_data_ptr(value as *mut GcBox, gcbox_addr); + + // Move the data. + ptr::addr_of_mut!((*gcbox).header).write(GcBoxHeader::new()); + ptr::addr_of_mut!((*gcbox).data) + .cast::() + .copy_from_nonoverlapping(value.cast::(), value_layout.size()); + + // Deallocate the former Box. (Box only allocates for size + // != 0.) + if value_layout.size() != 0 { + dealloc(value.cast::(), value_layout); + } + + // Add the new GcBox to the chain and return it. + let gcbox = NonNull::new_unchecked(gcbox); + insert_gcbox(gcbox); + gcbox + } + } +} + /// Add a new `GcBox` to the current thread's `GcBox` chain. This /// might trigger a collection first if enough bytes have been /// allocated since the previous collection. diff --git a/gc/src/lib.rs b/gc/src/lib.rs index 19e09a5..927705a 100644 --- a/gc/src/lib.rs +++ b/gc/src/lib.rs @@ -379,6 +379,19 @@ impl From for Gc { } } +impl< + #[cfg(not(feature = "nightly"))] T: Trace, + #[cfg(feature = "nightly")] T: Trace + Unsize + ?Sized, + > From> for Gc +{ + /// Moves a boxed value into a new garbage-collected + /// allocation. If the `nightly` crate feature is enabled, the + /// value may be an unsized trait object. + fn from(v: Box) -> Gc { + unsafe { Gc::from_gcbox(GcBox::from_box(v)) } + } +} + impl std::borrow::Borrow for Gc { fn borrow(&self) -> &T { self diff --git a/gc/tests/from_box.rs b/gc/tests/from_box.rs new file mode 100644 index 0000000..567b7b5 --- /dev/null +++ b/gc/tests/from_box.rs @@ -0,0 +1,20 @@ +use gc::{Finalize, Gc, Trace}; + +trait Foo: Trace {} + +#[derive(Trace, Finalize)] +struct Bar; +impl Foo for Bar {} + +#[test] +fn test_from_box_sized() { + let b: Box<[i32; 3]> = Box::new([1, 2, 3]); + let _: Gc<[i32; 3]> = Gc::from(b); +} + +#[cfg(feature = "nightly")] +#[test] +fn test_from_box_dyn() { + let b: Box = Box::new(Bar); + let _: Gc = Gc::from(b); +}