pub use crate::operator::EvalContextExt as OperatorEvalContextExt;
pub use crate::range_map::RangeMap;
pub use crate::stacked_borrows::{
- stack::Stack, CallId, EvalContextExt as StackedBorEvalContextExt, Item, Permission, PtrId,
- SbTag, SbTagExtra, Stacks,
+ stack::Stack, CallId, EvalContextExt as StackedBorEvalContextExt, Item, Permission, SbTag,
+ SbTagExtra, Stacks,
};
pub use crate::sync::{CondvarId, EvalContextExt as SyncEvalContextExt, MutexId, RwLockId};
pub use crate::thread::{
pub mod stack;
use stack::Stack;
-pub type PtrId = NonZeroU64;
pub type CallId = NonZeroU64;
// Even reading memory can have effects on the stack, so we need a `RefCell` here.
)
})?;
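A minimal sketch of why the `RefCell` is needed, with stand-in types (a `Vec` of permission names instead of Miri's `Stacks`): during a read, the allocation extra is only reachable through a shared reference, yet the read itself must mutate the stack.

use std::cell::RefCell;

// Hypothetical, simplified stand-in for Miri's per-allocation extra data.
struct AllocExtra {
    stacked_borrows: Option<RefCell<Vec<&'static str>>>,
}

fn on_read(extra: &AllocExtra) {
    if let Some(stacks) = &extra.stacked_borrows {
        // Only a shared reference to `extra`, but the RefCell still lets the
        // read update the stack (e.g. remove or disable `Unique` items).
        stacks.borrow_mut().retain(|item| *item != "Unique");
    }
}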
- // Step 2: Remove all items. Also checks for protectors.
+ // Step 2: Consider all items removed. This checks for protectors.
for idx in (0..self.len()).rev() {
let item = self.get(idx).unwrap();
Stack::item_popped(&item, None, global, alloc_history)?;
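A sketch of the protector check this step performs for each item; the types and names below are simplified stand-ins, not Miri's API. Removing an item whose protector belongs to a still-active call is undefined behavior.

use std::collections::HashSet;

// Simplified stand-ins: protectors are call IDs, and `live_calls` tracks the
// calls that are still running.
fn check_protector(protector: Option<u64>, live_calls: &HashSet<u64>) -> Result<(), String> {
    if let Some(call) = protector {
        if live_calls.contains(&call) {
            return Err(format!("deallocation is UB: item is protected by active call {call}"));
        }
    }
    Ok(())
}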
/// Creates new stack with initial tag.
fn new(size: Size, perm: Permission, tag: SbTag) -> Self {
let item = Item { perm, tag, protector: None };
-
let stack = Stack::new(item);
+
Stacks {
stacks: RangeMap::new(size, stack),
history: AllocHistory::new(),
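To illustrate `RangeMap::new(size, stack)`: a toy version of the range-map idea (not Miri's implementation), where a single value initially covers the whole allocation and ranges only split once sub-ranges diverge.

use std::ops::Range;

// Toy range map: each segment maps a byte range to one shared value.
struct ToyRangeMap<T> {
    segments: Vec<(Range<u64>, T)>,
}

impl<T: Clone> ToyRangeMap<T> {
    fn new(size: u64, init: T) -> Self {
        // A fresh allocation needs only one segment covering every byte.
        ToyRangeMap { segments: vec![(0..size, init)] }
    }
}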
// We have to use shared references to alloc/memory_extra here since
// `visit_freeze_sensitive` needs to access the global state.
let extra = this.get_alloc_extra(alloc_id)?;
-
let mut stacked_borrows = extra
.stacked_borrows
.as_ref()
.expect("we should have Stacked Borrows data")
.borrow_mut();
- let mut current_span = this.machine.current_span();
-
this.visit_freeze_sensitive(place, size, |mut range, frozen| {
// Adjust range.
range.start += base_offset;
item,
(alloc_id, range, offset),
&mut global,
- &mut current_span,
+ current_span,
history,
exposed_tags,
)
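The span threading above suggests a lazily computed current span; the sketch below shows that general pattern under this assumption. `LazySpan`, its fields, and `u32` spans are illustrative stand-ins, not Miri's actual `CurrentSpan` API.

// Hypothetical lazy span: the potentially expensive walk over the frame stack
// only happens if the span is actually needed, and at most once.
#[derive(Clone)]
struct LazySpan<'a> {
    frames: &'a [u32], // stand-in for the machine's stack frames
    cached: Option<u32>,
}

impl<'a> LazySpan<'a> {
    fn get(&mut self) -> u32 {
        *self.cached.get_or_insert_with(|| self.frames.last().copied().unwrap_or(0))
    }
}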
/// we never have the unknown-to-known boundary in an SRW group.
unknown_bottom: Option<SbTag>,
- /// A small LRU cache of searches of the borrow stack. This only caches accesses of `Tagged`,
- /// because those are unique in the stack.
+ /// A small LRU cache of searches of the borrow stack.
#[cfg(feature = "stack-cache")]
cache: StackCache,
/// On a read, we need to disable all `Unique` above the granting item; we can avoid most
/// of that work by caching the range in which the `Unique` items live.
///
/// Any use of this cache still requires a probably-cold random access into the borrow
/// stack to figure out what `Permission` an `SbTag` grants. We could avoid this by also
/// storing the `Permission` in the cache, but most lookups into the cache are
/// immediately followed by an access of the full borrow stack anyway.
+///
+/// It may seem like maintaining this cache is a waste for small stacks, but
+/// (a) iterating over small fixed-size arrays is super fast, and (b) empirically this helps *a lot*,
+/// probably because runtime is dominated by large stacks.
#[cfg(feature = "stack-cache")]
#[derive(Clone, Debug)]
struct StackCache {
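A self-contained sketch of the cache described above, with stand-in types (`u64` tags) and an arbitrary size: it maps the most recently used tags to their positions in the borrow stack, so a hit replaces a linear scan with one random access.

const CACHE_LEN: usize = 32; // illustrative size, chosen arbitrarily here

// Parallel fixed-size arrays: slot 0 is the most recently used entry.
struct TagCache {
    tags: [u64; CACHE_LEN],
    idx: [usize; CACHE_LEN],
}

impl TagCache {
    // On a hit, return the cached position in the borrow stack. The caller
    // still has to read the stack at that position to learn the Permission.
    fn lookup(&self, tag: u64) -> Option<usize> {
        self.tags.iter().position(|&t| t == tag).map(|slot| self.idx[slot])
    }
}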
/// - There are no Unique tags outside of first_unique..last_unique
#[cfg(feature = "expensive-debug-assertions")]
fn verify_cache_consistency(&self) {
- if self.borrows.len() > CACHE_LEN {
+ // Only a full cache needs to be valid. Also see the comments in find_granting_cache
+ // and set_unknown_bottom.
+ if self.borrows.len() >= CACHE_LEN {
for (tag, stack_idx) in self.cache.tags.iter().zip(self.cache.idx.iter()) {
assert_eq!(self.borrows[*stack_idx].tag, *tag);
}
}
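Stated as a free function over stand-in types, the invariant checked above is: once the stack is at least as long as the cache, every cache slot must point at a stack item carrying the cached tag; shorter stacks are allowed to leave stale slots behind.

fn verify(tags: &[u64], idx: &[usize], stack_tags: &[u64], cache_len: usize) {
    if stack_tags.len() >= cache_len {
        for (tag, &pos) in tags.iter().zip(idx.iter()) {
            assert_eq!(stack_tags[pos], *tag, "cache points at a stale stack slot");
        }
    }
}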
// If we didn't find the tag in the cache, fall back to a linear search of the
- // whole stack, and add the tag to the stack.
+ // whole stack, and add the tag to the cache.
for (stack_idx, item) in self.borrows.iter().enumerate().rev() {
if tag == item.tag && item.perm.grants(access) {
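A sketch of that fallback in isolation (stand-in types: a tag plus a grants flag instead of `Item`): scan the whole stack from the top, and hand the hit's position back so it can also be recorded in the cache.

// Returns the position of the topmost item with this tag that grants the
// access, scanning the whole stack from the top.
fn find_granting_slow(borrows: &[(u64, bool)], tag: u64) -> Option<usize> {
    for (i, &(t, grants)) in borrows.iter().enumerate().rev() {
        if t == tag && grants {
            return Some(i);
        }
    }
    None
}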
#[cfg(feature = "stack-cache")]
// If we found the tag, look up its position in the stack to see if it grants
// the required permission
if self.borrows[stack_idx].perm.grants(access) {
- // If it does, and it's not already in the most-recently-used position, move it there.
- // Except if the tag is in position 1, this is equivalent to just a swap, so do that.
+ // If it does, and it's not already in the most-recently-used position, re-insert it at
+ // the most-recently-used position. This technically reduces the efficiency of the
+ // cache by duplicating elements, but current benchmarks do not seem to benefit from
+ // avoiding this duplication.
+ // But if the tag is in position 1, avoiding the duplicating add is trivial.
if cache_idx == 1 {
self.cache.tags.swap(0, 1);
self.cache.idx.swap(0, 1);
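The move-to-front logic in isolation, over the stand-in arrays from the cache sketch above: slot 1 is the special case where re-insertion reduces to a swap, while deeper hits shift the whole prefix down and leave a duplicate behind.

fn touch(tags: &mut [u64; CACHE_LEN], idx: &mut [usize; CACHE_LEN], slot: usize) {
    match slot {
        0 => {} // already most recently used
        1 => {
            // Re-inserting from slot 1 is exactly a swap, so no duplicate is made.
            tags.swap(0, 1);
            idx.swap(0, 1);
        }
        _ => {
            let (tag, pos) = (tags[slot], idx[slot]);
            // Shift everything down one slot and put the hit in front. The old
            // copy survives at `slot + 1` (or falls off the end); tolerating
            // the duplicate is cheaper than removing it.
            tags.copy_within(0..CACHE_LEN - 1, 1);
            idx.copy_within(0..CACHE_LEN - 1, 1);
            tags[0] = tag;
            idx[0] = pos;
        }
    }
}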
let unique_range = 0..self.len();
if disable_start <= unique_range.end {
- // add 1 so we don't disable the granting item
let lower = unique_range.start.max(disable_start);
let upper = (unique_range.end + 1).min(self.borrows.len());
for item in &mut self.borrows[lower..upper] {
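Finally, the semantic effect this loop implements, sketched over a plain permission slice (a hypothetical `Perm` enum, not Miri's `Permission`): a read access downgrades every `Unique` item strictly above the granting one to `Disabled`, so later writes through those tags are rejected.

#[derive(PartialEq)]
enum Perm { Unique, SharedReadOnly, Disabled }

fn disable_uniques_above(perms: &mut [Perm], granting: usize) {
    // `granting + 1` keeps the granting item itself enabled.
    for p in &mut perms[granting + 1..] {
        if *p == Perm::Unique {
            *p = Perm::Disabled;
        }
    }
}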