src/data_race.rs

   1 //! Implementation of a data-race detector using Lamport Timestamps / Vector-clocks
   2 //! based on the Dynamic Race Detection for C++:
   3 //! https://www.doc.ic.ac.uk/~afd/homepages/papers/pdfs/2017/POPL.pdf
   4 //! which does not report false-positives when fences are used, and gives better
   5 //! accuracy in presence of read-modify-write operations.
   6 //!
   7 //! The implementation contains modifications to correctly model the changes to the memory model in C++20
   8 //! regarding the weakening of release sequences: http://www.open-std.org/jtc1/sc22/wg21/docs/papers/2018/p0982r1.html.
   9 //! Relaxed stores now unconditionally block all currently active release sequences and so per-thread tracking of release
  10 //! sequences is not needed.
  11 //!
  12 //! The implementation also models races with memory allocation and deallocation via treating allocation and
  13 //! deallocation as a type of write internally for detecting data-races.
  14 //!
//! This does not explore weak memory orders and so can still miss data-races,
//! but it should not report false-positives.
  17 //!
//! Data-race definition (from https://en.cppreference.com/w/cpp/language/memory_model#Threads_and_data_races):
  19 //! a data race occurs between two memory accesses if they are on different threads, at least one operation
  20 //! is non-atomic, at least one operation is a write and neither access happens-before the other. Read the link
  21 //! for full definition.
  22 //!
  23 //! This re-uses vector indexes for threads that are known to be unable to report data-races, this is valid
  24 //! because it only re-uses vector indexes once all currently-active (not-terminated) threads have an internal
  25 //! vector clock that happens-after the join operation of the candidate thread. Threads that have not been joined
  26 //! on are not considered. Since the thread's vector clock will only increase and a data-race implies that
  27 //! there is some index x where clock[x] > thread_clock, when this is true clock[candidate-idx] > thread_clock
  28 //! can never hold and hence a data-race can never be reported in that vector index again.
  29 //! This means that the thread-index can be safely re-used, starting on the next timestamp for the newly created
  30 //! thread.
  31 //!
  32 //! The sequentially consistent ordering corresponds to the ordering that the threads
  33 //! are currently scheduled, this means that the data-race detector has no additional
  34 //! logic for sequentially consistent accesses at the moment since they are indistinguishable
  35 //! from acquire/release operations. If weak memory orderings are explored then this
  36 //! may need to change or be updated accordingly.
  37 //!
  38 //! Per the C++ spec for the memory model a sequentially consistent operation:
  39 //!   "A load operation with this memory order performs an acquire operation,
  40 //!    a store performs a release operation, and read-modify-write performs
  41 //!    both an acquire operation and a release operation, plus a single total
  42 //!    order exists in which all threads observe all modifications in the same
  43 //!    order (see Sequentially-consistent ordering below) "
//! So in the absence of weak memory effects a seq-cst load & a seq-cst store are identical
//! to an acquire load and a release store given the global sequentially consistent order
//! of the schedule.
  47 //!
  48 //! The timestamps used in the data-race detector assign each sequence of non-atomic operations
  49 //! followed by a single atomic or concurrent operation a single timestamp.
  50 //! Write, Read, Write, ThreadJoin will be represented by a single timestamp value on a thread.
  51 //! This is because extra increment operations between the operations in the sequence are not
  52 //! required for accurate reporting of data-race values.
  53 //!
//! As per the paper a thread's timestamp is only incremented after a release operation is performed,
//! so some atomic operations that only perform acquires do not increment the timestamp. Due to shared
//! code some atomic operations may increment the timestamp when not necessary, but this has no effect
//! on the data-race detection code.
  58 //!
  59 //! FIXME:
  60 //! currently we have our own local copy of the currently active thread index and names, this is due
  61 //! in part to the inability to access the current location of threads.active_thread inside the AllocExtra
  62 //! read, write and deallocate functions and should be cleaned up in the future.
  63
  64 use std::{
  65     cell::{Cell, Ref, RefCell, RefMut},
  66     fmt::Debug,
  67     mem,
  68     rc::Rc,
  69 };
  70
  71 use rustc_data_structures::fx::{FxHashMap, FxHashSet};
  72 use rustc_index::vec::{Idx, IndexVec};
  73 use rustc_middle::{mir, ty::layout::TyAndLayout};
  74 use rustc_target::abi::Size;
  75
  76 use crate::{
  77     ImmTy, Immediate, InterpResult, MPlaceTy, MemPlaceMeta, MiriEvalContext, MiriEvalContextExt,
  78     OpTy, Pointer, RangeMap, Scalar, ScalarMaybeUninit, Tag, ThreadId, VClock, VTimestamp,
  79     VectorIdx, MemoryKind, MiriMemoryKind
  80 };
  81
  82 pub type AllocExtra = VClockAlloc;
  83 pub type MemoryExtra = Rc<GlobalState>;
  84
  85 /// Valid atomic read-write operations, alias of atomic::Ordering (not non-exhaustive).
  86 #[derive(Copy, Clone, PartialEq, Eq, Debug)]
  87 pub enum AtomicRwOp {
  88     Relaxed,
  89     Acquire,
  90     Release,
  91     AcqRel,
  92     SeqCst,
  93 }
  94
  95 /// Valid atomic read operations, subset of atomic::Ordering.
  96 #[derive(Copy, Clone, PartialEq, Eq, Debug)]
  97 pub enum AtomicReadOp {
  98     Relaxed,
  99     Acquire,
 100     SeqCst,
 101 }
 102
 103 /// Valid atomic write operations, subset of atomic::Ordering.
 104 #[derive(Copy, Clone, PartialEq, Eq, Debug)]
 105 pub enum AtomicWriteOp {
 106     Relaxed,
 107     Release,
 108     SeqCst,
 109 }
 110
 111 /// Valid atomic fence operations, subset of atomic::Ordering.
 112 #[derive(Copy, Clone, PartialEq, Eq, Debug)]
 113 pub enum AtomicFenceOp {
 114     Acquire,
 115     Release,
 116     AcqRel,
 117     SeqCst,
 118 }
 119
/// The current set of vector clocks describing the state
/// of a thread: the happens-before clock plus the
/// additional clocks needed to model atomic fence operations.
#[derive(Clone, Default, Debug)]
struct ThreadClockSet {
    /// The increasing clock representing timestamps
    /// that happen-before this thread.
    clock: VClock,

    /// The set of timestamps that will happen-before this
    /// thread once it performs an acquire fence.
    /// Relaxed atomic loads join the cell's sync vector into this
    /// clock; `apply_acquire_fence` joins it into `clock`.
    fence_acquire: VClock,

    /// The last timestamp of happens-before relations that
    /// have been released by this thread by a fence.
    /// `apply_release_fence` overwrites it with a copy of `clock`.
    fence_release: VClock,
}
 137
 138 impl ThreadClockSet {
 139     /// Apply the effects of a release fence to this
 140     /// set of thread vector clocks.
 141     #[inline]
 142     fn apply_release_fence(&mut self) {
 143         self.fence_release.clone_from(&self.clock);
 144     }
 145
 146     /// Apply the effects of a acquire fence to this
 147     /// set of thread vector clocks.
 148     #[inline]
 149     fn apply_acquire_fence(&mut self) {
 150         self.clock.join(&self.fence_acquire);
 151     }
 152
 153     /// Increment the happens-before clock at a
 154     /// known index.
 155     #[inline]
 156     fn increment_clock(&mut self, index: VectorIdx) {
 157         self.clock.increment_index(index);
 158     }
 159
 160     /// Join the happens-before clock with that of
 161     /// another thread, used to model thread join
 162     /// operations.
 163     fn join_with(&mut self, other: &ThreadClockSet) {
 164         self.clock.join(&other.clock);
 165     }
 166 }
 167
 168 /// Error returned by finding a data race
 169 /// should be elaborated upon.
 170 #[derive(Copy, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Debug)]
 171 pub struct DataRace;
 172
/// Externally stored memory cell clocks,
/// kept separate explicitly to reduce memory usage for the
/// common case where no atomic operations
/// exist on the memory cell.
#[derive(Clone, PartialEq, Eq, Default, Debug)]
struct AtomicMemoryCellClocks {
    /// The clock-vector of the timestamp of the last atomic
    /// read operation performed by each thread.
    /// This detects potential data-races between atomic read
    /// and non-atomic write operations.
    read_vector: VClock,

    /// The clock-vector of the timestamp of the last atomic
    /// write operation performed by each thread.
    /// This detects potential data-races between atomic write
    /// and non-atomic read or write operations.
    write_vector: VClock,

    /// Synchronization vector for acquire-release semantics;
    /// contains the vector of timestamps that will
    /// happen-before a thread if an acquire-load is
    /// performed on the data.
    sync_vector: VClock,
}
 197
 198 /// Type of write operation: allocating memory
 199 /// non-atomic writes and deallocating memory
 200 /// are all treated as writes for the purpose
 201 /// of the data-race detector.
 202 #[derive(Copy, Clone, PartialEq, Eq, Debug)]
 203 enum WriteType {
 204     /// Allocate memory.
 205     Allocate,
 206
 207     /// Standard unsynchronized write.
 208     Write,
 209
 210     /// Deallocate memory.
 211     /// Note that when memory is deallocated first, later non-atomic accesses
 212     /// will be reported as use-after-free, not as data races.
 213     /// (Same for `Allocate` above.)
 214     Deallocate,
 215 }
 216 impl WriteType {
 217     fn get_descriptor(self) -> &'static str {
 218         match self {
 219             WriteType::Allocate => "Allocate",
 220             WriteType::Write => "Write",
 221             WriteType::Deallocate => "Deallocate",
 222         }
 223     }
 224 }
 225
/// Memory cell vector clock metadata
/// for data-race detection.
#[derive(Clone, PartialEq, Eq, Debug)]
struct MemoryCellClocks {
    /// The vector-clock timestamp of the last write,
    /// corresponding to the writing thread's timestamp.
    write: VTimestamp,

    /// The identifier of the vector index, corresponding to a thread
    /// that performed the last write operation.
    write_index: VectorIdx,

    /// The type of operation that the write index represents:
    /// either newly allocated memory, a non-atomic write or
    /// a deallocation of memory.
    write_type: WriteType,

    /// The vector-clock of the timestamp of the last read operation
    /// performed by a thread since the last write operation occurred.
    /// It is reset to zero on each write operation.
    read: VClock,

    /// Atomic acquire & release sequence tracking clocks.
    /// For non-atomic memory in the common case this
    /// value is set to None; it is created on demand by `atomic_mut`.
    atomic_ops: Option<Box<AtomicMemoryCellClocks>>,
}
 253
 254 impl MemoryCellClocks {
 255     /// Create a new set of clocks representing memory allocated
 256     ///  at a given vector timestamp and index.
 257     fn new(alloc: VTimestamp, alloc_index: VectorIdx) -> Self {
 258         MemoryCellClocks {
 259             read: VClock::default(),
 260             write: alloc,
 261             write_index: alloc_index,
 262             write_type: WriteType::Allocate,
 263             atomic_ops: None,
 264         }
 265     }
 266
 267     /// Load the internal atomic memory cells if they exist.
 268     #[inline]
 269     fn atomic(&self) -> Option<&AtomicMemoryCellClocks> {
 270         match &self.atomic_ops {
 271             Some(op) => Some(&*op),
 272             None => None,
 273         }
 274     }
 275
 276     /// Load or create the internal atomic memory metadata
 277     /// if it does not exist.
 278     #[inline]
 279     fn atomic_mut(&mut self) -> &mut AtomicMemoryCellClocks {
 280         self.atomic_ops.get_or_insert_with(Default::default)
 281     }
 282
 283     /// Update memory cell data-race tracking for atomic
 284     /// load acquire semantics, is a no-op if this memory was
 285     /// not used previously as atomic memory.
 286     fn load_acquire(
 287         &mut self,
 288         clocks: &mut ThreadClockSet,
 289         index: VectorIdx,
 290     ) -> Result<(), DataRace> {
 291         self.atomic_read_detect(clocks, index)?;
 292         if let Some(atomic) = self.atomic() {
 293             clocks.clock.join(&atomic.sync_vector);
 294         }
 295         Ok(())
 296     }
 297
 298     /// Update memory cell data-race tracking for atomic
 299     /// load relaxed semantics, is a no-op if this memory was
 300     /// not used previously as atomic memory.
 301     fn load_relaxed(
 302         &mut self,
 303         clocks: &mut ThreadClockSet,
 304         index: VectorIdx,
 305     ) -> Result<(), DataRace> {
 306         self.atomic_read_detect(clocks, index)?;
 307         if let Some(atomic) = self.atomic() {
 308             clocks.fence_acquire.join(&atomic.sync_vector);
 309         }
 310         Ok(())
 311     }
 312
 313     /// Update the memory cell data-race tracking for atomic
 314     /// store release semantics.
 315     fn store_release(&mut self, clocks: &ThreadClockSet, index: VectorIdx) -> Result<(), DataRace> {
 316         self.atomic_write_detect(clocks, index)?;
 317         let atomic = self.atomic_mut();
 318         atomic.sync_vector.clone_from(&clocks.clock);
 319         Ok(())
 320     }
 321
 322     /// Update the memory cell data-race tracking for atomic
 323     /// store relaxed semantics.
 324     fn store_relaxed(&mut self, clocks: &ThreadClockSet, index: VectorIdx) -> Result<(), DataRace> {
 325         self.atomic_write_detect(clocks, index)?;
 326
 327         // The handling of release sequences was changed in C++20 and so
 328         // the code here is different to the paper since now all relaxed
 329         // stores block release sequences. The exception for same-thread
 330         // relaxed stores has been removed.
 331         let atomic = self.atomic_mut();
 332         atomic.sync_vector.clone_from(&clocks.fence_release);
 333         Ok(())
 334     }
 335
 336     /// Update the memory cell data-race tracking for atomic
 337     /// store release semantics for RMW operations.
 338     fn rmw_release(&mut self, clocks: &ThreadClockSet, index: VectorIdx) -> Result<(), DataRace> {
 339         self.atomic_write_detect(clocks, index)?;
 340         let atomic = self.atomic_mut();
 341         atomic.sync_vector.join(&clocks.clock);
 342         Ok(())
 343     }
 344
 345     /// Update the memory cell data-race tracking for atomic
 346     /// store relaxed semantics for RMW operations.
 347     fn rmw_relaxed(&mut self, clocks: &ThreadClockSet, index: VectorIdx) -> Result<(), DataRace> {
 348         self.atomic_write_detect(clocks, index)?;
 349         let atomic = self.atomic_mut();
 350         atomic.sync_vector.join(&clocks.fence_release);
 351         Ok(())
 352     }
 353
 354     /// Detect data-races with an atomic read, caused by a non-atomic write that does
 355     /// not happen-before the atomic-read.
 356     fn atomic_read_detect(
 357         &mut self,
 358         clocks: &ThreadClockSet,
 359         index: VectorIdx,
 360     ) -> Result<(), DataRace> {
 361         log::trace!("Atomic read with vectors: {:#?} :: {:#?}", self, clocks);
 362         if self.write <= clocks.clock[self.write_index] {
 363             let atomic = self.atomic_mut();
 364             atomic.read_vector.set_at_index(&clocks.clock, index);
 365             Ok(())
 366         } else {
 367             Err(DataRace)
 368         }
 369     }
 370
 371     /// Detect data-races with an atomic write, either with a non-atomic read or with
 372     /// a non-atomic write.
 373     fn atomic_write_detect(
 374         &mut self,
 375         clocks: &ThreadClockSet,
 376         index: VectorIdx,
 377     ) -> Result<(), DataRace> {
 378         log::trace!("Atomic write with vectors: {:#?} :: {:#?}", self, clocks);
 379         if self.write <= clocks.clock[self.write_index] && self.read <= clocks.clock {
 380             let atomic = self.atomic_mut();
 381             atomic.write_vector.set_at_index(&clocks.clock, index);
 382             Ok(())
 383         } else {
 384             Err(DataRace)
 385         }
 386     }
 387
 388     /// Detect races for non-atomic read operations at the current memory cell
 389     /// returns true if a data-race is detected.
 390     fn read_race_detect(
 391         &mut self,
 392         clocks: &ThreadClockSet,
 393         index: VectorIdx,
 394     ) -> Result<(), DataRace> {
 395         log::trace!("Unsynchronized read with vectors: {:#?} :: {:#?}", self, clocks);
 396         if self.write <= clocks.clock[self.write_index] {
 397             let race_free = if let Some(atomic) = self.atomic() {
 398                 atomic.write_vector <= clocks.clock
 399             } else {
 400                 true
 401             };
 402             if race_free {
 403                 self.read.set_at_index(&clocks.clock, index);
 404                 Ok(())
 405             } else {
 406                 Err(DataRace)
 407             }
 408         } else {
 409             Err(DataRace)
 410         }
 411     }
 412
 413     /// Detect races for non-atomic write operations at the current memory cell
 414     /// returns true if a data-race is detected.
 415     fn write_race_detect(
 416         &mut self,
 417         clocks: &ThreadClockSet,
 418         index: VectorIdx,
 419         write_type: WriteType,
 420     ) -> Result<(), DataRace> {
 421         log::trace!("Unsynchronized write with vectors: {:#?} :: {:#?}", self, clocks);
 422         if self.write <= clocks.clock[self.write_index] && self.read <= clocks.clock {
 423             let race_free = if let Some(atomic) = self.atomic() {
 424                 atomic.write_vector <= clocks.clock && atomic.read_vector <= clocks.clock
 425             } else {
 426                 true
 427             };
 428             if race_free {
 429                 self.write = clocks.clock[index];
 430                 self.write_index = index;
 431                 self.write_type = write_type;
 432                 self.read.set_zero_vector();
 433                 Ok(())
 434             } else {
 435                 Err(DataRace)
 436             }
 437         } else {
 438             Err(DataRace)
 439         }
 440     }
 441 }
 442
 443 /// Evaluation context extensions.
 444 impl<'mir, 'tcx: 'mir> EvalContextExt<'mir, 'tcx> for MiriEvalContext<'mir, 'tcx> {}
 445 pub trait EvalContextExt<'mir, 'tcx: 'mir>: MiriEvalContextExt<'mir, 'tcx> {
    /// Atomic variant of read_scalar_at_offset.
    ///
    /// Dereferences `op`, selects the sub-place with layout `layout`
    /// located `offset` bytes into the pointee, and reads it via
    /// `read_scalar_atomic` with the ordering `atomic`.
    ///
    /// Panics if `offset + layout.size` exceeds the size of the pointee's layout.
    fn read_scalar_at_offset_atomic(
        &self,
        op: &OpTy<'tcx, Tag>,
        offset: u64,
        layout: TyAndLayout<'tcx>,
        atomic: AtomicReadOp,
    ) -> InterpResult<'tcx, ScalarMaybeUninit<Tag>> {
        let this = self.eval_context_ref();
        let op_place = this.deref_operand(op)?;
        let offset = Size::from_bytes(offset);

        // Ensure that the following read at an offset is within bounds.
        assert!(op_place.layout.size >= offset + layout.size);
        let value_place = op_place.offset(offset, MemPlaceMeta::None, layout, this)?;
        this.read_scalar_atomic(&value_place, atomic)
    }
 463
    /// Atomic variant of write_scalar_at_offset.
    ///
    /// Dereferences `op`, selects the sub-place with layout `layout`
    /// located `offset` bytes into the pointee, and stores `value` there
    /// via `write_scalar_atomic` with the ordering `atomic`.
    ///
    /// Panics if `offset + layout.size` exceeds the size of the pointee's layout.
    fn write_scalar_at_offset_atomic(
        &mut self,
        op: &OpTy<'tcx, Tag>,
        offset: u64,
        value: impl Into<ScalarMaybeUninit<Tag>>,
        layout: TyAndLayout<'tcx>,
        atomic: AtomicWriteOp,
    ) -> InterpResult<'tcx> {
        let this = self.eval_context_mut();
        let op_place = this.deref_operand(op)?;
        let offset = Size::from_bytes(offset);

        // Ensure that the following write at an offset is within bounds.
        assert!(op_place.layout.size >= offset + layout.size);
        let value_place = op_place.offset(offset, MemPlaceMeta::None, layout, this)?;
        this.write_scalar_atomic(value.into(), &value_place, atomic)
    }
 482
 483     /// Perform an atomic read operation at the memory location.
 484     fn read_scalar_atomic(
 485         &self,
 486         place: &MPlaceTy<'tcx, Tag>,
 487         atomic: AtomicReadOp,
 488     ) -> InterpResult<'tcx, ScalarMaybeUninit<Tag>> {
 489         let this = self.eval_context_ref();
 490         let scalar = this.allow_data_races_ref(move |this| this.read_scalar(&place.into()))?;
 491         self.validate_atomic_load(place, atomic)?;
 492         Ok(scalar)
 493     }
 494
 495     /// Perform an atomic write operation at the memory location.
 496     fn write_scalar_atomic(
 497         &mut self,
 498         val: ScalarMaybeUninit<Tag>,
 499         dest: &MPlaceTy<'tcx, Tag>,
 500         atomic: AtomicWriteOp,
 501     ) -> InterpResult<'tcx> {
 502         let this = self.eval_context_mut();
 503         this.allow_data_races_mut(move |this| this.write_scalar(val, &(*dest).into()))?;
 504         self.validate_atomic_store(dest, atomic)
 505     }
 506
 507     /// Perform a atomic operation on a memory location.
 508     fn atomic_op_immediate(
 509         &mut self,
 510         place: &MPlaceTy<'tcx, Tag>,
 511         rhs: &ImmTy<'tcx, Tag>,
 512         op: mir::BinOp,
 513         neg: bool,
 514         atomic: AtomicRwOp,
 515     ) -> InterpResult<'tcx, ImmTy<'tcx, Tag>> {
 516         let this = self.eval_context_mut();
 517
 518         let old = this.allow_data_races_mut(|this| this.read_immediate(&place.into()))?;
 519
 520         // Atomics wrap around on overflow.
 521         let val = this.binary_op(op, &old, rhs)?;
 522         let val = if neg { this.unary_op(mir::UnOp::Not, &val)? } else { val };
 523         this.allow_data_races_mut(|this| this.write_immediate(*val, &(*place).into()))?;
 524
 525         this.validate_atomic_rmw(place, atomic)?;
 526         Ok(old)
 527     }
 528
 529     /// Perform an atomic exchange with a memory place and a new
 530     /// scalar value, the old value is returned.
 531     fn atomic_exchange_scalar(
 532         &mut self,
 533         place: &MPlaceTy<'tcx, Tag>,
 534         new: ScalarMaybeUninit<Tag>,
 535         atomic: AtomicRwOp,
 536     ) -> InterpResult<'tcx, ScalarMaybeUninit<Tag>> {
 537         let this = self.eval_context_mut();
 538
 539         let old = this.allow_data_races_mut(|this| this.read_scalar(&place.into()))?;
 540         this.allow_data_races_mut(|this| this.write_scalar(new, &(*place).into()))?;
 541         this.validate_atomic_rmw(place, atomic)?;
 542         Ok(old)
 543     }
 544
 545     /// Perform an atomic compare and exchange at a given memory location.
 546     /// On success an atomic RMW operation is performed and on failure
 547     /// only an atomic read occurs. If `can_fail_spuriously` is true,
 548     /// then we treat it as a "compare_exchange_weak" operation, and
 549     /// some portion of the time fail even when the values are actually
 550     /// identical.
 551     fn atomic_compare_exchange_scalar(
 552         &mut self,
 553         place: &MPlaceTy<'tcx, Tag>,
 554         expect_old: &ImmTy<'tcx, Tag>,
 555         new: ScalarMaybeUninit<Tag>,
 556         success: AtomicRwOp,
 557         fail: AtomicReadOp,
 558         can_fail_spuriously: bool,
 559     ) -> InterpResult<'tcx, Immediate<Tag>> {
 560         use rand::Rng as _;
 561         let this = self.eval_context_mut();
 562
 563         // Failure ordering cannot be stronger than success ordering, therefore first attempt
 564         // to read with the failure ordering and if successful then try again with the success
 565         // read ordering and write in the success case.
 566         // Read as immediate for the sake of `binary_op()`
 567         let old = this.allow_data_races_mut(|this| this.read_immediate(&(place.into())))?;
 568         // `binary_op` will bail if either of them is not a scalar.
 569         let eq = this.overflowing_binary_op(mir::BinOp::Eq, &old, expect_old)?.0;
 570         // If the operation would succeed, but is "weak", fail some portion
 571         // of the time, based on `rate`.
 572         let rate = this.memory.extra.cmpxchg_weak_failure_rate;
 573         let cmpxchg_success = eq.to_bool()?
 574             && (!can_fail_spuriously || this.memory.extra.rng.borrow_mut().gen::<f64>() < rate);
 575         let res = Immediate::ScalarPair(
 576             old.to_scalar_or_uninit(),
 577             Scalar::from_bool(cmpxchg_success).into(),
 578         );
 579
 580         // Update ptr depending on comparison.
 581         // if successful, perform a full rw-atomic validation
 582         // otherwise treat this as an atomic load with the fail ordering.
 583         if cmpxchg_success {
 584             this.allow_data_races_mut(|this| this.write_scalar(new, &(*place).into()))?;
 585             this.validate_atomic_rmw(place, success)?;
 586         } else {
 587             this.validate_atomic_load(place, fail)?;
 588         }
 589
 590         // Return the old value.
 591         Ok(res)
 592     }
 593
 594     /// Update the data-race detector for an atomic read occurring at the
 595     /// associated memory-place and on the current thread.
 596     fn validate_atomic_load(
 597         &self,
 598         place: &MPlaceTy<'tcx, Tag>,
 599         atomic: AtomicReadOp,
 600     ) -> InterpResult<'tcx> {
 601         let this = self.eval_context_ref();
 602         this.validate_atomic_op(
 603             place,
 604             atomic,
 605             "Atomic Load",
 606             move |memory, clocks, index, atomic| {
 607                 if atomic == AtomicReadOp::Relaxed {
 608                     memory.load_relaxed(&mut *clocks, index)
 609                 } else {
 610                     memory.load_acquire(&mut *clocks, index)
 611                 }
 612             },
 613         )
 614     }
 615
 616     /// Update the data-race detector for an atomic write occurring at the
 617     /// associated memory-place and on the current thread.
 618     fn validate_atomic_store(
 619         &mut self,
 620         place: &MPlaceTy<'tcx, Tag>,
 621         atomic: AtomicWriteOp,
 622     ) -> InterpResult<'tcx> {
 623         let this = self.eval_context_ref();
 624         this.validate_atomic_op(
 625             place,
 626             atomic,
 627             "Atomic Store",
 628             move |memory, clocks, index, atomic| {
 629                 if atomic == AtomicWriteOp::Relaxed {
 630                     memory.store_relaxed(clocks, index)
 631                 } else {
 632                     memory.store_release(clocks, index)
 633                 }
 634             },
 635         )
 636     }
 637
 638     /// Update the data-race detector for an atomic read-modify-write occurring
 639     /// at the associated memory place and on the current thread.
 640     fn validate_atomic_rmw(
 641         &mut self,
 642         place: &MPlaceTy<'tcx, Tag>,
 643         atomic: AtomicRwOp,
 644     ) -> InterpResult<'tcx> {
 645         use AtomicRwOp::*;
 646         let acquire = matches!(atomic, Acquire | AcqRel | SeqCst);
 647         let release = matches!(atomic, Release | AcqRel | SeqCst);
 648         let this = self.eval_context_ref();
 649         this.validate_atomic_op(place, atomic, "Atomic RMW", move |memory, clocks, index, _| {
 650             if acquire {
 651                 memory.load_acquire(clocks, index)?;
 652             } else {
 653                 memory.load_relaxed(clocks, index)?;
 654             }
 655             if release {
 656                 memory.rmw_release(clocks, index)
 657             } else {
 658                 memory.rmw_relaxed(clocks, index)
 659             }
 660         })
 661     }
 662
 663     /// Update the data-race detector for an atomic fence on the current thread.
 664     fn validate_atomic_fence(&mut self, atomic: AtomicFenceOp) -> InterpResult<'tcx> {
 665         let this = self.eval_context_mut();
 666         if let Some(data_race) = &this.memory.extra.data_race {
 667             data_race.maybe_perform_sync_operation(move |index, mut clocks| {
 668                 log::trace!("Atomic fence on {:?} with ordering {:?}", index, atomic);
 669
 670                 // Apply data-race detection for the current fences
 671                 // this treats AcqRel and SeqCst as the same as a acquire
 672                 // and release fence applied in the same timestamp.
 673                 if atomic != AtomicFenceOp::Release {
 674                     // Either Acquire | AcqRel | SeqCst
 675                     clocks.apply_acquire_fence();
 676                 }
 677                 if atomic != AtomicFenceOp::Acquire {
 678                     // Either Release | AcqRel | SeqCst
 679                     clocks.apply_release_fence();
 680                 }
 681
 682                 // Increment timestamp in case of release semantics.
 683                 Ok(atomic != AtomicFenceOp::Acquire)
 684             })
 685         } else {
 686             Ok(())
 687         }
 688     }
 689
 690     fn reset_vector_clocks(
 691         &mut self,
 692         ptr: Pointer<Tag>,
 693         size: Size
 694     ) -> InterpResult<'tcx> {
 695         let this = self.eval_context_mut();
 696         if let Some(data_race) = &mut this.memory.extra.data_race {
 697             if data_race.multi_threaded.get() {
 698                 let alloc_meta = this.memory.get_raw_mut(ptr.alloc_id)?.extra.data_race.as_mut().unwrap();
 699                 alloc_meta.reset_clocks(ptr.offset, size);
 700             }
 701         }
 702         Ok(())
 703     }
 704 }
 705
/// Vector clock metadata for a logical memory allocation.
#[derive(Debug, Clone)]
pub struct VClockAlloc {
    /// Assigning each byte a MemoryCellClocks.
    /// Wrapped in a `RefCell` so the clocks can be updated
    /// through a shared reference to the allocation metadata.
    alloc_ranges: RefCell<RangeMap<MemoryCellClocks>>,

    /// Pointer to global state (a shared `Rc<GlobalState>`).
    global: MemoryExtra,
}
 715
 716 impl VClockAlloc {
 717     /// Create a new data-race detector for newly allocated memory.
 718     pub fn new_allocation(global: &MemoryExtra, len: Size, kind: MemoryKind<MiriMemoryKind>) -> VClockAlloc {
 719         let (alloc_timestamp, alloc_index) = match kind {
 720             // User allocated and stack memory should track allocation.
 721             MemoryKind::Machine(
 722                 MiriMemoryKind::Rust | MiriMemoryKind::C | MiriMemoryKind::WinHeap
 723             ) | MemoryKind::Stack => {
 724                 let (alloc_index, clocks) = global.current_thread_state();
 725                 let alloc_timestamp = clocks.clock[alloc_index];
 726                 (alloc_timestamp, alloc_index)
 727             }
 728             // Other global memory should trace races but be allocated at the 0 timestamp.
 729             MemoryKind::Machine(
 730                 MiriMemoryKind::Global | MiriMemoryKind::Machine | MiriMemoryKind::Env |
 731                 MiriMemoryKind::ExternStatic | MiriMemoryKind::Tls
 732             ) | MemoryKind::CallerLocation | MemoryKind::Vtable => {
 733                 (0, VectorIdx::MAX_INDEX)
 734             }
 735         };
 736         VClockAlloc {
 737             global: Rc::clone(global),
 738             alloc_ranges: RefCell::new(RangeMap::new(
 739                 len, MemoryCellClocks::new(alloc_timestamp, alloc_index)
 740             )),
 741         }
 742     }
 743
 744     fn reset_clocks(&mut self, offset: Size, len: Size) {
 745         let mut alloc_ranges = self.alloc_ranges.borrow_mut();
 746         for (_, range) in alloc_ranges.iter_mut(offset, len) {
 747             // Reset the portion of the range
 748             *range = MemoryCellClocks::new(0, VectorIdx::MAX_INDEX);
 749         }
 750     }
 751
 752     // Find an index, if one exists where the value
 753     // in `l` is greater than the value in `r`.
 754     fn find_gt_index(l: &VClock, r: &VClock) -> Option<VectorIdx> {
 755         log::trace!("Find index where not {:?} <= {:?}", l, r);
 756         let l_slice = l.as_slice();
 757         let r_slice = r.as_slice();
 758         l_slice
 759             .iter()
 760             .zip(r_slice.iter())
 761             .enumerate()
 762             .find_map(|(idx, (&l, &r))| if l > r { Some(idx) } else { None })
 763             .or_else(|| {
 764                 if l_slice.len() > r_slice.len() {
 765                     // By invariant, if l_slice is longer
 766                     // then one element must be larger.
 767                     // This just validates that this is true
 768                     // and reports earlier elements first.
 769                     let l_remainder_slice = &l_slice[r_slice.len()..];
 770                     let idx = l_remainder_slice
 771                         .iter()
 772                         .enumerate()
 773                         .find_map(|(idx, &r)| if r == 0 { None } else { Some(idx) })
 774                         .expect("Invalid VClock Invariant");
 775                     Some(idx + r_slice.len())
 776                 } else {
 777                     None
 778                 }
 779             })
 780             .map(|idx| VectorIdx::new(idx))
 781     }
 782
 783     /// Report a data-race found in the program.
 784     /// This finds the two racing threads and the type
 785     /// of data-race that occurred. This will also
 786     /// return info about the memory location the data-race
 787     /// occurred in.
 788     #[cold]
 789     #[inline(never)]
 790     fn report_data_race<'tcx>(
 791         global: &MemoryExtra,
 792         range: &MemoryCellClocks,
 793         action: &str,
 794         is_atomic: bool,
 795         pointer: Pointer<Tag>,
 796         len: Size,
 797     ) -> InterpResult<'tcx> {
 798         let (current_index, current_clocks) = global.current_thread_state();
 799         let write_clock;
 800         let (other_action, other_thread, other_clock) = if range.write
 801             > current_clocks.clock[range.write_index]
 802         {
 803             // Convert the write action into the vector clock it
 804             // represents for diagnostic purposes.
 805             write_clock = VClock::new_with_index(range.write_index, range.write);
 806             (range.write_type.get_descriptor(), range.write_index, &write_clock)
 807         } else if let Some(idx) = Self::find_gt_index(&range.read, &current_clocks.clock) {
 808             ("Read", idx, &range.read)
 809         } else if !is_atomic {
 810             if let Some(atomic) = range.atomic() {
 811                 if let Some(idx) = Self::find_gt_index(&atomic.write_vector, &current_clocks.clock)
 812                 {
 813                     ("Atomic Store", idx, &atomic.write_vector)
 814                 } else if let Some(idx) =
 815                     Self::find_gt_index(&atomic.read_vector, &current_clocks.clock)
 816                 {
 817                     ("Atomic Load", idx, &atomic.read_vector)
 818                 } else {
 819                     unreachable!(
 820                         "Failed to report data-race for non-atomic operation: no race found"
 821                     )
 822                 }
 823             } else {
 824                 unreachable!(
 825                     "Failed to report data-race for non-atomic operation: no atomic component"
 826                 )
 827             }
 828         } else {
 829             unreachable!("Failed to report data-race for atomic operation")
 830         };
 831
 832         // Load elaborated thread information about the racing thread actions.
 833         let current_thread_info = global.print_thread_metadata(current_index);
 834         let other_thread_info = global.print_thread_metadata(other_thread);
 835
 836         // Throw the data-race detection.
 837         throw_ub_format!(
 838             "Data race detected between {} on {} and {} on {}, memory({:?},offset={},size={})\
 839             \n(current vector clock = {:?}, conflicting timestamp = {:?})",
 840             action,
 841             current_thread_info,
 842             other_action,
 843             other_thread_info,
 844             pointer.alloc_id,
 845             pointer.offset.bytes(),
 846             len.bytes(),
 847             current_clocks.clock,
 848             other_clock
 849         )
 850     }
 851
 852     /// Detect data-races for an unsynchronized read operation, will not perform
 853     /// data-race detection if `multi-threaded` is false, either due to no threads
 854     /// being created or if it is temporarily disabled during a racy read or write
 855     /// operation for which data-race detection is handled separately, for example
 856     /// atomic read operations.
 857     pub fn read<'tcx>(&self, pointer: Pointer<Tag>, len: Size) -> InterpResult<'tcx> {
 858         if self.global.multi_threaded.get() {
 859             let (index, clocks) = self.global.current_thread_state();
 860             let mut alloc_ranges = self.alloc_ranges.borrow_mut();
 861             for (_, range) in alloc_ranges.iter_mut(pointer.offset, len) {
 862                 if let Err(DataRace) = range.read_race_detect(&*clocks, index) {
 863                     // Report data-race.
 864                     return Self::report_data_race(
 865                         &self.global,
 866                         range,
 867                         "Read",
 868                         false,
 869                         pointer,
 870                         len,
 871                     );
 872                 }
 873             }
 874             Ok(())
 875         } else {
 876             Ok(())
 877         }
 878     }
 879
 880     // Shared code for detecting data-races on unique access to a section of memory
 881     fn unique_access<'tcx>(
 882         &mut self,
 883         pointer: Pointer<Tag>,
 884         len: Size,
 885         write_type: WriteType,
 886     ) -> InterpResult<'tcx> {
 887         if self.global.multi_threaded.get() {
 888             let (index, clocks) = self.global.current_thread_state();
 889             for (_, range) in self.alloc_ranges.get_mut().iter_mut(pointer.offset, len) {
 890                 if let Err(DataRace) = range.write_race_detect(&*clocks, index, write_type) {
 891                     // Report data-race
 892                     return Self::report_data_race(
 893                         &self.global,
 894                         range,
 895                         write_type.get_descriptor(),
 896                         false,
 897                         pointer,
 898                         len,
 899                     );
 900                 }
 901             }
 902             Ok(())
 903         } else {
 904             Ok(())
 905         }
 906     }
 907
 908     /// Detect data-races for an unsynchronized write operation, will not perform
 909     /// data-race threads if `multi-threaded` is false, either due to no threads
 910     /// being created or if it is temporarily disabled during a racy read or write
 911     /// operation
 912     pub fn write<'tcx>(&mut self, pointer: Pointer<Tag>, len: Size) -> InterpResult<'tcx> {
 913         self.unique_access(pointer, len, WriteType::Write)
 914     }
 915
 916     /// Detect data-races for an unsynchronized deallocate operation, will not perform
 917     /// data-race threads if `multi-threaded` is false, either due to no threads
 918     /// being created or if it is temporarily disabled during a racy read or write
 919     /// operation
 920     pub fn deallocate<'tcx>(&mut self, pointer: Pointer<Tag>, len: Size) -> InterpResult<'tcx> {
 921         self.unique_access(pointer, len, WriteType::Deallocate)
 922     }
 923 }
 924
// Empty impl: `MiriEvalContext` picks up the default methods of the private
// helper trait `EvalContextPrivExt` declared right below.
impl<'mir, 'tcx: 'mir> EvalContextPrivExt<'mir, 'tcx> for MiriEvalContext<'mir, 'tcx> {}
 926 trait EvalContextPrivExt<'mir, 'tcx: 'mir>: MiriEvalContextExt<'mir, 'tcx> {
 927     // Temporarily allow data-races to occur, this should only be
 928     // used if either one of the appropriate `validate_atomic` functions
 929     // will be called to treat a memory access as atomic or if the memory
 930     // being accessed should be treated as internal state, that cannot be
 931     // accessed by the interpreted program.
 932     #[inline]
 933     fn allow_data_races_ref<R>(&self, op: impl FnOnce(&MiriEvalContext<'mir, 'tcx>) -> R) -> R {
 934         let this = self.eval_context_ref();
 935         let old = if let Some(data_race) = &this.memory.extra.data_race {
 936             data_race.multi_threaded.replace(false)
 937         } else {
 938             false
 939         };
 940         let result = op(this);
 941         if let Some(data_race) = &this.memory.extra.data_race {
 942             data_race.multi_threaded.set(old);
 943         }
 944         result
 945     }
 946
 947     /// Same as `allow_data_races_ref`, this temporarily disables any data-race detection and
 948     /// so should only be used for atomic operations or internal state that the program cannot
 949     /// access.
 950     #[inline]
 951     fn allow_data_races_mut<R>(
 952         &mut self,
 953         op: impl FnOnce(&mut MiriEvalContext<'mir, 'tcx>) -> R,
 954     ) -> R {
 955         let this = self.eval_context_mut();
 956         let old = if let Some(data_race) = &this.memory.extra.data_race {
 957             data_race.multi_threaded.replace(false)
 958         } else {
 959             false
 960         };
 961         let result = op(this);
 962         if let Some(data_race) = &this.memory.extra.data_race {
 963             data_race.multi_threaded.set(old);
 964         }
 965         result
 966     }
 967
 968     /// Generic atomic operation implementation,
 969     /// this accesses memory via get_raw instead of
 970     /// get_raw_mut, due to issues calling get_raw_mut
 971     /// for atomic loads from read-only memory.
 972     /// FIXME: is this valid, or should get_raw_mut be used for
 973     /// atomic-stores/atomic-rmw?
 974     fn validate_atomic_op<A: Debug + Copy>(
 975         &self,
 976         place: &MPlaceTy<'tcx, Tag>,
 977         atomic: A,
 978         description: &str,
 979         mut op: impl FnMut(
 980             &mut MemoryCellClocks,
 981             &mut ThreadClockSet,
 982             VectorIdx,
 983             A,
 984         ) -> Result<(), DataRace>,
 985     ) -> InterpResult<'tcx> {
 986         let this = self.eval_context_ref();
 987         if let Some(data_race) = &this.memory.extra.data_race {
 988             if data_race.multi_threaded.get() {
 989                 // Load and log the atomic operation.
 990                 let place_ptr = place.ptr.assert_ptr();
 991                 let size = place.layout.size;
 992                 let alloc_meta =
 993                     &this.memory.get_raw(place_ptr.alloc_id)?.extra.data_race.as_ref().unwrap();
 994                 log::trace!(
 995                     "Atomic op({}) with ordering {:?} on memory({:?}, offset={}, size={})",
 996                     description,
 997                     &atomic,
 998                     place_ptr.alloc_id,
 999                     place_ptr.offset.bytes(),
1000                     size.bytes()
1001                 );
1002
1003                 // Perform the atomic operation.
1004                 let data_race = &alloc_meta.global;
1005                 data_race.maybe_perform_sync_operation(|index, mut clocks| {
1006                     for (_, range) in
1007                         alloc_meta.alloc_ranges.borrow_mut().iter_mut(place_ptr.offset, size)
1008                     {
1009                         if let Err(DataRace) = op(range, &mut *clocks, index, atomic) {
1010                             mem::drop(clocks);
1011                             return VClockAlloc::report_data_race(
1012                                 &alloc_meta.global,
1013                                 range,
1014                                 description,
1015                                 true,
1016                                 place_ptr,
1017                                 size,
1018                             ).map(|_| true);
1019                         }
1020                     }
1021
1022                     // This conservatively assumes all operations have release semantics
1023                     Ok(true)
1024                 })?;
1025
1026                 // Log changes to atomic memory.
1027                 if log::log_enabled!(log::Level::Trace) {
1028                     for (_, range) in alloc_meta.alloc_ranges.borrow().iter(place_ptr.offset, size)
1029                     {
1030                         log::trace!(
1031                             "Updated atomic memory({:?}, offset={}, size={}) to {:#?}",
1032                             place.ptr.assert_ptr().alloc_id,
1033                             place_ptr.offset.bytes(),
1034                             size.bytes(),
1035                             range.atomic_ops
1036                         );
1037                     }
1038                 }
1039             }
1040         }
1041         Ok(())
1042     }
1043 }
1044
/// Extra metadata associated with a thread.
#[derive(Debug, Clone, Default)]
struct ThreadExtraState {
    /// The vector index currently assigned to the thread.
    /// This is set to `None` once the vector index has been
    /// re-used by another thread, at which point the value
    /// will never need to be read during data-race reporting.
    vector_index: Option<VectorIdx>,

    /// The name of the thread, kept up to date so that
    /// detected data races can be reported with better
    /// diagnostics.
    thread_name: Option<Box<str>>,

    /// The thread's vector clock at termination. This is
    /// set when the thread terminates and is what a join
    /// on the thread uses, since the `vector_index` may
    /// already have been re-used when the join occurs.
    termination_vector_clock: Option<VClock>,
}
1066
/// Global data-race detection state: tracks the currently
/// executing thread as well as the vector clocks associated
/// with each of the threads.
#[derive(Debug, Clone)]
pub struct GlobalState {
    /// Set to true once the first additional thread has been
    /// launched. Everything before a thread launch is ordered
    /// before everything after it, so races only need to be
    /// recorded from that point on; while this is false the
    /// detector skips its checks.
    multi_threaded: Cell<bool>,

    /// Mapping of a vector index to a known set of thread
    /// clocks. This does not map directly from a thread id,
    /// since one vector index may refer to multiple threads
    /// over time.
    vector_clocks: RefCell<IndexVec<VectorIdx, ThreadClockSet>>,

    /// Mapping of a given vector index to the thread it currently
    /// represents. This changes when a vector index is re-assigned
    /// to a new thread.
    vector_info: RefCell<IndexVec<VectorIdx, ThreadId>>,

    /// The mapping of a given thread to associated thread metadata.
    thread_info: RefCell<IndexVec<ThreadId, ThreadExtraState>>,

    /// The current vector index being executed.
    current_index: Cell<VectorIdx>,

    /// Vector indices that could potentially be re-used on thread creation.
    /// An index is inserted here after its thread has terminated and
    /// been joined with, and hence may potentially become free
    /// for use as the index for a new thread.
    /// Elements in this set may still be needed to report
    /// data-races, and can only be re-used after all
    /// active vector clocks catch up with the thread's timestamp.
    reuse_candidates: RefCell<FxHashSet<VectorIdx>>,

    /// The number of threads that are currently active.
    /// If the number of active threads drops to 1 and a join
    /// operation then occurs with the remaining main thread,
    /// multi-threaded execution may be disabled.
    active_thread_count: Cell<usize>,

    /// Threads that have terminated but have not yet been joined,
    /// and so cannot become re-use candidates until a join operation
    /// occurs.
    /// The associated vector index is moved into `reuse_candidates`
    /// after the join operation occurs.
    terminated_threads: RefCell<FxHashMap<ThreadId, VectorIdx>>,
}
1118
1119 impl GlobalState {
1120     /// Create a new global state, setup with just thread-id=0
1121     /// advanced to timestamp = 1.
1122     pub fn new() -> Self {
1123         let global_state = GlobalState {
1124             multi_threaded: Cell::new(false),
1125             vector_clocks: RefCell::new(IndexVec::new()),
1126             vector_info: RefCell::new(IndexVec::new()),
1127             thread_info: RefCell::new(IndexVec::new()),
1128             current_index: Cell::new(VectorIdx::new(0)),
1129             active_thread_count: Cell::new(1),
1130             reuse_candidates: RefCell::new(FxHashSet::default()),
1131             terminated_threads: RefCell::new(FxHashMap::default()),
1132         };
1133
1134         // Setup the main-thread since it is not explicitly created:
1135         // uses vector index and thread-id 0, also the rust runtime gives
1136         // the main-thread a name of "main".
1137         let index = global_state.vector_clocks.borrow_mut().push(ThreadClockSet::default());
1138         global_state.vector_info.borrow_mut().push(ThreadId::new(0));
1139         global_state.thread_info.borrow_mut().push(ThreadExtraState {
1140             vector_index: Some(index),
1141             thread_name: Some("main".to_string().into_boxed_str()),
1142             termination_vector_clock: None,
1143         });
1144
1145         global_state
1146     }
1147
1148     // Try to find vector index values that can potentially be re-used
1149     // by a new thread instead of a new vector index being created.
1150     fn find_vector_index_reuse_candidate(&self) -> Option<VectorIdx> {
1151         let mut reuse = self.reuse_candidates.borrow_mut();
1152         let vector_clocks = self.vector_clocks.borrow();
1153         let vector_info = self.vector_info.borrow();
1154         let terminated_threads = self.terminated_threads.borrow();
1155         for &candidate in reuse.iter() {
1156             let target_timestamp = vector_clocks[candidate].clock[candidate];
1157             if vector_clocks.iter_enumerated().all(|(clock_idx, clock)| {
1158                 // The thread happens before the clock, and hence cannot report
1159                 // a data-race with this the candidate index.
1160                 let no_data_race = clock.clock[candidate] >= target_timestamp;
1161
1162                 // The vector represents a thread that has terminated and hence cannot
1163                 // report a data-race with the candidate index.
1164                 let thread_id = vector_info[clock_idx];
1165                 let vector_terminated =
1166                     reuse.contains(&clock_idx) || terminated_threads.contains_key(&thread_id);
1167
1168                 // The vector index cannot report a race with the candidate index
1169                 // and hence allows the candidate index to be re-used.
1170                 no_data_race || vector_terminated
1171             }) {
1172                 // All vector clocks for each vector index are equal to
1173                 // the target timestamp, and the thread is known to have
1174                 // terminated, therefore this vector clock index cannot
1175                 // report any more data-races.
1176                 assert!(reuse.remove(&candidate));
1177                 return Some(candidate);
1178             }
1179         }
1180         None
1181     }
1182
1183     // Hook for thread creation, enabled multi-threaded execution and marks
1184     // the current thread timestamp as happening-before the current thread.
1185     #[inline]
1186     pub fn thread_created(&self, thread: ThreadId) {
1187         let current_index = self.current_index();
1188
1189         // Increment the number of active threads.
1190         let active_threads = self.active_thread_count.get();
1191         self.active_thread_count.set(active_threads + 1);
1192
1193         // Enable multi-threaded execution, there are now two threads
1194         // so data-races are now possible.
1195         self.multi_threaded.set(true);
1196
1197         // Load and setup the associated thread metadata
1198         let mut thread_info = self.thread_info.borrow_mut();
1199         thread_info.ensure_contains_elem(thread, Default::default);
1200
1201         // Assign a vector index for the thread, attempting to re-use an old
1202         // vector index that can no longer report any data-races if possible.
1203         let created_index = if let Some(reuse_index) = self.find_vector_index_reuse_candidate() {
1204             // Now re-configure the re-use candidate, increment the clock
1205             // for the new sync use of the vector.
1206             let mut vector_clocks = self.vector_clocks.borrow_mut();
1207             vector_clocks[reuse_index].increment_clock(reuse_index);
1208
1209             // Locate the old thread the vector was associated with and update
1210             // it to represent the new thread instead.
1211             let mut vector_info = self.vector_info.borrow_mut();
1212             let old_thread = vector_info[reuse_index];
1213             vector_info[reuse_index] = thread;
1214
1215             // Mark the thread the vector index was associated with as no longer
1216             // representing a thread index.
1217             thread_info[old_thread].vector_index = None;
1218
1219             reuse_index
1220         } else {
1221             // No vector re-use candidates available, instead create
1222             // a new vector index.
1223             let mut vector_info = self.vector_info.borrow_mut();
1224             vector_info.push(thread)
1225         };
1226
1227         log::trace!("Creating thread = {:?} with vector index = {:?}", thread, created_index);
1228
1229         // Mark the chosen vector index as in use by the thread.
1230         thread_info[thread].vector_index = Some(created_index);
1231
1232         // Create a thread clock set if applicable.
1233         let mut vector_clocks = self.vector_clocks.borrow_mut();
1234         if created_index == vector_clocks.next_index() {
1235             vector_clocks.push(ThreadClockSet::default());
1236         }
1237
1238         // Now load the two clocks and configure the initial state.
1239         let (current, created) = vector_clocks.pick2_mut(current_index, created_index);
1240
1241         // Join the created with current, since the current threads
1242         // previous actions happen-before the created thread.
1243         created.join_with(current);
1244
1245         // Advance both threads after the synchronized operation.
1246         // Both operations are considered to have release semantics.
1247         current.increment_clock(current_index);
1248         created.increment_clock(created_index);
1249     }
1250
1251     /// Hook on a thread join to update the implicit happens-before relation
1252     /// between the joined thread and the current thread.
1253     #[inline]
1254     pub fn thread_joined(&self, current_thread: ThreadId, join_thread: ThreadId) {
1255         let mut clocks_vec = self.vector_clocks.borrow_mut();
1256         let thread_info = self.thread_info.borrow();
1257
1258         // Load the vector clock of the current thread.
1259         let current_index = thread_info[current_thread]
1260             .vector_index
1261             .expect("Performed thread join on thread with no assigned vector");
1262         let current = &mut clocks_vec[current_index];
1263
1264         // Load the associated vector clock for the terminated thread.
1265         let join_clock = thread_info[join_thread]
1266             .termination_vector_clock
1267             .as_ref()
1268             .expect("Joined with thread but thread has not terminated");
1269
1270
1271         // The join thread happens-before the current thread
1272         // so update the current vector clock.
1273         // Is not a release operation so the clock is not incremented.
1274         current.clock.join(join_clock);
1275
1276         // Check the number of active threads, if the value is 1
1277         // then test for potentially disabling multi-threaded execution.
1278         let active_threads = self.active_thread_count.get();
1279         if active_threads == 1 {
1280             // May potentially be able to disable multi-threaded execution.
1281             let current_clock = &clocks_vec[current_index];
1282             if clocks_vec
1283                 .iter_enumerated()
1284                 .all(|(idx, clocks)| clocks.clock[idx] <= current_clock.clock[idx])
1285             {
1286                 // All thread terminations happen-before the current clock
1287                 // therefore no data-races can be reported until a new thread
1288                 // is created, so disable multi-threaded execution.
1289                 self.multi_threaded.set(false);
1290             }
1291         }
1292
1293         // If the thread is marked as terminated but not joined
1294         // then move the thread to the re-use set.
1295         let mut termination = self.terminated_threads.borrow_mut();
1296         if let Some(index) = termination.remove(&join_thread) {
1297             let mut reuse = self.reuse_candidates.borrow_mut();
1298             reuse.insert(index);
1299         }
1300     }
1301
1302     /// On thread termination, the vector-clock may re-used
1303     /// in the future once all remaining thread-clocks catch
1304     /// up with the time index of the terminated thread.
1305     /// This assigns thread termination with a unique index
1306     /// which will be used to join the thread
1307     /// This should be called strictly before any calls to
1308     /// `thread_joined`.
1309     #[inline]
1310     pub fn thread_terminated(&self) {
1311         let current_index = self.current_index();
1312
1313         // Increment the clock to a unique termination timestamp.
1314         let mut vector_clocks = self.vector_clocks.borrow_mut();
1315         let current_clocks = &mut vector_clocks[current_index];
1316         current_clocks.increment_clock(current_index);
1317
1318         // Load the current thread id for the executing vector.
1319         let vector_info = self.vector_info.borrow();
1320         let current_thread = vector_info[current_index];
1321
1322         // Load the current thread metadata, and move to a terminated
1323         // vector state. Setting up the vector clock all join operations
1324         // will use.
1325         let mut thread_info = self.thread_info.borrow_mut();
1326         let current = &mut thread_info[current_thread];
1327         current.termination_vector_clock = Some(current_clocks.clock.clone());
1328
1329         // Add this thread as a candidate for re-use after a thread join
1330         // occurs.
1331         let mut termination = self.terminated_threads.borrow_mut();
1332         termination.insert(current_thread, current_index);
1333
1334         // Reduce the number of active threads, now that a thread has
1335         // terminated.
1336         let mut active_threads = self.active_thread_count.get();
1337         active_threads -= 1;
1338         self.active_thread_count.set(active_threads);
1339     }
1340
1341     /// Hook for updating the local tracker of the currently
1342     /// enabled thread, should always be updated whenever
1343     /// `active_thread` in thread.rs is updated.
1344     #[inline]
1345     pub fn thread_set_active(&self, thread: ThreadId) {
1346         let thread_info = self.thread_info.borrow();
1347         let vector_idx = thread_info[thread]
1348             .vector_index
1349             .expect("Setting thread active with no assigned vector");
1350         self.current_index.set(vector_idx);
1351     }
1352
1353     /// Hook for updating the local tracker of the threads name
1354     /// this should always mirror the local value in thread.rs
1355     /// the thread name is used for improved diagnostics
1356     /// during a data-race.
1357     #[inline]
1358     pub fn thread_set_name(&self, thread: ThreadId, name: String) {
1359         let name = name.into_boxed_str();
1360         let mut thread_info = self.thread_info.borrow_mut();
1361         thread_info[thread].thread_name = Some(name);
1362     }
1363
1364     /// Attempt to perform a synchronized operation, this
1365     /// will perform no operation if multi-threading is
1366     /// not currently enabled.
1367     /// Otherwise it will increment the clock for the current
1368     /// vector before and after the operation for data-race
1369     /// detection between any happens-before edges the
1370     /// operation may create.
1371     fn maybe_perform_sync_operation<'tcx>(
1372         &self,
1373         op: impl FnOnce(VectorIdx, RefMut<'_, ThreadClockSet>) -> InterpResult<'tcx, bool>,
1374     ) -> InterpResult<'tcx> {
1375         if self.multi_threaded.get() {
1376             let (index, clocks) = self.current_thread_state_mut();
1377             if op(index, clocks)? {
1378                 let (_, mut clocks) = self.current_thread_state_mut();
1379                 clocks.increment_clock(index);
1380             }
1381         }
1382         Ok(())
1383     }
1384
1385     /// Internal utility to identify a thread stored internally
1386     /// returns the id and the name for better diagnostics.
1387     fn print_thread_metadata(&self, vector: VectorIdx) -> String {
1388         let thread = self.vector_info.borrow()[vector];
1389         let thread_name = &self.thread_info.borrow()[thread].thread_name;
1390         if let Some(name) = thread_name {
1391             let name: &str = name;
1392             format!("Thread(id = {:?}, name = {:?})", thread.to_u32(), &*name)
1393         } else {
1394             format!("Thread(id = {:?})", thread.to_u32())
1395         }
1396     }
1397
1398     /// Acquire a lock, express that the previous call of
1399     /// `validate_lock_release` must happen before this.
1400     /// As this is an acquire operation, the thread timestamp is not
1401     /// incremented.
1402     pub fn validate_lock_acquire(&self, lock: &VClock, thread: ThreadId) {
1403         let (_, mut clocks) = self.load_thread_state_mut(thread);
1404         clocks.clock.join(&lock);
1405     }
1406
1407     /// Release a lock handle, express that this happens-before
1408     /// any subsequent calls to `validate_lock_acquire`.
1409     /// For normal locks this should be equivalent to `validate_lock_release_shared`
1410     /// since an acquire operation should have occurred before, however
1411     /// for futex & condvar operations this is not the case and this
1412     /// operation must be used.
1413     pub fn validate_lock_release(&self, lock: &mut VClock, thread: ThreadId) {
1414         let (index, mut clocks) = self.load_thread_state_mut(thread);
1415         lock.clone_from(&clocks.clock);
1416         clocks.increment_clock(index);
1417     }
1418
1419     /// Release a lock handle, express that this happens-before
1420     /// any subsequent calls to `validate_lock_acquire` as well
1421     /// as any previous calls to this function after any
1422     /// `validate_lock_release` calls.
1423     /// For normal locks this should be equivalent to `validate_lock_release`.
1424     /// This function only exists for joining over the set of concurrent readers
1425     /// in a read-write lock and should not be used for anything else.
1426     pub fn validate_lock_release_shared(&self, lock: &mut VClock, thread: ThreadId) {
1427         let (index, mut clocks) = self.load_thread_state_mut(thread);
1428         lock.join(&clocks.clock);
1429         clocks.increment_clock(index);
1430     }
1431
1432     /// Load the vector index used by the given thread as well as the set of vector clocks
1433     /// used by the thread.
1434     #[inline]
1435     fn load_thread_state_mut(&self, thread: ThreadId) -> (VectorIdx, RefMut<'_, ThreadClockSet>) {
1436         let index = self.thread_info.borrow()[thread]
1437             .vector_index
1438             .expect("Loading thread state for thread with no assigned vector");
1439         let ref_vector = self.vector_clocks.borrow_mut();
1440         let clocks = RefMut::map(ref_vector, |vec| &mut vec[index]);
1441         (index, clocks)
1442     }
1443
1444     /// Load the current vector clock in use and the current set of thread clocks
1445     /// in use for the vector.
1446     #[inline]
1447     fn current_thread_state(&self) -> (VectorIdx, Ref<'_, ThreadClockSet>) {
1448         let index = self.current_index();
1449         let ref_vector = self.vector_clocks.borrow();
1450         let clocks = Ref::map(ref_vector, |vec| &vec[index]);
1451         (index, clocks)
1452     }
1453
1454     /// Load the current vector clock in use and the current set of thread clocks
1455     /// in use for the vector mutably for modification.
1456     #[inline]
1457     fn current_thread_state_mut(&self) -> (VectorIdx, RefMut<'_, ThreadClockSet>) {
1458         let index = self.current_index();
1459         let ref_vector = self.vector_clocks.borrow_mut();
1460         let clocks = RefMut::map(ref_vector, |vec| &mut vec[index]);
1461         (index, clocks)
1462     }
1463
    /// Return the vector index currently stored in `self.current_index`,
    /// i.e. the index this detector treats as the current thread.
    /// This should be the same as the data-race active thread.
    #[inline]
    fn current_index(&self) -> VectorIdx {
        self.current_index.get()
    }
1470 }