Extend DepGraph so it can track "work-products"

author Niko Matsakis <niko@alum.mit.edu>

Thu, 21 Jul 2016 16:33:23 +0000 (12:33 -0400)

committer Niko Matsakis <niko@alum.mit.edu>

Thu, 28 Jul 2016 16:05:04 +0000 (12:05 -0400)
author Niko Matsakis <niko@alum.mit.edu>
Thu, 21 Jul 2016 16:33:23 +0000 (12:33 -0400)
committer Niko Matsakis <niko@alum.mit.edu>
Thu, 28 Jul 2016 16:05:04 +0000 (12:05 -0400)
diff --git a/src/librustc/dep_graph/dep_node.rs b/src/librustc/dep_graph/dep_node.rs

index 73b96651b05e27826c031d55267cff16415a7bf1..dd7f0286574d0b46f11758b21a21f4c32a82f11c 100644 (file)
--- a/src/librustc/dep_graph/dep_node.rs
+++ b/src/librustc/dep_graph/dep_node.rs
@@ -9,6 +9,7 @@
  // except according to those terms.
  
  use std::fmt::Debug;
+use std::sync::Arc;
  
  macro_rules! try_opt {
      ($e:expr) => (
@@ -45,6 +46,10 @@ pub enum DepNode<D: Clone + Debug> {
      // in an extern crate.
      MetaData(D),
  
+    // Represents some artifact that we save to disk. Note that these
+    // do not have a def-id as part of their identifier.
+    WorkProduct(Arc<WorkProductId>),
+
      // Represents different phases in the compiler.
      CrateReader,
      CollectLanguageItems,
@@ -189,6 +194,11 @@ pub fn map_def<E, OP>(&self, mut op: OP) -> Option<DepNode<E>>
              TransCrate => Some(TransCrate),
              TransWriteMetadata => Some(TransWriteMetadata),
              LinkBinary => Some(LinkBinary),
+
+            // work product names do not need to be mapped, because
+            // they are always absolute.
+            WorkProduct(ref id) => Some(WorkProduct(id.clone())),
+
              Hir(ref d) => op(d).map(Hir),
              MetaData(ref d) => op(d).map(MetaData),
              CollectItem(ref d) => op(d).map(CollectItem),
@@ -229,3 +239,14 @@ pub fn map_def<E, OP>(&self, mut op: OP) -> Option<DepNode<E>>
          }
      }
  }
+
+/// A "work product" corresponds to a `.o` (or other) file that we
+/// save in between runs. These ids do not have a DefId but rather
+/// some independent path or string that persists between runs without
+/// the need to be mapped or unmapped. (This ensures we can serialize
+/// them even in the absence of a tcx.)
+#[derive(Clone, Debug, PartialEq, Eq, Hash, RustcEncodable, RustcDecodable)]
+pub enum WorkProductId {
+    PartitionObjectFile(String), // see (*TransPartition) below
+}
+
diff --git a/src/librustc/dep_graph/graph.rs b/src/librustc/dep_graph/graph.rs

index 741ad65c29fda373a9bb17129c16299f5b6f6871..ab7013df33f14c23a63715f1d3ec5d6ed2f8beb1 100644 (file)
--- a/src/librustc/dep_graph/graph.rs
+++ b/src/librustc/dep_graph/graph.rs
@@ -9,22 +9,44 @@
  // except according to those terms.
  
  use hir::def_id::DefId;
+use rustc_data_structures::fnv::FnvHashMap;
+use std::cell::{Ref, RefCell};
  use std::rc::Rc;
+use std::sync::Arc;
  
-use super::dep_node::DepNode;
+use super::dep_node::{DepNode, WorkProductId};
  use super::query::DepGraphQuery;
  use super::raii;
  use super::thread::{DepGraphThreadData, DepMessage};
  
  #[derive(Clone)]
  pub struct DepGraph {
-    data: Rc<DepGraphThreadData>
+    data: Rc<DepGraphData>
+}
+
+struct DepGraphData {
+    /// we send messages to the thread to let it build up the dep-graph
+    /// from the current run
+    thread: DepGraphThreadData,
+
+    /// when we load, there may be `.o` files, cached mir, or other such
+    /// things available to us. If we find that they are not dirty, we
+    /// load the path to the file storing those work-products here into
+    /// this map. We can later look for and extract that data.
+    previous_work_products: RefCell<FnvHashMap<Arc<WorkProductId>, WorkProduct>>,
+
+    /// work-products that we generate in this run
+    work_products: RefCell<FnvHashMap<Arc<WorkProductId>, WorkProduct>>,
  }
  
  impl DepGraph {
      pub fn new(enabled: bool) -> DepGraph {
          DepGraph {
-            data: Rc::new(DepGraphThreadData::new(enabled))
+            data: Rc::new(DepGraphData {
+                thread: DepGraphThreadData::new(enabled),
+                previous_work_products: RefCell::new(FnvHashMap()),
+                work_products: RefCell::new(FnvHashMap())
+            })
          }
      }
  
@@ -32,19 +54,19 @@ pub fn new(enabled: bool) -> DepGraph {
      /// then the other methods on this `DepGraph` will have no net effect.
      #[inline]
      pub fn enabled(&self) -> bool {
-        self.data.enabled()
+        self.data.thread.enabled()
      }
  
      pub fn query(&self) -> DepGraphQuery<DefId> {
-        self.data.query()
+        self.data.thread.query()
      }
  
      pub fn in_ignore<'graph>(&'graph self) -> raii::IgnoreTask<'graph> {
-        raii::IgnoreTask::new(&self.data)
+        raii::IgnoreTask::new(&self.data.thread)
      }
  
      pub fn in_task<'graph>(&'graph self, key: DepNode<DefId>) -> raii::DepTask<'graph> {
-        raii::DepTask::new(&self.data, key)
+        raii::DepTask::new(&self.data.thread, key)
      }
  
      pub fn with_ignore<OP,R>(&self, op: OP) -> R
@@ -62,10 +84,84 @@ pub fn with_task<OP,R>(&self, key: DepNode<DefId>, op: OP) -> R
      }
  
      pub fn read(&self, v: DepNode<DefId>) {
-        self.data.enqueue(DepMessage::Read(v));
+        self.data.thread.enqueue(DepMessage::Read(v));
      }
  
      pub fn write(&self, v: DepNode<DefId>) {
-        self.data.enqueue(DepMessage::Write(v));
+        self.data.thread.enqueue(DepMessage::Write(v));
+    }
+
+    /// Indicates that a previous work product exists for `v`. This is
+    /// invoked during initial start-up based on what nodes are clean
+    /// (and what files exist in the incr. directory).
+    pub fn insert_previous_work_product(&self, v: &Arc<WorkProductId>, data: WorkProduct) {
+        debug!("insert_previous_work_product({:?}, {:?})", v, data);
+        self.data.previous_work_products.borrow_mut()
+                                        .insert(v.clone(), data);
+    }
+
+    /// Indicates that we created the given work-product in this run
+    /// for `v`. This record will be preserved and loaded in the next
+    /// run.
+    pub fn insert_work_product(&self, v: &Arc<WorkProductId>, data: WorkProduct) {
+        debug!("insert_work_product({:?}, {:?})", v, data);
+        self.data.work_products.borrow_mut()
+                               .insert(v.clone(), data);
      }
+
+    /// Check whether a previous work product exists for `v` and, if
+    /// so, return the path that leads to it. Used to skip doing work.
+    pub fn previous_work_product(&self, v: &Arc<WorkProductId>) -> Option<WorkProduct> {
+        self.data.previous_work_products.borrow()
+                                        .get(v)
+                                        .cloned()
+    }
+
+    /// Access the map of work-products created during this run. Only
+    /// used during saving of the dep-graph.
+    pub fn work_products(&self) -> Ref<FnvHashMap<Arc<WorkProductId>, WorkProduct>> {
+        self.data.work_products.borrow()
+    }
+}
+
+/// A "work product" is an intermediate result that we save into the
+/// incremental directory for later re-use. The primary example are
+/// the object files that we save for each partition at code
+/// generation time.
+///
+/// Each work product is associated with a dep-node, representing the
+/// process that produced the work-product. If that dep-node is found
+/// to be dirty when we load up, then we will delete the work-product
+/// at load time. If the work-product is found to be clean, the we
+/// will keep a record in the `previous_work_products` list.
+///
+/// In addition, work products have an associated hash. This hash is
+/// an extra hash that can be used to decide if the work-product from
+/// a previous compilation can be re-used (in addition to the dirty
+/// edges check).
+///
+/// As the primary example, consider the object files we generate for
+/// each partition. In the first run, we create partitions based on
+/// the symbols that need to be compiled. For each partition P, we
+/// hash the symbols in P and create a `WorkProduct` record associated
+/// with `DepNode::TransPartition(P)`; the hash is the set of symbols
+/// in P.
+///
+/// The next time we compile, if the `DepNode::TransPartition(P)` is
+/// judged to be clean (which means none of the things we read to
+/// generate the partition were found to be dirty), it will be loaded
+/// into previous work products. We will then regenerate the set of
+/// symbols in the partition P and hash them (note that new symbols
+/// may be added -- for example, new monomorphizations -- even if
+/// nothing in P changed!). We will compare that hash against the
+/// previous hash. If it matches up, we can reuse the object file.
+#[derive(Clone, Debug, RustcEncodable, RustcDecodable)]
+pub struct WorkProduct {
+    /// extra hash used to decide if work-product is still suitable;
+    /// note that this is *not* a hash of the work-product itself.
+    /// See documentation on `WorkProduct` type for an example.
+    pub input_hash: u64,
+
+    /// filename storing this work-product (found in the incr. comp. directory)
+    pub file_name: String,
  }
diff --git a/src/librustc/dep_graph/mod.rs b/src/librustc/dep_graph/mod.rs

index e65f6bbcf7aab672acdf3028b794582cf6180450..a499cb10f2325d3032f72d58b106ef18a5559d10 100644 (file)
--- a/src/librustc/dep_graph/mod.rs
+++ b/src/librustc/dep_graph/mod.rs
@@ -20,7 +20,9 @@
  
  pub use self::dep_tracking_map::{DepTrackingMap, DepTrackingMapConfig};
  pub use self::dep_node::DepNode;
+pub use self::dep_node::WorkProductId;
  pub use self::graph::DepGraph;
+pub use self::graph::WorkProduct;
  pub use self::query::DepGraphQuery;
  pub use self::visit::visit_all_items_in_krate;
  pub use self::raii::DepTask;
author	Niko Matsakis <niko@alum.mit.edu>
	Thu, 21 Jul 2016 16:33:23 +0000 (12:33 -0400)
committer	Niko Matsakis <niko@alum.mit.edu>
	Thu, 28 Jul 2016 16:05:04 +0000 (12:05 -0400)
src/librustc/dep_graph/dep_node.rs		patch \| blob \| history
src/librustc/dep_graph/graph.rs		patch \| blob \| history
src/librustc/dep_graph/mod.rs		patch \| blob \| history