[WIP] Use a sharded dep node to dep node index map #61845

Closed · wants to merge 1 commit
109 changes: 85 additions & 24 deletions src/librustc/dep_graph/graph.rs
@@ -3,11 +3,15 @@ use rustc_data_structures::stable_hasher::{HashStable, StableHasher};
use rustc_data_structures::fx::{FxHashMap, FxHashSet};
use rustc_index::vec::{Idx, IndexVec};
use smallvec::SmallVec;
use rustc_data_structures::sync::{Lrc, Lock, AtomicU32, AtomicU64, Ordering};
use rustc_data_structures::sync::{
Lrc, Lock, LockGuard, MappedLockGuard, AtomicU32, AtomicU64, Ordering
};
use rustc_data_structures::sharded::{self, Sharded};
use std::sync::atomic::Ordering::SeqCst;
use std::env;
use std::iter;
use std::hash::Hash;
use std::convert::{TryFrom, TryInto};
use std::collections::hash_map::Entry;
use std::mem;
use crate::ty::{self, TyCtxt};
@@ -119,7 +123,15 @@ impl DepGraph {
}

pub fn query(&self) -> DepGraphQuery {
let data = self.data.as_ref().unwrap().current.data.lock();
let current = &self.data.as_ref().unwrap().current;
let shards = current.data.lock_shards();
let node_count = current.node_count.load(SeqCst) as usize;
let data: IndexVec<DepNodeIndex, _> = (0..node_count).map(|i| {
let shard = i % sharded::SHARDS;
let inner = i / sharded::SHARDS;
&shards[shard][inner]
}).collect();

let nodes: Vec<_> = data.iter().map(|n| n.node).collect();
let mut edges = Vec::new();
for (from, edge_targets) in data.iter().map(|d| (d.node, &d.edges)) {
@@ -428,8 +440,7 @@ impl DepGraph {

#[inline]
pub fn fingerprint_of(&self, dep_node_index: DepNodeIndex) -> Fingerprint {
let data = self.data.as_ref().expect("dep graph enabled").current.data.lock();
data[dep_node_index].fingerprint
self.data.as_ref().expect("dep graph enabled").current.data(dep_node_index).fingerprint
}

pub fn prev_fingerprint_of(&self, dep_node: &DepNode) -> Option<Fingerprint> {
@@ -493,25 +504,32 @@ impl DepGraph {
}

pub fn serialize(&self) -> SerializedDepGraph {
let data = self.data.as_ref().unwrap().current.data.lock();
let current = &self.data.as_ref().unwrap().current;
let shards = current.data.lock_shards();
let node_count = current.node_count.load(SeqCst) as usize;
let data = || (0..node_count).map(|i| {
let shard = i % sharded::SHARDS;
let inner = i / sharded::SHARDS;
&shards[shard][inner]
});

let fingerprints: IndexVec<SerializedDepNodeIndex, _> =
data.iter().map(|d| d.fingerprint).collect();
data().map(|d| d.fingerprint).collect();
let nodes: IndexVec<SerializedDepNodeIndex, _> =
data.iter().map(|d| d.node).collect();
data().map(|d| d.node).collect();

let total_edge_count: usize = data.iter().map(|d| d.edges.len()).sum();
let total_edge_count: usize = data().map(|d| d.edges.len()).sum();

let mut edge_list_indices = IndexVec::with_capacity(nodes.len());
let mut edge_list_data = Vec::with_capacity(total_edge_count);

for (current_dep_node_index, edges) in data.iter_enumerated().map(|(i, d)| (i, &d.edges)) {
for (current_dep_node_index, edges) in data().enumerate().map(|(i, d)| (i, &d.edges)) {
let start = edge_list_data.len() as u32;
// This should really just be a memcpy :/
edge_list_data.extend(edges.iter().map(|i| SerializedDepNodeIndex::new(i.index())));
let end = edge_list_data.len() as u32;

debug_assert_eq!(current_dep_node_index.index(), edge_list_indices.len());
debug_assert_eq!(current_dep_node_index, edge_list_indices.len());
edge_list_indices.push((start, end));
}

@@ -936,7 +954,14 @@ struct DepNodeData {
/// we first acquire the `node_to_node_index` lock and then, once a new node is to be inserted,
/// acquire the lock on `data.`
pub(super) struct CurrentDepGraph {
data: Lock<IndexVec<DepNodeIndex, DepNodeData>>,
/// The current node count. Used to allocate an index before storing it in the
/// `data` and `node_to_node_index` field below.
Contributor: nice comments :)

@Mark-Simulacrum (Member, Oct 22, 2019): I think it might be worth adding something like: "This is semantically the length of the data vector at any given point", if that's accurate? That's how I understood it. (The reason we can't query the length directly is we have N shards of the vector in reality.)

Contributor: Seems good, yes (including the parenthetical note at the end).

Contributor (suggested change):

    /// `data` and `node_to_node_index` field below.
    ///
    /// NB. This is the "logical" length of the complete data vector at any point.
    /// In practice, though, the "logical" data vector is sharded across many vectors,
    /// which will of course be of smaller lengths.
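A small illustration, not part of the PR, of the decomposition these comments describe (`SHARDS` stands in for `sharded::SHARDS`); it shows how the "logical" node count relates to the per-shard vector lengths once every reserved slot has been filled:

    // Illustrative sketch only -- not code from this PR.
    const SHARDS: usize = 4; // stand-in for `sharded::SHARDS`

    // A logical index `i` decomposes into (shard, index within that shard):
    fn decompose(i: usize) -> (usize, usize) {
        (i % SHARDS, i / SHARDS)
    }

    // With 11 nodes (logical indices 0..=10), once every reserved slot has
    // been filled the shards hold:
    //   shard 0: logical 0, 4, 8  -> inner 0, 1, 2
    //   shard 1: logical 1, 5, 9  -> inner 0, 1, 2
    //   shard 2: logical 2, 6, 10 -> inner 0, 1, 2
    //   shard 3: logical 3, 7     -> inner 0, 1
    // so `node_count` (11) equals the sum of the shard lengths (3 + 3 + 3 + 2).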

node_count: AtomicU64,

/// Maps from a `DepNodeIndex` to `DepNodeData`. The lowest bits of `DepNodeIndex` determines
/// which shard is used and the higher bits are the index into the vector.
data: Sharded<Vec<DepNodeData>>,

node_to_node_index: Sharded<FxHashMap<DepNode, DepNodeIndex>>,

/// Used to trap when a specific edge is added to the graph.
@@ -994,7 +1019,8 @@ impl CurrentDepGraph {
let new_node_count_estimate = (prev_graph_node_count * 102) / 100 + 200;

CurrentDepGraph {
data: Lock::new(IndexVec::with_capacity(new_node_count_estimate)),
node_count: AtomicU64::new(prev_graph_node_count.try_into().unwrap()),
data: Sharded::new(|| Vec::with_capacity(new_node_count_estimate / sharded::SHARDS)),
node_to_node_index: Sharded::new(|| FxHashMap::with_capacity_and_hasher(
new_node_count_estimate / sharded::SHARDS,
Default::default(),
@@ -1058,20 +1084,56 @@ impl CurrentDepGraph {
edges: SmallVec<[DepNodeIndex; 8]>,
fingerprint: Fingerprint
) -> DepNodeIndex {
match self.node_to_node_index.get_shard_by_value(&dep_node).lock().entry(dep_node) {
Entry::Occupied(entry) => *entry.get(),
let (index, inserted) = match self.node_to_node_index
.get_shard_by_value(&dep_node)
.lock()
.entry(dep_node) {
Entry::Occupied(entry) => (*entry.get(), false),
Entry::Vacant(entry) => {
let mut data = self.data.lock();
let dep_node_index = DepNodeIndex::new(data.len());
data.push(DepNodeData {
node: dep_node,
edges,
fingerprint
});
let index = self.node_count.fetch_add(1, SeqCst);
// Cast to u32 to ensure we didn't overflow.
let index = u32::try_from(index).unwrap();

let dep_node_index = DepNodeIndex::new(index as usize);
entry.insert(dep_node_index);
dep_node_index
(dep_node_index, true)
}
};

if inserted {
Contributor: This deserves a comment. It took me a bit to read and understand what was happening. Let me take a stab at it:

In the code above, we secured an index (`index`) for this node. Now we have to adjust the `data` array to include this index. However, note that we've released the lock on the `node_to_node_index` map -- so there could be multiple threads contending at this point, each with their own index.

Most of the time, the same thread will acquire both locks, one after the other. In that case, `index` will equal `self.data.len()` and we can just push onto the end of `self.data`.

Other times, however, we may find there is a gap -- e.g., we have been assigned index N+1, but the length of `self.data` is only N. In that case, we will push a dummy node to represent index N and then push our own node for index N+1. At this point, we return; when the thread with index N acquires the lock, it will overwrite the dummy node.

Contributor: (Update: I wrote this comment before I understood that the vector itself was sharded, so the text is a bit off...)
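Condensing that description into one place, adjusted for the sharded vectors; this is a sketch only (the actual change appears in the diff just below, and `placeholder` stands for the dummy `DepNodeData` built from `DepKind::Null`):

    // Sketch of the insertion scheme described above (illustrative only).
    // `index` was reserved with `node_count.fetch_add(1, SeqCst)` while holding
    // only the `node_to_node_index` lock, so other threads may still be filling
    // in lower indices of the same shard.
    let inner_index = index / sharded::SHARDS;                   // slot within the shard
    let mut shard = self.data.get_shard_by_index(index).lock();  // low bits pick the shard
    if shard.len() == inner_index {
        // Happy path: this thread is next in line for its shard, so just push.
        shard.push(dep_node_data);
    } else if inner_index >= shard.len() {
        // Gap: pad with placeholders up to our slot, then write into it. Threads
        // that own the padded slots will overwrite them when they get here.
        shard.extend(std::iter::repeat(placeholder).take(inner_index - shard.len() + 1));
        shard[inner_index] = dep_node_data;
    } else {
        // Our slot was already padded by a later thread; just overwrite it.
        shard[inner_index] = dep_node_data;
    }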

let dep_node_data = DepNodeData {
node: dep_node,
edges,
fingerprint
};
let inner_index = index.as_usize() / sharded::SHARDS;
let mut data = self.data.get_shard_by_index(index.as_usize()).lock();
Contributor: With my suggested API below, this would be:

    let (mut data, inner_index) = self.data.get_shard_by_index(index.as_usize()).lock();

let len = data.len();
if likely!(len == inner_index) {
Contributor (suggested comment): "The happy path, where we can just push onto the end of the array."

data.push(dep_node_data)
} else {
let dummy_data = DepNodeData {
Contributor (suggested comment): "We can't just push, there is some kind of gap. Add dummy nodes as needed (they may already have been added), and then overwrite our index with the correct value."

node: DepNode::new_no_params(DepKind::Null),
edges: SmallVec::default(),
fingerprint: Fingerprint::ZERO,
};
if inner_index >= len {
data.extend(iter::repeat(dummy_data).take(inner_index - len + 1));
}
data[inner_index] = dep_node_data;
}
}

index
}

fn data(
Contributor: I think a doc-comment would be good here -- something like: "Returns a guard that gives access to the data with index `index`. This requires first finding the correct shard, acquiring the lock, and then returning the correct index."

&self,
index: DepNodeIndex,
) -> MappedLockGuard<'_, DepNodeData> {
LockGuard::map(self.data.get_shard_by_index(index.as_usize()).lock(), |vec| {
Contributor: With my suggested API, this would become `|(vec, index)| { ... }` and there would be no need to hard-code the division.

&mut vec[index.as_usize() / sharded::SHARDS]
})
}
}

@@ -1090,9 +1152,8 @@ impl DepGraphData {
#[cfg(debug_assertions)]
{
if let Some(target) = task_deps.node {
let data = self.current.data.lock();
if let Some(ref forbidden_edge) = self.current.forbidden_edge {
let source = data[source].node;
let source = self.current.data(source).node;
if forbidden_edge.test(&source, &target) {
bug!("forbidden edge {:?} -> {:?} created",
source,
5 changes: 5 additions & 0 deletions src/librustc_data_structures/sharded.rs
@@ -60,6 +60,11 @@ impl<T> Sharded<T> {
}
}

#[inline]
Contributor: Can you add a doc-comment here? Further, I feel like I would like this function to encapsulate both the modulo and the division operations (I think I left this feedback on some other PR before).

I'd like to see the API be:

    /// Index into a sharded vector. The lower-order bits of `index`
    /// are used to determine the shard, and the higher-order bits
    /// are used to select the index within the shard.
    ///
    /// Returns:
    /// * a reference to the shard, `&Lock<T>`
    /// * the index within the shard, a `usize`
    pub fn get_shard_by_index(&self, index: usize) -> (&Lock<T>, usize)

Contributor: Obviously this would affect the callers, which would no longer hard-code the `/` operation.
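A sketch of how that suggested signature might be filled in, assuming the existing `shards` field and `SHARDS` constant in `sharded.rs` (this is not code from the PR):

    impl<T> Sharded<T> {
        /// Index into a sharded vector: the low-order bits of `index` select
        /// the shard, and the high-order bits select the position within it.
        /// Returns the shard's lock together with the index inside that shard.
        #[inline]
        pub fn get_shard_by_index(&self, index: usize) -> (&Lock<T>, usize) {
            (&self.shards[index % SHARDS].0, index / SHARDS)
        }
    }

The version the PR actually adds (below) returns only the shard and leaves the division to each caller.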

pub fn get_shard_by_index(&self, index: usize) -> &Lock<T> {
&self.shards[index % SHARDS].0
}

#[inline]
pub fn get_shard_by_value<K: Hash + ?Sized>(&self, val: &K) -> &Lock<T> {
if SHARDS == 1 {