rust/compiler/rustc_query_system/src/dep_graph/serialized.rs

416 lines
15 KiB
Rust
Raw Normal View History

//! The data that we will serialize and deserialize.
2021-03-02 22:38:49 +01:00
use super::query::DepGraphQuery;
use super::{DepKind, DepNode, DepNodeIndex};
2020-03-18 10:25:22 +01:00
use rustc_data_structures::fingerprint::Fingerprint;
2021-03-02 22:38:49 +01:00
use rustc_data_structures::fx::FxHashMap;
use rustc_data_structures::sync::{AtomicU32, Lock, Lrc, Ordering};
2021-03-06 11:17:56 +01:00
use rustc_index::vec::IndexVec;
2021-03-02 22:38:49 +01:00
use rustc_serialize::opaque::{self, FileEncodeResult, FileEncoder, IntEncodedWithFixedSize};
2021-03-06 11:17:56 +01:00
use rustc_serialize::{Decodable, Decoder, Encodable};
2021-03-02 22:38:49 +01:00
use smallvec::SmallVec;
use std::convert::TryInto;
#[cfg(parallel_compiler)]
use {rustc_data_structures::sync::WorkerLocal, std::sync::mpsc, std::thread};
// The maximum value of `SerializedDepNodeIndex` leaves the upper two bits
// unused so that we can store multiple index types in `CompressedHybridIndex`,
// and use those bits to encode which index type it contains.
//
// NOTE(review): `0x7FFF_FFFF` clears only the single top bit of a `u32`
// (31 usable bits); leaving *two* bits free would need `0x3FFF_FFFF`.
// Confirm against `CompressedHybridIndex` which of the comment or the
// constant reflects the intended layout.
rustc_index::newtype_index! {
pub struct SerializedDepNodeIndex {
MAX = 0x7FFF_FFFF
}
}
/// Data for use when recompiling the **current crate**.
#[derive(Debug)]
2020-03-18 10:25:22 +01:00
pub struct SerializedDepGraph<K: DepKind> {
/// The set of all DepNodes in the graph
2020-03-18 10:25:22 +01:00
pub nodes: IndexVec<SerializedDepNodeIndex, DepNode<K>>,
/// The set of all Fingerprints in the graph. Each Fingerprint corresponds to
/// the DepNode at the same index in the nodes vector.
pub fingerprints: IndexVec<SerializedDepNodeIndex, Fingerprint>,
/// For each DepNode, stores the list of edges originating from that
/// DepNode. Encoded as a [start, end) pair indexing into edge_list_data,
/// which holds the actual DepNodeIndices of the target nodes.
pub edge_list_indices: IndexVec<SerializedDepNodeIndex, (u32, u32)>,
/// A flattened list of all edge targets in the graph. Edge sources are
/// implicit in edge_list_indices.
pub edge_list_data: Vec<SerializedDepNodeIndex>,
}
2020-03-18 10:25:22 +01:00
impl<K: DepKind> Default for SerializedDepGraph<K> {
fn default() -> Self {
SerializedDepGraph {
nodes: Default::default(),
fingerprints: Default::default(),
edge_list_indices: Default::default(),
edge_list_data: Default::default(),
}
}
}
impl<K: DepKind> SerializedDepGraph<K> {
#[inline]
2019-12-22 17:42:04 -05:00
pub fn edge_targets_from(&self, source: SerializedDepNodeIndex) -> &[SerializedDepNodeIndex] {
let targets = self.edge_list_indices[source];
&self.edge_list_data[targets.0 as usize..targets.1 as usize]
}
}
2021-03-02 22:38:49 +01:00
impl<'a, K: DepKind + Decodable<opaque::Decoder<'a>>> Decodable<opaque::Decoder<'a>>
for SerializedDepGraph<K>
{
#[instrument(skip(d))]
fn decode(d: &mut opaque::Decoder<'a>) -> Result<SerializedDepGraph<K>, String> {
let position = d.position();
// The last 16 bytes are the node count and edge count.
debug!("position: {:?}", d.position());
d.set_position(d.data.len() - 2 * IntEncodedWithFixedSize::ENCODED_SIZE);
debug!("position: {:?}", d.position());
let node_count = IntEncodedWithFixedSize::decode(d)?.0 as usize;
let edge_count = IntEncodedWithFixedSize::decode(d)?.0 as usize;
debug!(?node_count, ?edge_count);
debug!("position: {:?}", d.position());
d.set_position(position);
debug!("position: {:?}", d.position());
let mut nodes = IndexVec::with_capacity(node_count);
let mut fingerprints = IndexVec::with_capacity(node_count);
let mut edge_list_indices = IndexVec::with_capacity(node_count);
let mut edge_list_data = Vec::with_capacity(edge_count);
for _index in 0..node_count {
2021-03-06 11:17:56 +01:00
d.read_struct("NodeInfo", 3, |d| {
let dep_node: DepNode<K> = d.read_struct_field("node", 0, Decodable::decode)?;
let _i: SerializedDepNodeIndex = nodes.push(dep_node);
debug_assert_eq!(_i.index(), _index);
let fingerprint: Fingerprint =
d.read_struct_field("fingerprint", 1, Decodable::decode)?;
let _i: SerializedDepNodeIndex = fingerprints.push(fingerprint);
debug_assert_eq!(_i.index(), _index);
d.read_struct_field("edges", 2, |d| {
d.read_seq(|d, len| {
let start = edge_list_data.len().try_into().unwrap();
for e in 0..len {
let edge = d.read_seq_elt(e, Decodable::decode)?;
edge_list_data.push(edge);
}
let end = edge_list_data.len().try_into().unwrap();
let _i: SerializedDepNodeIndex = edge_list_indices.push((start, end));
debug_assert_eq!(_i.index(), _index);
Ok(())
})
})
})?;
2021-03-02 22:38:49 +01:00
}
Ok(SerializedDepGraph { nodes, fingerprints, edge_list_indices, edge_list_data })
}
}
#[derive(Debug, Encodable, Decodable)]
2021-03-06 11:17:56 +01:00
pub struct NodeInfo<K: DepKind> {
2021-03-02 22:38:49 +01:00
node: DepNode<K>,
fingerprint: Fingerprint,
2021-03-06 11:17:56 +01:00
edges: SmallVec<[DepNodeIndex; 8]>,
2021-03-02 22:38:49 +01:00
}
/// Running tally for a single dep-node kind, updated once per encoded node.
struct Stat<K: DepKind> {
/// The dep-node kind this tally belongs to.
kind: K,
/// Number of nodes of this kind encoded so far.
node_counter: u64,
/// Sum of the edge counts of all nodes of this kind encoded so far.
edge_counter: u64,
}
/// Aggregated encoding statistics: one `Stat` per dep-node kind plus
/// graph-wide totals.
struct Stats<K: DepKind> {
/// Per-kind tallies, keyed by the kind they describe.
stats: FxHashMap<K, Stat<K>>,
/// Number of nodes encoded so far, across all kinds.
total_node_count: usize,
/// Number of edges encoded so far, across all kinds.
total_edge_count: usize,
}
#[instrument(skip(encoder, _record_graph, record_stats))]
fn encode_node<K: DepKind>(
encoder: &mut FileEncoder,
_index: DepNodeIndex,
2021-03-06 11:17:56 +01:00
node: &NodeInfo<K>,
2021-03-02 22:38:49 +01:00
_record_graph: &Option<Lrc<Lock<DepGraphQuery<K>>>>,
record_stats: &Option<Lrc<Lock<Stats<K>>>>,
) -> FileEncodeResult {
#[cfg(debug_assertions)]
if let Some(record_graph) = &_record_graph {
record_graph.lock().push(_index, node.node, &node.edges);
}
if let Some(record_stats) = &record_stats {
let mut stats = record_stats.lock();
let kind = node.node.kind;
let edge_count = node.edges.len();
let stat =
stats.stats.entry(kind).or_insert(Stat { kind, node_counter: 0, edge_counter: 0 });
stat.node_counter += 1;
stat.edge_counter += edge_count as u64;
stats.total_node_count += 1;
stats.total_edge_count += edge_count;
}
debug!(?_index, ?node);
node.encode(encoder)
}
/// Writes the footer of the serialized graph and flushes the encoder.
///
/// The footer is the node count followed by the edge count, each as an
/// `IntEncodedWithFixedSize`. The encoder is taken by value, so nothing can be
/// appended after the counts once this function returns.
///
/// Panics if either count does not fit the fixed-size integer type.
fn encode_counts(
    mut encoder: FileEncoder,
    node_count: usize,
    edge_count: usize,
) -> FileEncodeResult {
    let (node_count, edge_count) =
        (node_count.try_into().unwrap(), edge_count.try_into().unwrap());
    debug!(?node_count, ?edge_count);

    debug!("position: {:?}", encoder.position());
    IntEncodedWithFixedSize(node_count).encode(&mut encoder)?;
    IntEncodedWithFixedSize(edge_count).encode(&mut encoder)?;
    debug!("position: {:?}", encoder.position());

    // Push everything out now; the encoder itself is dropped on return.
    encoder.flush()
}
/// Streams dep-graph nodes to a `FileEncoder` as they are created
/// (non-parallel compiler variant: nodes are encoded inline by `send`).
#[cfg(not(parallel_compiler))]
pub struct GraphEncoder<K: DepKind> {
/// The encoder, the running total of edges seen so far, and the first
/// error (if any) returned while encoding a node.
status: Lock<(FileEncoder, usize, FileEncodeResult)>,
/// Source of the next `DepNodeIndex`; its final value is the node count.
counter: AtomicU32,
/// In-memory copy of the graph, present only when recording was requested
/// and debug assertions are enabled.
record_graph: Option<Lrc<Lock<DepGraphQuery<K>>>>,
/// Per-kind statistics, present only when recording was requested.
record_stats: Option<Lrc<Lock<Stats<K>>>>,
}
/// Streams dep-graph nodes to a `FileEncoder` as they are created
/// (parallel compiler variant: nodes are sent over a channel to a dedicated
/// encoding thread).
#[cfg(parallel_compiler)]
pub struct GraphEncoder<K: DepKind> {
    /// Per-worker clone of the channel sender feeding the encoding thread.
    send: WorkerLocal<mpsc::Sender<(DepNodeIndex, NodeInfo<K>)>>,
    /// Handle of the encoding thread; joining it yields the overall result.
    thread: thread::JoinHandle<FileEncodeResult>,
    /// Source of the next `DepNodeIndex`.
    counter: AtomicU32,
    /// In-memory copy of the graph, present only when recording was requested
    /// and debug assertions are enabled.
    record_graph: Option<Lrc<Lock<DepGraphQuery<K>>>>,
    /// Per-kind statistics, present only when recording was requested.
    record_stats: Option<Lrc<Lock<Stats<K>>>>,
}
impl<K: DepKind + Encodable<FileEncoder>> GraphEncoder<K> {
    /// Creates an encoder that writes nodes to `encoder`.
    ///
    /// * `prev_node_count` - forwarded to `DepGraphQuery::new` when the graph
    ///   is being recorded.
    /// * `record_graph` - keep an in-memory copy of the graph; honoured only
    ///   when debug assertions are enabled.
    /// * `record_stats` - collect per-kind node and edge statistics.
    ///
    /// With the parallel compiler this also spawns the thread that performs
    /// the actual encoding.
    pub fn new(
        encoder: FileEncoder,
        prev_node_count: usize,
        record_graph: bool,
        record_stats: bool,
    ) -> Self {
        let record_graph = if cfg!(debug_assertions) && record_graph {
            Some(Lrc::new(Lock::new(DepGraphQuery::new(prev_node_count))))
        } else {
            None
        };
        let record_stats = if record_stats {
            Some(Lrc::new(Lock::new(Stats {
                stats: FxHashMap::default(),
                total_node_count: 0,
                total_edge_count: 0,
            })))
        } else {
            None
        };
        let counter = AtomicU32::new(0);

        #[cfg(not(parallel_compiler))]
        {
            // (encoder, edge count so far, first encoding error if any)
            let status = Lock::new((encoder, 0, Ok(())));
            GraphEncoder { status, counter, record_graph, record_stats }
        }

        #[cfg(parallel_compiler)]
        {
            let (send, recv) = mpsc::channel();
            let thread = {
                // The encoding thread gets its own handles to the bookkeeping.
                let record_graph = record_graph.clone();
                let record_stats = record_stats.clone();
                thread::spawn(move || {
                    encode_graph(encoder, recv, |encoder, index, node| {
                        encode_node(encoder, index, node, &record_graph, &record_stats)
                    })
                })
            };
            let send = WorkerLocal::new(move |_| send.clone());

            GraphEncoder { send, thread, counter, record_graph, record_stats }
        }
    }

    /// Calls `f` with the recorded query graph, if one is being recorded.
    pub(crate) fn with_query(&self, f: impl Fn(&DepGraphQuery<K>)) {
        if let Some(record_graph) = &self.record_graph {
            f(&record_graph.lock())
        }
    }

    /// Prints the collected dep-graph statistics to stderr.
    ///
    /// Does nothing unless statistics are being recorded. The two read counts
    /// are supplied by the caller and are only printed when debug assertions
    /// are enabled. Node kinds are listed by descending node count.
    pub(crate) fn print_incremental_info(
        &self,
        total_read_count: u64,
        total_duplicate_read_count: u64,
    ) {
        if let Some(record_stats) = &self.record_stats {
            let record_stats = record_stats.lock();

            let mut stats: Vec<_> = record_stats.stats.values().collect();
            // Most frequent kinds first. `Reverse` avoids the lossy
            // `u64 -> i64` cast and negation; the sort stays stable.
            stats.sort_by_key(|s| std::cmp::Reverse(s.node_counter));

            const SEPARATOR: &str = "[incremental] --------------------------------\
                                     ----------------------------------------------\
                                     ------------";

            eprintln!("[incremental]");
            eprintln!("[incremental] DepGraph Statistics");
            eprintln!("{}", SEPARATOR);
            eprintln!("[incremental]");
            eprintln!("[incremental] Total Node Count: {}", record_stats.total_node_count);
            eprintln!("[incremental] Total Edge Count: {}", record_stats.total_edge_count);

            if cfg!(debug_assertions) {
                eprintln!("[incremental] Total Edge Reads: {}", total_read_count);
                eprintln!(
                    "[incremental] Total Duplicate Edge Reads: {}",
                    total_duplicate_read_count
                );
            }

            eprintln!("[incremental]");
            eprintln!(
                "[incremental] {:<36}| {:<17}| {:<12}| {:<17}|",
                "Node Kind", "Node Frequency", "Node Count", "Avg. Edge Count"
            );
            eprintln!("{}", SEPARATOR);

            for stat in stats {
                let node_kind_ratio =
                    (100.0 * (stat.node_counter as f64)) / (record_stats.total_node_count as f64);
                let node_kind_avg_edges = (stat.edge_counter as f64) / (stat.node_counter as f64);

                eprintln!(
                    "[incremental] {:<36}|{:>16.1}% |{:>12} |{:>17.1} |",
                    format!("{:?}", stat.kind),
                    node_kind_ratio,
                    stat.node_counter,
                    node_kind_avg_edges,
                );
            }

            eprintln!("{}", SEPARATOR);
            eprintln!("[incremental]");
        }
    }
}
#[cfg(not(parallel_compiler))]
impl<K: DepKind + Encodable<FileEncoder>> GraphEncoder<K> {
    /// Assigns the next `DepNodeIndex` to the node and encodes it right away.
    ///
    /// The edge total is always updated. Once an encoding error has been
    /// recorded, later nodes are no longer written and the first error is
    /// kept until `finish` reports it.
    pub(crate) fn send(
        &self,
        node: DepNode<K>,
        fingerprint: Fingerprint,
        edges: SmallVec<[DepNodeIndex; 8]>,
    ) -> DepNodeIndex {
        let index = DepNodeIndex::from_u32(self.counter.fetch_add(1, Ordering::SeqCst));

        let mut status = self.status.lock();
        let (encoder, edge_count, result) = &mut *status;

        *edge_count += edges.len();
        // Only keep encoding while no earlier node has failed.
        if result.is_ok() {
            let info = NodeInfo { node, fingerprint, edges };
            *result = encode_node(encoder, index, &info, &self.record_graph, &self.record_stats);
        }

        index
    }

    /// Reports the first encoding error, if any; otherwise writes the node and
    /// edge counts after the last node and flushes the encoder.
    pub fn finish(self) -> FileEncodeResult {
        let (encoder, edge_count, result) = self.status.into_inner();
        result?;

        // Every `send` bumped the counter once, so it equals the node count.
        let node_count = self.counter.into_inner() as usize;
        encode_counts(encoder, node_count, edge_count)
    }
}
#[cfg(parallel_compiler)]
impl<K: DepKind + Encodable<FileEncoder>> GraphEncoder<K> {
    /// Assigns the next `DepNodeIndex` to the node and hands it to the
    /// encoding thread.
    ///
    /// Panics if the channel to the encoding thread is closed.
    pub(crate) fn send(
        &self,
        node: DepNode<K>,
        fingerprint: Fingerprint,
        edges: SmallVec<[DepNodeIndex; 8]>,
    ) -> DepNodeIndex {
        let node = NodeInfo { node, fingerprint, edges };
        let index = self.counter.fetch_add(1, Ordering::SeqCst);
        let index = DepNodeIndex::from_u32(index);
        self.send.send((index, node)).unwrap();
        index
    }

    /// Closes the channel and waits for the encoding thread, returning its
    /// result.
    ///
    /// Panics if the encoding thread itself panicked.
    pub fn finish(self) -> FileEncodeResult {
        // Dropping the senders lets the receiving loop on the encoding thread
        // terminate.
        std::mem::drop(self.send);
        self.thread.join().unwrap()
    }
}
/// Body of the encoding thread: encodes every node received on `recv`, in
/// index order, then writes the node and edge counts.
///
/// * `encoder` - destination of the serialized graph.
/// * `recv` - channel on which `(index, node)` pairs arrive.
/// * `process` - callback that encodes one node into the encoder.
///
/// Returns the first error produced by `process`, or otherwise the result of
/// writing the counts.
#[cfg(parallel_compiler)]
#[instrument(skip(encoder, recv, process))]
fn encode_graph<K: DepKind + Encodable<FileEncoder>>(
    mut encoder: FileEncoder,
    recv: mpsc::Receiver<(DepNodeIndex, NodeInfo<K>)>,
    process: impl Fn(&mut FileEncoder, DepNodeIndex, &NodeInfo<K>) -> FileEncodeResult,
) -> FileEncodeResult {
    let mut edge_count: usize = 0;

    let node_count: usize = ordered_recv(recv, |index, node| {
        edge_count += node.edges.len();
        process(&mut encoder, index, node)
    })?;

    encode_counts(encoder, node_count, edge_count)
}
/// Since there are multiple producers assigning the DepNodeIndex using an atomic,
/// the messages may not arrive in order. This function sorts them as they come.
///
/// `f` is called exactly once per message, in increasing index order starting
/// at 0. Messages that arrive early are parked in a buffer until their turn.
///
/// Returns the number of messages delivered to `f` once the channel is closed,
/// or the first error returned by `f`.
///
/// Panics if a message arrives with an index that has already been delivered.
#[cfg(parallel_compiler)]
fn ordered_recv<K: DepKind + Encodable<opaque::FileEncoder>>(
    recv: mpsc::Receiver<(DepNodeIndex, NodeInfo<K>)>,
    mut f: impl FnMut(DepNodeIndex, &NodeInfo<K>) -> FileEncodeResult,
) -> Result<usize, std::io::Error> {
    let mut pending = Vec::<(DepNodeIndex, _)>::new();
    let mut expected = DepNodeIndex::new(0);

    // INVARIANT: No message can arrive with an index less than `expected`.
    'outer: loop {
        // Deliver every parked message that has become next in line. Sorting
        // first lets one pass pick up a whole consecutive run, since
        // `expected` advances while the filter walks the buffer.
        pending.sort_by_key(|n| n.0);
        for (index, node) in pending.drain_filter(|(index, _)| {
            if *index == expected {
                expected.increment_by(1);
                true
            } else {
                false
            }
        }) {
            f(index, &node)?;
        }

        while let Ok((index, node)) = recv.recv() {
            if index > expected {
                // Too early: park it until the gap before it is filled.
                pending.push((index, node));
            } else if index == expected {
                f(index, &node)?;
                expected.increment_by(1);
                // Parked messages may now be deliverable; re-scan them.
                continue 'outer;
            } else {
                panic!("Unexpected index {:?} while waiting for {:?}", index, expected);
            }
        }

        // `recv` failed: every sender is gone and the channel is drained.
        break;
    }

    Ok(expected.as_u32() as usize)
}