| //! This module defines the `DepNode` type which the compiler uses to represent |
| //! nodes in the dependency graph. |
| //! |
| //! A `DepNode` consists of a `DepKind` (which |
| //! specifies the kind of thing it represents, like a piece of HIR, MIR, etc) |
| //! and a `Fingerprint`, a 128-bit hash value the exact meaning of which |
| //! depends on the node's `DepKind`. Together, the kind and the fingerprint |
| //! fully identify a dependency node, even across multiple compilation sessions. |
| //! In other words, the value of the fingerprint does not depend on anything |
| //! that is specific to a given compilation session, like an unpredictable |
| //! interning key (e.g., NodeId, DefId, Symbol) or the numeric value of a |
| //! pointer. The concept behind this could be compared to how git commit hashes |
| //! uniquely identify a given commit and has a few advantages: |
| //! |
| //! * A `DepNode` can simply be serialized to disk and loaded in another session |
| //! without the need to do any "rebasing" (like we have to do for Spans and |
| //! NodeIds) or "retracing" (like we had to do for `DefId` in earlier |
| //! implementations of the dependency graph). |
| //! * A `Fingerprint` is just a bunch of bits, which allows `DepNode` to |
| //! implement `Copy`, `Sync`, `Send`, `Freeze`, etc. |
| //! * Since we just have a bit pattern, `DepNode` can be mapped from disk into |
| //! memory without any post-processing (e.g., "abomination-style" pointer |
| //! reconstruction). |
| //! * Because a `DepNode` is self-contained, we can instantiate `DepNodes` that |
| //! refer to things that do not exist anymore. In previous implementations |
| //! `DepNode` contained a `DefId`. A `DepNode` referring to something that |
| //! had been removed between the previous and the current compilation session |
| //! could not be instantiated because the current compilation session |
| //! contained no `DefId` for thing that had been removed. |
| //! |
| //! `DepNode` definition happens in the `define_dep_nodes!()` macro. This macro |
| //! defines the `DepKind` enum. Each `DepKind` has its own parameters that are |
| //! needed at runtime in order to construct a valid `DepNode` fingerprint. |
| //! However, only `CompileCodegenUnit` is constructed explicitly (with |
| //! `make_compile_codegen_unit`). |
| //! |
| //! Because the macro sees what parameters a given `DepKind` requires, it can |
| //! "infer" some properties for each kind of `DepNode`: |
| //! |
| //! * Whether a `DepNode` of a given kind has any parameters at all. Some |
| //! `DepNode`s could represent global concepts with only one value. |
| //! * Whether it is possible, in principle, to reconstruct a query key from a |
| //! given `DepNode`. Many `DepKind`s only require a single `DefId` parameter, |
| //! in which case it is possible to map the node's fingerprint back to the |
| //! `DefId` it was computed from. In other cases, too much information gets |
| //! lost during fingerprint computation. |
| //! |
| //! `make_compile_codegen_unit`, together with `DepNode::new()`, ensures that only |
| //! valid `DepNode` instances can be constructed. For example, the API does not |
| //! allow for constructing parameterless `DepNode`s with anything other |
| //! than a zeroed out fingerprint. More generally speaking, it relieves the |
| //! user of the `DepNode` API of having to know how to compute the expected |
| //! fingerprint for a given set of node parameters. |
| |
| use crate::ty::TyCtxt; |
| |
| use rustc_data_structures::fingerprint::Fingerprint; |
| use rustc_hir::def_id::{CrateNum, DefId, LocalDefId, CRATE_DEF_INDEX}; |
| use rustc_hir::definitions::DefPathHash; |
| use rustc_hir::HirId; |
| use rustc_span::symbol::Symbol; |
| use rustc_span::DUMMY_SP; |
| use std::hash::Hash; |
| |
| pub use rustc_query_system::dep_graph::{DepContext, DepNodeParams}; |
| |
| /// This struct stores metadata about each DepKind. |
| /// |
| /// Information is retrieved by indexing the `DEP_KINDS` array using the integer value |
| /// of the `DepKind`. Overall, this allows to implement `DepContext` using this manual |
| /// jump table instead of large matches. |
| pub struct DepKindStruct { |
| /// Whether the DepNode has parameters (query keys). |
| pub(super) has_params: bool, |
| |
| /// Anonymous queries cannot be replayed from one compiler invocation to the next. |
| /// When their result is needed, it is recomputed. They are useful for fine-grained |
| /// dependency tracking, and caching within one compiler invocation. |
| pub(super) is_anon: bool, |
| |
| /// Eval-always queries do not track their dependencies, and are always recomputed, even if |
| /// their inputs have not changed since the last compiler invocation. The result is still |
| /// cached within one compiler invocation. |
| pub(super) is_eval_always: bool, |
| |
| /// Whether the query key can be recovered from the hashed fingerprint. |
| /// See [DepNodeParams] trait for the behaviour of each key type. |
| // FIXME: Make this a simple boolean once DepNodeParams::can_reconstruct_query_key |
| // can be made a specialized associated const. |
| can_reconstruct_query_key: fn() -> bool, |
| |
| /// The red/green evaluation system will try to mark a specific DepNode in the |
| /// dependency graph as green by recursively trying to mark the dependencies of |
| /// that `DepNode` as green. While doing so, it will sometimes encounter a `DepNode` |
| /// where we don't know if it is red or green and we therefore actually have |
| /// to recompute its value in order to find out. Since the only piece of |
| /// information that we have at that point is the `DepNode` we are trying to |
| /// re-evaluate, we need some way to re-run a query from just that. This is what |
| /// `force_from_dep_node()` implements. |
| /// |
| /// In the general case, a `DepNode` consists of a `DepKind` and an opaque |
| /// GUID/fingerprint that will uniquely identify the node. This GUID/fingerprint |
| /// is usually constructed by computing a stable hash of the query-key that the |
| /// `DepNode` corresponds to. Consequently, it is not in general possible to go |
| /// back from hash to query-key (since hash functions are not reversible). For |
| /// this reason `force_from_dep_node()` is expected to fail from time to time |
| /// because we just cannot find out, from the `DepNode` alone, what the |
| /// corresponding query-key is and therefore cannot re-run the query. |
| /// |
| /// The system deals with this case letting `try_mark_green` fail which forces |
| /// the root query to be re-evaluated. |
| /// |
| /// Now, if `force_from_dep_node()` would always fail, it would be pretty useless. |
| /// Fortunately, we can use some contextual information that will allow us to |
| /// reconstruct query-keys for certain kinds of `DepNode`s. In particular, we |
| /// enforce by construction that the GUID/fingerprint of certain `DepNode`s is a |
| /// valid `DefPathHash`. Since we also always build a huge table that maps every |
| /// `DefPathHash` in the current codebase to the corresponding `DefId`, we have |
| /// everything we need to re-run the query. |
| /// |
| /// Take the `mir_promoted` query as an example. Like many other queries, it |
| /// just has a single parameter: the `DefId` of the item it will compute the |
| /// validated MIR for. Now, when we call `force_from_dep_node()` on a `DepNode` |
| /// with kind `MirValidated`, we know that the GUID/fingerprint of the `DepNode` |
| /// is actually a `DefPathHash`, and can therefore just look up the corresponding |
| /// `DefId` in `tcx.def_path_hash_to_def_id`. |
| /// |
| /// When you implement a new query, it will likely have a corresponding new |
| /// `DepKind`, and you'll have to support it here in `force_from_dep_node()`. As |
| /// a rule of thumb, if your query takes a `DefId` or `LocalDefId` as sole parameter, |
| /// then `force_from_dep_node()` should not fail for it. Otherwise, you can just |
| /// add it to the "We don't have enough information to reconstruct..." group in |
| /// the match below. |
| pub(super) force_from_dep_node: fn(tcx: TyCtxt<'_>, dep_node: &DepNode) -> bool, |
| |
| /// Invoke a query to put the on-disk cached value in memory. |
| pub(super) try_load_from_on_disk_cache: fn(TyCtxt<'_>, &DepNode), |
| } |
| |
| impl std::ops::Deref for DepKind { |
| type Target = DepKindStruct; |
| fn deref(&self) -> &DepKindStruct { |
| &DEP_KINDS[*self as usize] |
| } |
| } |
| |
| impl DepKind { |
| #[inline(always)] |
| pub fn can_reconstruct_query_key(&self) -> bool { |
| // Only fetch the DepKindStruct once. |
| let data: &DepKindStruct = &**self; |
| if data.is_anon { |
| return false; |
| } |
| |
| (data.can_reconstruct_query_key)() |
| } |
| } |
| |
| // erase!() just makes tokens go away. It's used to specify which macro argument |
| // is repeated (i.e., which sub-expression of the macro we are in) but don't need |
| // to actually use any of the arguments. |
| macro_rules! erase { |
| ($x:tt) => {{}}; |
| } |
| |
| macro_rules! is_anon_attr { |
| (anon) => { |
| true |
| }; |
| ($attr:ident) => { |
| false |
| }; |
| } |
| |
| macro_rules! is_eval_always_attr { |
| (eval_always) => { |
| true |
| }; |
| ($attr:ident) => { |
| false |
| }; |
| } |
| |
| macro_rules! contains_anon_attr { |
| ($($attr:ident $(($($attr_args:tt)*))* ),*) => ({$(is_anon_attr!($attr) | )* false}); |
| } |
| |
| macro_rules! contains_eval_always_attr { |
| ($($attr:ident $(($($attr_args:tt)*))* ),*) => ({$(is_eval_always_attr!($attr) | )* false}); |
| } |
| |
| #[allow(non_upper_case_globals)] |
| pub mod dep_kind { |
| use super::*; |
| use crate::ty::query::{queries, query_keys}; |
| use rustc_query_system::query::{force_query, QueryDescription}; |
| |
| // We use this for most things when incr. comp. is turned off. |
| pub const Null: DepKindStruct = DepKindStruct { |
| has_params: false, |
| is_anon: false, |
| is_eval_always: false, |
| |
| can_reconstruct_query_key: || true, |
| force_from_dep_node: |_, dep_node| bug!("force_from_dep_node: encountered {:?}", dep_node), |
| try_load_from_on_disk_cache: |_, _| {}, |
| }; |
| |
| pub const TraitSelect: DepKindStruct = DepKindStruct { |
| has_params: false, |
| is_anon: true, |
| is_eval_always: false, |
| |
| can_reconstruct_query_key: || true, |
| force_from_dep_node: |_, _| false, |
| try_load_from_on_disk_cache: |_, _| {}, |
| }; |
| |
| pub const CompileCodegenUnit: DepKindStruct = DepKindStruct { |
| has_params: true, |
| is_anon: false, |
| is_eval_always: false, |
| |
| can_reconstruct_query_key: || false, |
| force_from_dep_node: |_, _| false, |
| try_load_from_on_disk_cache: |_, _| {}, |
| }; |
| |
| macro_rules! define_query_dep_kinds { |
| ($( |
| [$($attrs:tt)*] |
| $variant:ident $(( $tuple_arg_ty:ty $(,)? ))* |
| ,)*) => ( |
| $(pub const $variant: DepKindStruct = { |
| const has_params: bool = $({ erase!($tuple_arg_ty); true } |)* false; |
| const is_anon: bool = contains_anon_attr!($($attrs)*); |
| const is_eval_always: bool = contains_eval_always_attr!($($attrs)*); |
| |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| <query_keys::$variant<'_> as DepNodeParams<TyCtxt<'_>>> |
| ::can_reconstruct_query_key() |
| } |
| |
| fn recover<'tcx>(tcx: TyCtxt<'tcx>, dep_node: &DepNode) -> Option<query_keys::$variant<'tcx>> { |
| <query_keys::$variant<'_> as DepNodeParams<TyCtxt<'_>>>::recover(tcx, dep_node) |
| } |
| |
| fn force_from_dep_node(tcx: TyCtxt<'_>, dep_node: &DepNode) -> bool { |
| if is_anon { |
| return false; |
| } |
| |
| if !can_reconstruct_query_key() { |
| return false; |
| } |
| |
| if let Some(key) = recover(tcx, dep_node) { |
| force_query::<queries::$variant<'_>, _>( |
| tcx, |
| key, |
| DUMMY_SP, |
| *dep_node |
| ); |
| return true; |
| } |
| |
| false |
| } |
| |
| fn try_load_from_on_disk_cache(tcx: TyCtxt<'_>, dep_node: &DepNode) { |
| if is_anon { |
| return |
| } |
| |
| if !can_reconstruct_query_key() { |
| return |
| } |
| |
| debug_assert!(tcx.dep_graph |
| .node_color(dep_node) |
| .map(|c| c.is_green()) |
| .unwrap_or(false)); |
| |
| let key = recover(tcx, dep_node).unwrap_or_else(|| panic!("Failed to recover key for {:?} with hash {}", dep_node, dep_node.hash)); |
| if queries::$variant::cache_on_disk(tcx, &key, None) { |
| let _ = tcx.$variant(key); |
| } |
| } |
| |
| DepKindStruct { |
| has_params, |
| is_anon, |
| is_eval_always, |
| can_reconstruct_query_key, |
| force_from_dep_node, |
| try_load_from_on_disk_cache, |
| } |
| };)* |
| ); |
| } |
| |
| rustc_dep_node_append!([define_query_dep_kinds!][]); |
| } |
| |
| macro_rules! define_dep_nodes { |
| (<$tcx:tt> |
| $( |
| [$($attrs:tt)*] |
| $variant:ident $(( $tuple_arg_ty:ty $(,)? ))* |
| ,)* |
| ) => ( |
| static DEP_KINDS: &[DepKindStruct] = &[ $(dep_kind::$variant),* ]; |
| |
| /// This enum serves as an index into the `DEP_KINDS` array. |
| #[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Encodable, Decodable)] |
| #[allow(non_camel_case_types)] |
| pub enum DepKind { |
| $($variant),* |
| } |
| |
| fn dep_kind_from_label_string(label: &str) -> Result<DepKind, ()> { |
| match label { |
| $(stringify!($variant) => Ok(DepKind::$variant),)* |
| _ => Err(()), |
| } |
| } |
| |
| /// Contains variant => str representations for constructing |
| /// DepNode groups for tests. |
| #[allow(dead_code, non_upper_case_globals)] |
| pub mod label_strs { |
| $( |
| pub const $variant: &str = stringify!($variant); |
| )* |
| } |
| ); |
| } |
| |
| rustc_dep_node_append!([define_dep_nodes!][ <'tcx> |
| // We use this for most things when incr. comp. is turned off. |
| [] Null, |
| |
| [anon] TraitSelect, |
| |
| // WARNING: if `Symbol` is changed, make sure you update `make_compile_codegen_unit` below. |
| [] CompileCodegenUnit(Symbol), |
| ]); |
| |
| // WARNING: `construct` is generic and does not know that `CompileCodegenUnit` takes `Symbol`s as keys. |
| // Be very careful changing this type signature! |
| crate fn make_compile_codegen_unit(tcx: TyCtxt<'_>, name: Symbol) -> DepNode { |
| DepNode::construct(tcx, DepKind::CompileCodegenUnit, &name) |
| } |
| |
| pub type DepNode = rustc_query_system::dep_graph::DepNode<DepKind>; |
| |
| // We keep a lot of `DepNode`s in memory during compilation. It's not |
| // required that their size stay the same, but we don't want to change |
| // it inadvertently. This assert just ensures we're aware of any change. |
| #[cfg(any(target_arch = "x86", target_arch = "x86_64"))] |
| static_assert_size!(DepNode, 17); |
| |
| #[cfg(not(any(target_arch = "x86", target_arch = "x86_64")))] |
| static_assert_size!(DepNode, 24); |
| |
| pub trait DepNodeExt: Sized { |
| /// Construct a DepNode from the given DepKind and DefPathHash. This |
| /// method will assert that the given DepKind actually requires a |
| /// single DefId/DefPathHash parameter. |
| fn from_def_path_hash(def_path_hash: DefPathHash, kind: DepKind) -> Self; |
| |
| /// Extracts the DefId corresponding to this DepNode. This will work |
| /// if two conditions are met: |
| /// |
| /// 1. The Fingerprint of the DepNode actually is a DefPathHash, and |
| /// 2. the item that the DefPath refers to exists in the current tcx. |
| /// |
| /// Condition (1) is determined by the DepKind variant of the |
| /// DepNode. Condition (2) might not be fulfilled if a DepNode |
| /// refers to something from the previous compilation session that |
| /// has been removed. |
| fn extract_def_id(&self, tcx: TyCtxt<'_>) -> Option<DefId>; |
| |
| /// Used in testing |
| fn from_label_string(label: &str, def_path_hash: DefPathHash) -> Result<Self, ()>; |
| |
| /// Used in testing |
| fn has_label_string(label: &str) -> bool; |
| } |
| |
| impl DepNodeExt for DepNode { |
| /// Construct a DepNode from the given DepKind and DefPathHash. This |
| /// method will assert that the given DepKind actually requires a |
| /// single DefId/DefPathHash parameter. |
| fn from_def_path_hash(def_path_hash: DefPathHash, kind: DepKind) -> DepNode { |
| debug_assert!(kind.can_reconstruct_query_key() && kind.has_params); |
| DepNode { kind, hash: def_path_hash.0.into() } |
| } |
| |
| /// Extracts the DefId corresponding to this DepNode. This will work |
| /// if two conditions are met: |
| /// |
| /// 1. The Fingerprint of the DepNode actually is a DefPathHash, and |
| /// 2. the item that the DefPath refers to exists in the current tcx. |
| /// |
| /// Condition (1) is determined by the DepKind variant of the |
| /// DepNode. Condition (2) might not be fulfilled if a DepNode |
| /// refers to something from the previous compilation session that |
| /// has been removed. |
| fn extract_def_id(&self, tcx: TyCtxt<'tcx>) -> Option<DefId> { |
| if self.kind.can_reconstruct_query_key() { |
| tcx.queries |
| .on_disk_cache |
| .as_ref()? |
| .def_path_hash_to_def_id(tcx, DefPathHash(self.hash.into())) |
| } else { |
| None |
| } |
| } |
| |
| /// Used in testing |
| fn from_label_string(label: &str, def_path_hash: DefPathHash) -> Result<DepNode, ()> { |
| let kind = dep_kind_from_label_string(label)?; |
| |
| if !kind.can_reconstruct_query_key() { |
| return Err(()); |
| } |
| |
| if kind.has_params { |
| Ok(DepNode::from_def_path_hash(def_path_hash, kind)) |
| } else { |
| Ok(DepNode::new_no_params(kind)) |
| } |
| } |
| |
| /// Used in testing |
| fn has_label_string(label: &str) -> bool { |
| dep_kind_from_label_string(label).is_ok() |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for () { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| true |
| } |
| |
| fn to_fingerprint(&self, _: TyCtxt<'tcx>) -> Fingerprint { |
| Fingerprint::ZERO |
| } |
| |
| fn recover(_: TyCtxt<'tcx>, _: &DepNode) -> Option<Self> { |
| Some(()) |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for DefId { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| true |
| } |
| |
| fn to_fingerprint(&self, tcx: TyCtxt<'tcx>) -> Fingerprint { |
| let hash = tcx.def_path_hash(*self); |
| // If this is a foreign `DefId`, store its current value |
| // in the incremental cache. When we decode the cache, |
| // we will use the old DefIndex as an initial guess for |
| // a lookup into the crate metadata. |
| if !self.is_local() { |
| if let Some(cache) = &tcx.queries.on_disk_cache { |
| cache.store_foreign_def_id_hash(*self, hash); |
| } |
| } |
| hash.0 |
| } |
| |
| fn to_debug_str(&self, tcx: TyCtxt<'tcx>) -> String { |
| tcx.def_path_str(*self) |
| } |
| |
| fn recover(tcx: TyCtxt<'tcx>, dep_node: &DepNode) -> Option<Self> { |
| dep_node.extract_def_id(tcx) |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for LocalDefId { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| true |
| } |
| |
| fn to_fingerprint(&self, tcx: TyCtxt<'tcx>) -> Fingerprint { |
| self.to_def_id().to_fingerprint(tcx) |
| } |
| |
| fn to_debug_str(&self, tcx: TyCtxt<'tcx>) -> String { |
| self.to_def_id().to_debug_str(tcx) |
| } |
| |
| fn recover(tcx: TyCtxt<'tcx>, dep_node: &DepNode) -> Option<Self> { |
| dep_node.extract_def_id(tcx).map(|id| id.expect_local()) |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for CrateNum { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| true |
| } |
| |
| fn to_fingerprint(&self, tcx: TyCtxt<'tcx>) -> Fingerprint { |
| let def_id = DefId { krate: *self, index: CRATE_DEF_INDEX }; |
| def_id.to_fingerprint(tcx) |
| } |
| |
| fn to_debug_str(&self, tcx: TyCtxt<'tcx>) -> String { |
| tcx.crate_name(*self).to_string() |
| } |
| |
| fn recover(tcx: TyCtxt<'tcx>, dep_node: &DepNode) -> Option<Self> { |
| dep_node.extract_def_id(tcx).map(|id| id.krate) |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for (DefId, DefId) { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| false |
| } |
| |
| // We actually would not need to specialize the implementation of this |
| // method but it's faster to combine the hashes than to instantiate a full |
| // hashing context and stable-hashing state. |
| fn to_fingerprint(&self, tcx: TyCtxt<'tcx>) -> Fingerprint { |
| let (def_id_0, def_id_1) = *self; |
| |
| let def_path_hash_0 = tcx.def_path_hash(def_id_0); |
| let def_path_hash_1 = tcx.def_path_hash(def_id_1); |
| |
| def_path_hash_0.0.combine(def_path_hash_1.0) |
| } |
| |
| fn to_debug_str(&self, tcx: TyCtxt<'tcx>) -> String { |
| let (def_id_0, def_id_1) = *self; |
| |
| format!("({}, {})", tcx.def_path_debug_str(def_id_0), tcx.def_path_debug_str(def_id_1)) |
| } |
| } |
| |
| impl<'tcx> DepNodeParams<TyCtxt<'tcx>> for HirId { |
| #[inline(always)] |
| fn can_reconstruct_query_key() -> bool { |
| false |
| } |
| |
| // We actually would not need to specialize the implementation of this |
| // method but it's faster to combine the hashes than to instantiate a full |
| // hashing context and stable-hashing state. |
| fn to_fingerprint(&self, tcx: TyCtxt<'tcx>) -> Fingerprint { |
| let HirId { owner, local_id } = *self; |
| |
| let def_path_hash = tcx.def_path_hash(owner.to_def_id()); |
| let local_id = Fingerprint::from_smaller_hash(local_id.as_u32().into()); |
| |
| def_path_hash.0.combine(local_id) |
| } |
| } |