Skip to content

Commit 300bd13

Browse files
committed
Auto merge of rust-lang#122568 - RalfJung:mentioned-items, r=<try>
recursively evaluate the constants in everything that is 'mentioned' This is another attempt at fixing rust-lang#107503. The previous attempt at rust-lang#112879 seems stuck in figuring out where the [perf regression](https://perf.rust-lang.org/compare.html?start=c55d1ee8d4e3162187214692229a63c2cc5e0f31&end=ec8de1ebe0d698b109beeaaac83e60f4ef8bb7d1&stat=instructions:u) comes from. In rust-lang#122258 I learned some things, which informed the approach this PR is taking. Quoting from the new collector docs, which explain the high-level idea: ```rust //! One important role of collection is to evaluate all constants that are used by all the items //! which are being collected. Codegen can then rely on only encountering constants that evaluate //! successfully, and if a constant fails to evaluate, the collector has much better context to be //! able to show where this constant comes up. //! //! However, the exact set of "used" items (collected as described above), and therefore the exact //! set of used constants, can depend on optimizations. Optimizing away dead code may optimize away //! a function call that uses a failing constant, so an unoptimized build may fail where an //! optimized build succeeds. This is undesirable. //! //! To fix this, the collector has the concept of "mentioned" items. Some time during the MIR //! pipeline, before any optimization-level-dependent optimizations, we compute a list of all items //! that syntactically appear in the code. These are considered "mentioned", and even if they are in //! dead code and get optimized away (which makes them no longer "used"), they are still //! "mentioned". For every used item, the collector ensures that all mentioned items, recursively, //! do not use a failing constant. This is reflected via the [`CollectionMode`], which determines //! whether we are visiting a used item or merely a mentioned item. enum CollectionMode { /// Collect items that are used, i.e., actually needed for codegen. /// /// Which items are used can depend on optimization levels, as MIR optimizations can remove /// uses. UsedItems, /// Collect items that are mentioned. The goal of this mode is that it is independent of /// optimizations: the set of "mentioned" items is computed before optimizations are run. /// /// The exact contents of this set are *not* a stable guarantee. (For instance, it is currently /// computed after drop-elaboration. If we ever do some optimizations even in debug builds, we /// might decide to run them before computing mentioned items.) The key property of this set is /// that it is optimization-independent. MentionedItems, } ``` Fixes rust-lang#107503
2 parents ecdea9e + a7000b6 commit 300bd13

31 files changed

+888
-189
lines changed

compiler/rustc_data_structures/src/sync.rs

+6-3
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
2020
//! | ----------------------- | ------------------- | ------------------------------- |
2121
//! | `Lrc<T>` | `rc::Rc<T>` | `sync::Arc<T>` |
2222
//! |` Weak<T>` | `rc::Weak<T>` | `sync::Weak<T>` |
23+
//! | `LRef<'a, T>` [^2] | `&'a mut T` | `&'a T` |
2324
//! | | | |
2425
//! | `AtomicBool` | `Cell<bool>` | `atomic::AtomicBool` |
2526
//! | `AtomicU32` | `Cell<u32>` | `atomic::AtomicU32` |
@@ -38,7 +39,7 @@
3839
//! of a `RefCell`. This is appropriate when interior mutability is not
3940
//! required.
4041
//!
41-
//! [^2] `MTLockRef` is a typedef.
42+
//! [^2] `MTRef`, `MTLockRef` are type aliases.
4243
4344
pub use crate::marker::*;
4445
use std::collections::HashMap;
@@ -208,7 +209,7 @@ cfg_match! {
208209

209210
use std::cell::RefCell as InnerRwLock;
210211

211-
pub type MTLockRef<'a, T> = &'a mut MTLock<T>;
212+
pub type LRef<'a, T> = &'a mut T;
212213

213214
#[derive(Debug, Default)]
214215
pub struct MTLock<T>(T);
@@ -274,7 +275,7 @@ cfg_match! {
274275
pub use std::sync::Arc as Lrc;
275276
pub use std::sync::Weak as Weak;
276277

277-
pub type MTLockRef<'a, T> = &'a MTLock<T>;
278+
pub type LRef<'a, T> = &'a T;
278279

279280
#[derive(Debug, Default)]
280281
pub struct MTLock<T>(Lock<T>);
@@ -314,6 +315,8 @@ cfg_match! {
314315
}
315316
}
316317

318+
pub type MTLockRef<'a, T> = LRef<'a, MTLock<T>>;
319+
317320
#[derive(Default)]
318321
#[cfg_attr(parallel_compiler, repr(align(64)))]
319322
pub struct CacheAligned<T>(pub T);

compiler/rustc_middle/src/mir/mod.rs

+31
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@ use rustc_hir::def_id::{DefId, CRATE_DEF_ID};
2020
use rustc_hir::{self, CoroutineDesugaring, CoroutineKind, ImplicitSelfKind};
2121
use rustc_hir::{self as hir, HirId};
2222
use rustc_session::Session;
23+
use rustc_span::source_map::Spanned;
2324
use rustc_target::abi::{FieldIdx, VariantIdx};
2425

2526
use polonius_engine::Atom;
@@ -312,6 +313,21 @@ impl<'tcx> CoroutineInfo<'tcx> {
312313
}
313314
}
314315

316+
/// Some item that needs to monomorphize successfully for a MIR body to be considered well-formed.
317+
#[derive(Copy, Clone, PartialEq, Eq, Debug, Hash, HashStable, TyEncodable, TyDecodable)]
318+
#[derive(TypeFoldable, TypeVisitable)]
319+
pub enum MentionedItem<'tcx> {
320+
Fn(DefId, GenericArgsRef<'tcx>),
321+
Drop(Ty<'tcx>),
322+
/// Unsizing casts might require vtables, so we have to record them.
323+
UnsizeCast {
324+
source_ty: Ty<'tcx>,
325+
target_ty: Ty<'tcx>,
326+
},
327+
/// A closure that is coerced to a function pointer.
328+
Closure(DefId, GenericArgsRef<'tcx>),
329+
}
330+
315331
/// The lowered representation of a single function.
316332
#[derive(Clone, TyEncodable, TyDecodable, Debug, HashStable, TypeFoldable, TypeVisitable)]
317333
pub struct Body<'tcx> {
@@ -375,8 +391,21 @@ pub struct Body<'tcx> {
375391

376392
/// Constants that are required to evaluate successfully for this MIR to be well-formed.
377393
/// We hold in this field all the constants we are not able to evaluate yet.
394+
///
395+
/// This is soundness-critical, we make a guarantee that all consts syntactically mentioned in a
396+
/// function have successfully evaluated if the function ever gets executed at runtime.
378397
pub required_consts: Vec<ConstOperand<'tcx>>,
379398

399+
/// Further items that were mentioned in this function and hence *may* become monomorphized,
400+
/// depending on optimizations. We use this to avoid optimization-dependent compile errors: the
401+
/// collector recursively traverses all "mentioned" items and evaluates all their
402+
/// `requiered_consts`.
403+
///
404+
/// This is *not* soundness-critical and the contents of this list are *not* a stable guarantee.
405+
/// See the documentation of `CollectionMode` in `compiler/rustc_monomorphize/src/collector.rs`
406+
/// for more context.
407+
pub mentioned_items: Vec<Spanned<MentionedItem<'tcx>>>,
408+
380409
/// Does this body use generic parameters. This is used for the `ConstEvaluatable` check.
381410
///
382411
/// Note that this does not actually mean that this body is not computable right now.
@@ -453,6 +482,7 @@ impl<'tcx> Body<'tcx> {
453482
var_debug_info,
454483
span,
455484
required_consts: Vec::new(),
485+
mentioned_items: Vec::new(),
456486
is_polymorphic: false,
457487
injection_phase: None,
458488
tainted_by_errors,
@@ -482,6 +512,7 @@ impl<'tcx> Body<'tcx> {
482512
spread_arg: None,
483513
span: DUMMY_SP,
484514
required_consts: Vec::new(),
515+
mentioned_items: Vec::new(),
485516
var_debug_info: Vec::new(),
486517
is_polymorphic: false,
487518
injection_phase: None,

compiler/rustc_mir_build/src/build/custom/mod.rs

+1
Original file line numberDiff line numberDiff line change
@@ -56,6 +56,7 @@ pub(super) fn build_custom_mir<'tcx>(
5656
var_debug_info: Vec::new(),
5757
span,
5858
required_consts: Vec::new(),
59+
mentioned_items: Vec::new(),
5960
is_polymorphic: false,
6061
tainted_by_errors: None,
6162
injection_phase: None,

compiler/rustc_mir_transform/src/inline.rs

+25-1
Original file line numberDiff line numberDiff line change
@@ -565,7 +565,8 @@ impl<'tcx> Inliner<'tcx> {
565565
mut callee_body: Body<'tcx>,
566566
) {
567567
let terminator = caller_body[callsite.block].terminator.take().unwrap();
568-
let TerminatorKind::Call { args, destination, unwind, target, .. } = terminator.kind else {
568+
let TerminatorKind::Call { func, args, destination, unwind, target, .. } = terminator.kind
569+
else {
569570
bug!("unexpected terminator kind {:?}", terminator.kind);
570571
};
571572

@@ -717,6 +718,29 @@ impl<'tcx> Inliner<'tcx> {
717718
Const::Val(..) | Const::Unevaluated(..) => true,
718719
},
719720
));
721+
// Now that we incorporated the callee's `required_consts`, we can remove the callee from
722+
// `mentioned_items` -- but we have to take their `mentioned_items` in return.
723+
// This does some extra work here to save the monomorphization collector work later.
724+
// FIXME: benchmark which option is better.
725+
let callee_item = {
726+
// We need to reconstruct the `required_item` for the callee so that we can find and
727+
// remove it.
728+
let func_ty = func.ty(caller_body, self.tcx);
729+
match func_ty.kind() {
730+
ty::FnDef(def_id, args) => MentionedItem::Fn(*def_id, args),
731+
_ => bug!(),
732+
}
733+
};
734+
if let Some(idx) =
735+
caller_body.mentioned_items.iter().position(|item| item.node == callee_item)
736+
{
737+
// We found the callee, so remove it and add its items instead.
738+
caller_body.mentioned_items.remove(idx);
739+
caller_body.mentioned_items.extend(callee_body.mentioned_items);
740+
} else {
741+
// If we can't find the callee, there's no point in adding its items.
742+
// Probably it already got removed by being inlined elsewhere in the same function.
743+
}
720744
}
721745

722746
fn make_call_args(

compiler/rustc_mir_transform/src/lib.rs

+5
Original file line numberDiff line numberDiff line change
@@ -89,6 +89,7 @@ mod lint;
8989
mod lower_intrinsics;
9090
mod lower_slice_len;
9191
mod match_branches;
92+
mod mentioned_items;
9293
mod multiple_return_terminators;
9394
mod normalize_array_len;
9495
mod nrvo;
@@ -566,6 +567,10 @@ fn run_optimization_passes<'tcx>(tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
566567
tcx,
567568
body,
568569
&[
570+
// Before doing anything, remember which items are being mentioned so that the set of items
571+
// visited does not depend on the optimization level.
572+
&mentioned_items::MentionedItems,
573+
// Add some UB checks before any UB gets optimized away.
569574
&check_alignment::CheckAlignment,
570575
// Before inlining: trim down MIR with passes to reduce inlining work.
571576

Original file line numberDiff line numberDiff line change
@@ -0,0 +1,126 @@
1+
use rustc_hir::def_id::DefId;
2+
use rustc_middle::mir::visit::Visitor;
3+
use rustc_middle::mir::{self, ConstOperand, Location, MentionedItem, MirPass};
4+
use rustc_middle::ty::{self, adjustment::PointerCoercion, TyCtxt};
5+
use rustc_session::Session;
6+
use rustc_span::source_map::Spanned;
7+
8+
pub struct MentionedItems;
9+
10+
struct MentionedItemsVisitor<'a, 'tcx> {
11+
tcx: TyCtxt<'tcx>,
12+
body: &'a mir::Body<'tcx>,
13+
mentioned_items: &'a mut Vec<Spanned<MentionedItem<'tcx>>>,
14+
}
15+
16+
impl<'tcx> MirPass<'tcx> for MentionedItems {
17+
fn is_enabled(&self, _sess: &Session) -> bool {
18+
// If this pass is skipped the collector assume that nothing got mentioned! We could
19+
// potentially skip it in opt-level 0 if we are sure that opt-level will never *remove* uses
20+
// of anything, but that still seems fragile. Furthermore, even debug builds use level 1, so
21+
// special-casing level 0 is just not worth it.
22+
true
23+
}
24+
25+
fn run_pass(&self, tcx: TyCtxt<'tcx>, body: &mut mir::Body<'tcx>) {
26+
debug_assert!(body.mentioned_items.is_empty());
27+
let mut mentioned_items = Vec::new();
28+
MentionedItemsVisitor { tcx, body, mentioned_items: &mut mentioned_items }.visit_body(body);
29+
body.mentioned_items = mentioned_items;
30+
}
31+
}
32+
33+
impl<'tcx> Visitor<'tcx> for MentionedItemsVisitor<'_, 'tcx> {
34+
fn visit_constant(&mut self, constant: &ConstOperand<'tcx>, _: Location) {
35+
let const_ = constant.const_;
36+
// This is how function items get referenced: via constants of `FnDef` type. This handles
37+
// both functions that are called and those that are just turned to function pointers.
38+
if let ty::FnDef(def_id, args) = *const_.ty().kind()
39+
&& may_codegen_locally(self.tcx, def_id)
40+
{
41+
debug!("adding to required_items: {def_id:?}");
42+
self.mentioned_items
43+
.push(Spanned { node: MentionedItem::Fn(def_id, args), span: constant.span });
44+
}
45+
}
46+
47+
fn visit_terminator(&mut self, terminator: &mir::Terminator<'tcx>, location: Location) {
48+
self.super_terminator(terminator, location);
49+
match terminator.kind {
50+
// We don't need to handle `Call` as we already handled all function type operands in
51+
// `visit_constant`. But we do need to handle `Drop`.
52+
mir::TerminatorKind::Drop { place, .. } => {
53+
let ty = place.ty(self.body, self.tcx).ty;
54+
let span = self.body.source_info(location).span;
55+
self.mentioned_items.push(Spanned { node: MentionedItem::Drop(ty), span });
56+
}
57+
_ => {}
58+
}
59+
}
60+
61+
fn visit_rvalue(&mut self, rvalue: &mir::Rvalue<'tcx>, location: Location) {
62+
self.super_rvalue(rvalue, location);
63+
match *rvalue {
64+
// We need to detect unsizing casts that required vtables.
65+
mir::Rvalue::Cast(
66+
mir::CastKind::PointerCoercion(PointerCoercion::Unsize),
67+
ref operand,
68+
target_ty,
69+
)
70+
| mir::Rvalue::Cast(mir::CastKind::DynStar, ref operand, target_ty) => {
71+
let span = self.body.source_info(location).span;
72+
self.mentioned_items.push(Spanned {
73+
node: MentionedItem::UnsizeCast {
74+
source_ty: operand.ty(self.body, self.tcx),
75+
target_ty,
76+
},
77+
span,
78+
});
79+
}
80+
// Similarly, record closures that are turned into function pointers.
81+
mir::Rvalue::Cast(
82+
mir::CastKind::PointerCoercion(PointerCoercion::ClosureFnPointer(_)),
83+
ref operand,
84+
_,
85+
) => {
86+
let span = self.body.source_info(location).span;
87+
let source_ty = operand.ty(self.body, self.tcx);
88+
match *source_ty.kind() {
89+
ty::Closure(def_id, args) => {
90+
self.mentioned_items
91+
.push(Spanned { node: MentionedItem::Closure(def_id, args), span });
92+
}
93+
_ => bug!(),
94+
}
95+
}
96+
// Function pointer casts are already handled by `visit_constant` above.
97+
_ => {}
98+
}
99+
}
100+
}
101+
102+
/// Returns `true` if we should codegen an item in the local crate, or returns `false` if we
103+
/// can just link to the upstream crate and therefore don't need a mono item.
104+
///
105+
/// This is an approximation of the collector's `should_codegen_locally`, in the sense that this
106+
/// here may return `true` even if `should_codegen_locally` says `false`. The point is to let us
107+
/// filter out items that definitely will not be considered by the collector.
108+
fn may_codegen_locally<'tcx>(tcx: TyCtxt<'tcx>, def_id: DefId) -> bool {
109+
if tcx.is_foreign_item(def_id) {
110+
// Foreign items are always linked against, there's no way of instantiating them.
111+
return false;
112+
}
113+
114+
if def_id.is_local() {
115+
// Local items cannot be referred to locally without monomorphizing them locally.
116+
return true;
117+
}
118+
119+
if tcx.is_reachable_non_generic(def_id) {
120+
// We can link to the item in question, no instance needed in this crate.
121+
return false;
122+
}
123+
124+
// Conservative fall-back.
125+
true
126+
}

compiler/rustc_mir_transform/src/shim.rs

+3-1
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ use std::iter;
1717

1818
use crate::{
1919
abort_unwinding_calls, add_call_guards, add_moves_for_packed_drops, deref_separator,
20-
pass_manager as pm, remove_noop_landing_pads, simplify,
20+
mentioned_items, pass_manager as pm, remove_noop_landing_pads, simplify,
2121
};
2222
use rustc_middle::mir::patch::MirPatch;
2323
use rustc_mir_dataflow::elaborate_drops::{self, DropElaborator, DropFlagMode, DropStyle};
@@ -147,6 +147,7 @@ fn make_shim<'tcx>(tcx: TyCtxt<'tcx>, instance: ty::InstanceDef<'tcx>) -> Body<'
147147
tcx,
148148
&mut body,
149149
&[
150+
&mentioned_items::MentionedItems,
150151
&abort_unwinding_calls::AbortUnwindingCalls,
151152
&add_call_guards::CriticalCallEdges,
152153
],
@@ -178,6 +179,7 @@ fn make_shim<'tcx>(tcx: TyCtxt<'tcx>, instance: ty::InstanceDef<'tcx>) -> Body<'
178179
tcx,
179180
&mut result,
180181
&[
182+
&mentioned_items::MentionedItems,
181183
&add_moves_for_packed_drops::AddMovesForPackedDrops,
182184
&deref_separator::Derefer,
183185
&remove_noop_landing_pads::RemoveNoopLandingPads,

0 commit comments

Comments
 (0)