Skip to content

Commit f34cc65

Browse files
committed
Auto merge of #106612 - JakobDegen:cleanup-wf, r=tmiasko
Document wf constraints on control flow in cleanup blocks Was recently made aware of [this code](https://github.com/rust-lang/rust/blob/a377893da2cd7124e5a18c7116cbb70e16dd5541/compiler/rustc_codegen_ssa/src/mir/analyze.rs#L247-L368), which has this potential ICE: https://github.com/rust-lang/rust/blob/a377893da2cd7124e5a18c7116cbb70e16dd5541/compiler/rustc_codegen_ssa/src/mir/analyze.rs#L308-L314 Roughly speaking, the code there is attempting to partition the cleanup blocks into funclets that satisfy a "unique successor" property, and the ICE is set off if that's not possible. This PR documents the well-formedness constraints that MIR must satisfy to avoid setting off that ICE. The constraints documented are slightly stronger than the cases in which the ICE would have been set off in that code. This is necessary though, since whether or not that ICE gets set off can depend on iteration order in some graphs. This sort of constraint is kind of ugly, but I don't know a better alternative at the moment. It's worth knowing that two important optimizations are still correct: - Removing edges in the cfg: Fewer edges => fewer paths => stronger dominance relations => more contractions, and more contractions can't turn a forest into not-a-forest. - Contracting an edge u -> v when u only has one successor and v only has one predecessor: u already dominated v, so this contraction was going to happen anyway. There is definitely a MIR opt somewhere that can run afoul of this, but I don't know where it is. `@saethlin` was able to set it off though, so maybe he'll be able to shed some light on it. r? `@RalfJung` I suppose, and cc `@tmiasko` who might have insight/opinions on this
2 parents 159ba8a + 4bc963e commit f34cc65

File tree

3 files changed

+110
-9
lines changed

3 files changed

+110
-9
lines changed

compiler/rustc_const_eval/src/transform/validate.rs

+96-8
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,8 @@
11
//! Validates the MIR to ensure that invariants are upheld.
22
3-
use rustc_data_structures::fx::FxHashSet;
3+
use rustc_data_structures::fx::{FxHashMap, FxHashSet};
44
use rustc_index::bit_set::BitSet;
5+
use rustc_index::vec::IndexVec;
56
use rustc_infer::traits::Reveal;
67
use rustc_middle::mir::interpret::Scalar;
78
use rustc_middle::mir::visit::NonUseContext::VarDebugInfo;
@@ -18,7 +19,7 @@ use rustc_mir_dataflow::storage::always_storage_live_locals;
1819
use rustc_mir_dataflow::{Analysis, ResultsCursor};
1920
use rustc_target::abi::{Size, VariantIdx};
2021

21-
#[derive(Copy, Clone, Debug)]
22+
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
2223
enum EdgeKind {
2324
Unwind,
2425
Normal,
@@ -57,18 +58,20 @@ impl<'tcx> MirPass<'tcx> for Validator {
5758
.iterate_to_fixpoint()
5859
.into_results_cursor(body);
5960

60-
TypeChecker {
61+
let mut checker = TypeChecker {
6162
when: &self.when,
6263
body,
6364
tcx,
6465
param_env,
6566
mir_phase,
67+
unwind_edge_count: 0,
6668
reachable_blocks: traversal::reachable_as_bitset(body),
6769
storage_liveness,
6870
place_cache: Vec::new(),
6971
value_cache: Vec::new(),
70-
}
71-
.visit_body(body);
72+
};
73+
checker.visit_body(body);
74+
checker.check_cleanup_control_flow();
7275
}
7376
}
7477

@@ -78,6 +81,7 @@ struct TypeChecker<'a, 'tcx> {
7881
tcx: TyCtxt<'tcx>,
7982
param_env: ParamEnv<'tcx>,
8083
mir_phase: MirPhase,
84+
unwind_edge_count: usize,
8185
reachable_blocks: BitSet<BasicBlock>,
8286
storage_liveness: ResultsCursor<'a, 'tcx, MaybeStorageLive<'static>>,
8387
place_cache: Vec<PlaceRef<'tcx>>,
@@ -102,7 +106,7 @@ impl<'a, 'tcx> TypeChecker<'a, 'tcx> {
102106
);
103107
}
104108

105-
fn check_edge(&self, location: Location, bb: BasicBlock, edge_kind: EdgeKind) {
109+
fn check_edge(&mut self, location: Location, bb: BasicBlock, edge_kind: EdgeKind) {
106110
if bb == START_BLOCK {
107111
self.fail(location, "start block must not have predecessors")
108112
}
@@ -111,10 +115,12 @@ impl<'a, 'tcx> TypeChecker<'a, 'tcx> {
111115
match (src.is_cleanup, bb.is_cleanup, edge_kind) {
112116
// Non-cleanup blocks can jump to non-cleanup blocks along non-unwind edges
113117
(false, false, EdgeKind::Normal)
114-
// Non-cleanup blocks can jump to cleanup blocks along unwind edges
115-
| (false, true, EdgeKind::Unwind)
116118
// Cleanup blocks can jump to cleanup blocks along non-unwind edges
117119
| (true, true, EdgeKind::Normal) => {}
120+
// Non-cleanup blocks can jump to cleanup blocks along unwind edges
121+
(false, true, EdgeKind::Unwind) => {
122+
self.unwind_edge_count += 1;
123+
}
118124
// All other jumps are invalid
119125
_ => {
120126
self.fail(
@@ -134,6 +140,88 @@ impl<'a, 'tcx> TypeChecker<'a, 'tcx> {
134140
}
135141
}
136142

143+
fn check_cleanup_control_flow(&self) {
144+
if self.unwind_edge_count <= 1 {
145+
return;
146+
}
147+
let doms = self.body.basic_blocks.dominators();
148+
let mut post_contract_node = FxHashMap::default();
149+
// Reusing the allocation across invocations of the closure
150+
let mut dom_path = vec![];
151+
let mut get_post_contract_node = |mut bb| {
152+
let root = loop {
153+
if let Some(root) = post_contract_node.get(&bb) {
154+
break *root;
155+
}
156+
let parent = doms.immediate_dominator(bb);
157+
dom_path.push(bb);
158+
if !self.body.basic_blocks[parent].is_cleanup {
159+
break bb;
160+
}
161+
bb = parent;
162+
};
163+
for bb in dom_path.drain(..) {
164+
post_contract_node.insert(bb, root);
165+
}
166+
root
167+
};
168+
169+
let mut parent = IndexVec::from_elem(None, &self.body.basic_blocks);
170+
for (bb, bb_data) in self.body.basic_blocks.iter_enumerated() {
171+
if !bb_data.is_cleanup || !self.reachable_blocks.contains(bb) {
172+
continue;
173+
}
174+
let bb = get_post_contract_node(bb);
175+
for s in bb_data.terminator().successors() {
176+
let s = get_post_contract_node(s);
177+
if s == bb {
178+
continue;
179+
}
180+
let parent = &mut parent[bb];
181+
match parent {
182+
None => {
183+
*parent = Some(s);
184+
}
185+
Some(e) if *e == s => (),
186+
Some(e) => self.fail(
187+
Location { block: bb, statement_index: 0 },
188+
format!(
189+
"Cleanup control flow violation: The blocks dominated by {:?} have edges to both {:?} and {:?}",
190+
bb,
191+
s,
192+
*e
193+
)
194+
),
195+
}
196+
}
197+
}
198+
199+
// Check for cycles
200+
let mut stack = FxHashSet::default();
201+
for i in 0..parent.len() {
202+
let mut bb = BasicBlock::from_usize(i);
203+
stack.clear();
204+
stack.insert(bb);
205+
loop {
206+
let Some(parent)= parent[bb].take() else {
207+
break
208+
};
209+
let no_cycle = stack.insert(parent);
210+
if !no_cycle {
211+
self.fail(
212+
Location { block: bb, statement_index: 0 },
213+
format!(
214+
"Cleanup control flow violation: Cycle involving edge {:?} -> {:?}",
215+
bb, parent,
216+
),
217+
);
218+
break;
219+
}
220+
bb = parent;
221+
}
222+
}
223+
}
224+
137225
/// Check if src can be assigned into dest.
138226
/// This is not precise, it will accept some incorrect assignments.
139227
fn mir_assign_valid_types(&self, src: Ty<'tcx>, dest: Ty<'tcx>) -> bool {

compiler/rustc_data_structures/src/graph/dominators/mod.rs

+4-1
Original file line numberDiff line numberDiff line change
@@ -135,7 +135,10 @@ pub fn dominators<G: ControlFlowGraph>(graph: G) -> Dominators<G::Node> {
135135
// This loop computes the semi[w] for w.
136136
semi[w] = w;
137137
for v in graph.predecessors(pre_order_to_real[w]) {
138-
let v = real_to_pre_order[v].unwrap();
138+
// Reachable vertices may have unreachable predecessors, so ignore any of them
139+
let Some(v) = real_to_pre_order[v] else {
140+
continue
141+
};
139142

140143
// eval returns a vertex x from which semi[x] is minimum among
141144
// vertices semi[v] +> x *> v.

compiler/rustc_middle/src/mir/syntax.rs

+10
Original file line numberDiff line numberDiff line change
@@ -512,6 +512,16 @@ pub struct CopyNonOverlapping<'tcx> {
512512
/// must also be `cleanup`. This is a part of the type system and checked statically, so it is
513513
/// still an error to have such an edge in the CFG even if it's known that it won't be taken at
514514
/// runtime.
515+
/// 4. The control flow between cleanup blocks must look like an upside down tree. Roughly
516+
/// speaking, this means that control flow that looks like a V is allowed, while control flow
517+
/// that looks like a W is not. This is necessary to ensure that landing pad information can be
518+
/// correctly codegened on MSVC. More precisely:
519+
///
520+
/// Begin with the standard control flow graph `G`. Modify `G` as follows: for any two cleanup
521+
/// vertices `u` and `v` such that `u` dominates `v`, contract `u` and `v` into a single vertex,
522+
/// deleting self edges and duplicate edges in the process. Now remove all vertices from `G`
523+
/// that are not cleanup vertices or are not reachable. The resulting graph must be an inverted
524+
/// tree, that is each vertex may have at most one successor and there may be no cycles.
515525
#[derive(Clone, TyEncodable, TyDecodable, Hash, HashStable, PartialEq, TypeFoldable, TypeVisitable)]
516526
pub enum TerminatorKind<'tcx> {
517527
/// Block has one successor; we continue execution there.

0 commit comments

Comments
 (0)