Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

mir-opt: Merge all branch BBs into a single copy statement #129931

Open
wants to merge 4 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
95 changes: 59 additions & 36 deletions compiler/rustc_mir_transform/src/dead_store_elimination.rs
Original file line number Diff line number Diff line change
Expand Up @@ -12,18 +12,71 @@
//! will still not cause any further changes.
//!

use rustc_index::bit_set::BitSet;
use rustc_middle::bug;
use rustc_middle::mir::visit::Visitor;
use rustc_middle::mir::*;
use rustc_middle::ty::TyCtxt;
use rustc_mir_dataflow::Analysis;
use rustc_mir_dataflow::debuginfo::debuginfo_locals;
use rustc_mir_dataflow::impls::{
LivenessTransferFunction, MaybeTransitiveLiveLocals, borrowed_locals,
};
use rustc_mir_dataflow::{Analysis, ResultsCursor};

use crate::util::is_within_packed;

/// Liveness-backed helper that answers whether a given statement is a dead store.
///
/// The liveness results are computed once in `new` and then queried per statement through
/// `is_dead_store`.
pub(crate) struct DeadStoreAnalysis<'tcx, 'mir, 'a> {
/// Cursor over the fixpoint results of `MaybeTransitiveLiveLocals` for the analysed body.
live: ResultsCursor<'mir, 'tcx, MaybeTransitiveLiveLocals<'a>>,
/// Locals whose stores are never reported as dead, regardless of the liveness results.
always_live: &'a BitSet<Local>,
}

impl<'tcx, 'mir, 'a> DeadStoreAnalysis<'tcx, 'mir, 'a> {
    /// Runs `MaybeTransitiveLiveLocals` over `body` until it reaches a fixpoint and keeps a
    /// cursor over the results for later queries.
    ///
    /// Stores to any local in `always_live` are never considered dead.
    pub(crate) fn new(
        tcx: TyCtxt<'tcx>,
        body: &'mir Body<'tcx>,
        always_live: &'a BitSet<Local>,
    ) -> Self {
        let results =
            MaybeTransitiveLiveLocals::new(always_live).into_engine(tcx, body).iterate_to_fixpoint();
        Self { live: results.into_results_cursor(body), always_live }
    }

    /// Returns `true` if the statement `stmt_kind` located at `loc` writes to a place that is
    /// not live at that point, i.e. the statement can be removed.
    ///
    /// Only `Assign`, `SetDiscriminant` and `Deinit` can be dead stores; every other statement
    /// kind yields `false`. `FakeRead` and `AscribeUserType` are not expected here and trigger
    /// a `bug!`.
    pub(crate) fn is_dead_store(&mut self, loc: Location, stmt_kind: &StatementKind<'tcx>) -> bool {
        // First narrow the statement down to the place it writes to, bailing out for
        // everything that cannot be a removable store.
        let place = match stmt_kind {
            StatementKind::Assign(box (place, rvalue)) => {
                // An assignment whose right-hand side must be kept is never a dead store.
                if !rvalue.is_safe_to_remove() {
                    return false;
                }
                place
            }
            StatementKind::SetDiscriminant { place: box place, .. }
            | StatementKind::Deinit(box place) => place,

            StatementKind::Retag(_, _)
            | StatementKind::StorageLive(_)
            | StatementKind::StorageDead(_)
            | StatementKind::Coverage(_)
            | StatementKind::Intrinsic(_)
            | StatementKind::ConstEvalCounter
            | StatementKind::PlaceMention(_)
            | StatementKind::Nop => return false,

            StatementKind::FakeRead(_) | StatementKind::AscribeUserType(_, _) => {
                bug!("{:?} not found in this MIR phase!", stmt_kind)
            }
        };

        // Writes through a pointer and writes to always-live locals are kept unconditionally.
        if place.is_indirect() || self.always_live.contains(place.local) {
            return false;
        }

        // The store is dead when the written local is not live right before the statement.
        self.live.seek_before_primary_effect(loc);
        !self.live.get().contains(place.local)
    }
}

/// Performs the optimization on the body
///
/// The `borrowed` set must be a `BitSet` of all the locals that are ever borrowed in this body. It
Expand All @@ -36,10 +89,7 @@ fn eliminate<'tcx>(tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
let mut always_live = debuginfo_locals(body);
always_live.union(&borrowed_locals);

let mut live = MaybeTransitiveLiveLocals::new(&always_live)
.into_engine(tcx, body)
.iterate_to_fixpoint()
.into_results_cursor(body);
let mut analysis = DeadStoreAnalysis::new(tcx, body, &always_live);

// For blocks with a call terminator, if an argument copy can be turned into a move,
// record it as (block, argument index).
Expand All @@ -51,8 +101,8 @@ fn eliminate<'tcx>(tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
let loc = Location { block: bb, statement_index: bb_data.statements.len() };

// Position ourselves between the evaluation of `args` and the write to `destination`.
live.seek_to_block_end(bb);
let mut state = live.get().clone();
analysis.live.seek_to_block_end(bb);
let mut state = analysis.live.get().clone();

for (index, arg) in args.iter().map(|a| &a.node).enumerate().rev() {
if let Operand::Copy(place) = *arg
Expand All @@ -74,37 +124,10 @@ fn eliminate<'tcx>(tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
LivenessTransferFunction(&mut state).visit_operand(arg, loc);
}
}

for (statement_index, statement) in bb_data.statements.iter().enumerate().rev() {
let loc = Location { block: bb, statement_index };
if let StatementKind::Assign(assign) = &statement.kind {
if !assign.1.is_safe_to_remove() {
continue;
}
}
match &statement.kind {
StatementKind::Assign(box (place, _))
| StatementKind::SetDiscriminant { place: box place, .. }
| StatementKind::Deinit(box place) => {
if !place.is_indirect() && !always_live.contains(place.local) {
live.seek_before_primary_effect(loc);
if !live.get().contains(place.local) {
patch.push(loc);
}
}
}
StatementKind::Retag(_, _)
| StatementKind::StorageLive(_)
| StatementKind::StorageDead(_)
| StatementKind::Coverage(_)
| StatementKind::Intrinsic(_)
| StatementKind::ConstEvalCounter
| StatementKind::PlaceMention(_)
| StatementKind::Nop => (),

StatementKind::FakeRead(_) | StatementKind::AscribeUserType(_, _) => {
bug!("{:?} not found in this MIR phase!", statement.kind)
}
if analysis.is_dead_store(loc, &statement.kind) {
patch.push(loc);
}
}
}
Expand Down
2 changes: 2 additions & 0 deletions compiler/rustc_mir_transform/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,7 @@ mod lower_intrinsics;
mod lower_slice_len;
mod match_branches;
mod mentioned_items;
mod merge_branches;
mod multiple_return_terminators;
mod nrvo;
mod post_drop_elaboration;
Expand Down Expand Up @@ -611,6 +612,7 @@ fn run_optimization_passes<'tcx>(tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
&dead_store_elimination::DeadStoreElimination::Initial,
&gvn::GVN,
&simplify::SimplifyLocals::AfterGVN,
&merge_branches::MergeBranchSimplification,
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why here in the pipeline?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This needs to run after GVN. I expect SimplifyLocals::AfterGVN can simplify the analysis in MergeBranchSimplification. Additionally, after MergeBranchSimplification simplifies the CFG, it will benefit subsequent passes that are related to the CFG.

&dataflow_const_prop::DataflowConstProp,
&single_use_consts::SingleUseConsts,
&o1(simplify_branches::SimplifyConstCondition::AfterConstProp),
Expand Down
240 changes: 240 additions & 0 deletions compiler/rustc_mir_transform/src/merge_branches.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,240 @@
//! This pass attempts to merge all branches of a switch into a single copy statement,
//! eliminating the switch terminator.
//! Ideally, we could combine it with `MatchBranchSimplification`, as these two passes
//! match and merge statements with different patterns. Given the compile time and
//! code complexity, we have not merged them into a more general pass for now.
use rustc_const_eval::const_eval::mk_eval_cx_for_const_val;
use rustc_index::bit_set::BitSet;
use rustc_middle::mir::patch::MirPatch;
use rustc_middle::mir::*;
use rustc_middle::ty;
use rustc_middle::ty::util::Discr;
use rustc_middle::ty::{ParamEnv, TyCtxt};
use rustc_mir_dataflow::impls::borrowed_locals;

use crate::dead_store_elimination::DeadStoreAnalysis;

/// MIR pass that replaces a `switchInt` over an enum discriminant with a single copy of the
/// matched place when every branch merely re-creates that value.
pub(super) struct MergeBranchSimplification;

impl<'tcx> crate::MirPass<'tcx> for MergeBranchSimplification {
    /// The pass is enabled at `mir-opt-level` 2 and above.
    fn is_enabled(&self, sess: &rustc_session::Session) -> bool {
        sess.mir_opt_level() >= 2
    }

    /// Searches for a block of the form
    /// ```ignore (syntax-highlighting-only)
    /// _2 = discriminant(*_1);
    /// switchInt(move _2) -> [0: bb3, 1: bb2, otherwise: bb1];
    /// ```
    /// whose value targets all end in the same terminator and only re-create `*_1`, and
    /// rewrites it into `dest = copy *_1` followed by that shared terminator.
    ///
    /// At most one switch is rewritten per invocation, because the liveness results used by
    /// the dead-store analysis are computed once up front and are not refreshed after the MIR
    /// has been patched.
    fn run_pass(&self, tcx: TyCtxt<'tcx>, body: &mut Body<'tcx>) {
        let def_id = body.source.def_id();
        let param_env = tcx.param_env_reveal_all_normalized(def_id);

        let borrowed_locals = borrowed_locals(body);
        let mut dead_store_analysis = DeadStoreAnalysis::new(tcx, body, &borrowed_locals);

        for switch_bb_idx in body.basic_blocks.indices() {
            let bbs = &*body.basic_blocks;
            let Some((switch_discr, targets)) = bbs[switch_bb_idx].terminator().kind.as_switch()
            else {
                continue;
            };
            // Check that destinations are identical, and if not, then don't optimize this block.
            let mut targets_iter = targets.iter();
            // A switch may carry no explicit value targets (only `otherwise`); there is
            // nothing to merge in that case, so skip it instead of panicking.
            let Some((_, first_target)) = targets_iter.next() else {
                continue;
            };
            let first_terminator_kind = &bbs[first_target].terminator().kind;
            if targets_iter.any(|(_, other_target)| {
                first_terminator_kind != &bbs[other_target].terminator().kind
            }) {
                continue;
            }
            // We require that the possible target blocks all be distinct.
            if !targets.is_distinct() {
                continue;
            }
            // The `otherwise` branch must be unreachable: only the value targets are merged.
            if !bbs[targets.otherwise()].is_empty_unreachable() {
                continue;
            }
            // Check if the copy source matches the following pattern.
            // _2 = discriminant(*_1); // "*_1" is the expected copy source.
            // switchInt(move _2) -> [0: bb3, 1: bb2, otherwise: bb1];
            let Some(&Statement {
                kind: StatementKind::Assign(box (discr_place, Rvalue::Discriminant(src_place))),
                ..
            }) = bbs[switch_bb_idx].statements.last()
            else {
                continue;
            };
            // The switch must test exactly the discriminant that was just read.
            if switch_discr.place() != Some(discr_place) {
                continue;
            }
            let src_ty = src_place.ty(body.local_decls(), tcx);
            if let Some(dest_place) = can_simplify_to_copy(
                tcx,
                param_env,
                body,
                targets,
                src_place,
                src_ty,
                &mut dead_store_analysis,
            ) {
                // Append `dest = copy src` to the switch block and let it end with the
                // terminator shared by all targets; the old targets become unreachable.
                let statement_index = bbs[switch_bb_idx].statements.len();
                let parent_end = Location { block: switch_bb_idx, statement_index };
                let mut patch = MirPatch::new(body);
                patch.add_assign(parent_end, dest_place, Rvalue::Use(Operand::Copy(src_place)));
                patch.patch_terminator(switch_bb_idx, first_terminator_kind.clone());
                patch.apply(body);
                super::simplify::remove_dead_blocks(body);
                // After modifying the MIR, the result of `MaybeTransitiveLiveLocals` may become
                // invalid; to keep things simple, only one switch is processed per run.
                break;
            }
        }
    }
}

/// The GVN simplified
/// ```ignore (syntax-highlighting-only)
/// match a {
/// Foo::A(x) => Foo::A(*x),
/// Foo::B => Foo::B
/// }
/// ```
/// to
/// ```ignore (syntax-highlighting-only)
/// match a {
/// Foo::A(_x) => a, // copy a
/// Foo::B => Foo::B
/// }
/// ```
/// This function answers whether it can be simplified to a copy statement
/// by returning the copy destination.
fn can_simplify_to_copy<'tcx>(
tcx: TyCtxt<'tcx>,
param_env: ParamEnv<'tcx>,
body: &Body<'tcx>,
targets: &SwitchTargets,
src_place: Place<'tcx>,
src_ty: tcx::PlaceTy<'tcx>,
dead_store_analysis: &mut DeadStoreAnalysis<'tcx, '_, '_>,
) -> Option<Place<'tcx>> {
let mut targets_iter = targets.iter();
let (first_index, first_target) = targets_iter.next()?;
let dest_place = find_copy_assign(
tcx,
param_env,
body,
first_index,
first_target,
src_place,
src_ty,
dead_store_analysis,
)?;
let dest_ty = dest_place.ty(body.local_decls(), tcx);
if dest_ty.ty != src_ty.ty {
return None;
}
for (other_index, other_target) in targets_iter {
if dest_place
!= find_copy_assign(
tcx,
param_env,
body,
other_index,
other_target,
src_place,
src_ty,
dead_store_analysis,
)?
{
return None;
}
}
Some(dest_place)
}

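/// Finds the single assignment in `target_block` that can be replaced by a copy of `src_place`
/// and returns its destination place.
///
/// That assignment must either copy `src_place` itself or build a field-less enum variant
/// (as a constant or an aggregate) whose discriminant equals the switch value `index`.
/// Every other statement in the block must be a dead store or part of a paired
/// `StorageLive`/`StorageDead`, so that it can be dropped; otherwise `None` is returned.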
fn find_copy_assign<'tcx>(
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Could you doc-comment this? I'm still not sure what pattern you are looking for.

tcx: TyCtxt<'tcx>,
param_env: ParamEnv<'tcx>,
body: &Body<'tcx>,
index: u128,
target_block: BasicBlock,
src_place: Place<'tcx>,
src_ty: tcx::PlaceTy<'tcx>,
dead_store_analysis: &mut DeadStoreAnalysis<'tcx, '_, '_>,
) -> Option<Place<'tcx>> {
let statements = &body.basic_blocks[target_block].statements;
if statements.is_empty() {
return None;
}
let assign_stmt = if statements.len() == 1 {
0
} else {
let mut lived_stmts: BitSet<usize> = BitSet::new_filled(statements.len());
let mut expected_assign_stmt = None;
for (statement_index, statement) in statements.iter().enumerate().rev() {
let loc = Location { block: target_block, statement_index };
if dead_store_analysis.is_dead_store(loc, &statement.kind) {
lived_stmts.remove(statement_index);
} else if matches!(
statement.kind,
StatementKind::StorageLive(_) | StatementKind::StorageDead(_)
) {
} else if matches!(statement.kind, StatementKind::Assign(_))
&& expected_assign_stmt.is_none()
{
// There is only one assign statement that cannot be ignored
// that can be used as an expected copy statement.
expected_assign_stmt = Some(statement_index);
lived_stmts.remove(statement_index);
} else {
return None;
}
}
let expected_assign = expected_assign_stmt?;
if !lived_stmts.is_empty() {
// We can ignore the paired StorageLive and StorageDead.
let mut storage_live_locals: BitSet<Local> = BitSet::new_empty(body.local_decls.len());
for stmt_index in lived_stmts.iter() {
let statement = &statements[stmt_index];
match &statement.kind {
StatementKind::StorageLive(local) if storage_live_locals.insert(*local) => {}
StatementKind::StorageDead(local) if storage_live_locals.remove(*local) => {}
_ => return None,
}
}
if !storage_live_locals.is_empty() {
return None;
}
}
expected_assign
};
let &(dest_place, ref rvalue) = statements[assign_stmt].kind.as_assign()?;
let dest_ty = dest_place.ty(body.local_decls(), tcx);
if dest_ty.ty != src_ty.ty {
return None;
}
let ty::Adt(def, _) = dest_ty.ty.kind() else {
return None;
};
match rvalue {
// Check if `_3 = const Foo::B` can be transformed to `_3 = copy *_1`.
Rvalue::Use(Operand::Constant(box constant))
if let Const::Val(const_, ty) = constant.const_ =>
{
let (ecx, op) = mk_eval_cx_for_const_val(tcx.at(constant.span), param_env, const_, ty)?;
let variant = ecx.read_discriminant(&op).discard_err()?;
if !def.variants()[variant].fields.is_empty() {
return None;
}
let Discr { val, .. } = ty.discriminant_for_variant(tcx, variant)?;
if val != index {
return None;
}
}
Rvalue::Use(Operand::Copy(place)) if *place == src_place => {}
// Check if `_3 = Foo::B` can be transformed to `_3 = copy *_1`.
Rvalue::Aggregate(box AggregateKind::Adt(_, variant_index, _, _, None), fields)
if fields.is_empty()
&& let Some(Discr { val, .. }) =
src_ty.ty.discriminant_for_variant(tcx, *variant_index)
&& val == index => {}
_ => return None,
}
Some(dest_place)
}
Loading
Loading