Patch summary (free text ahead of the first "diff --git" header):

  * llvm/lib/Target/PowerPC/PPCMIPeephole.cpp, in PPCMIPeephole::simplifyCode():
    the direct call RoundInstr->eraseFromParent() is removed. RoundInstr is
    assigned to ToErase instead, and FRSPDefines is passed to addRegToUpdate()
    in addition to ConvReg1.
    NOTE(review): presumably ToErase is erased later by the surrounding loop
    and addRegToUpdate() queues the register for a kill-flag fix-up; neither
    is visible in this hunk -- confirm against the full file.

  * llvm/test/CodeGen/PowerPC/kill_flag_verification.ll (new file): runs llc on
    the function @xvcvdpsp_kill_flag for four PowerPC triples. The RUN lines do
    not pipe into FileCheck, so only llc's exit status is checked.
    NOTE(review): the three shufflevector instructions end at "<4 x i32>" with
    no mask constant, and each of the two llvm.fma.v4f32 calls has one
    "<4 x float>" operand with no value. These look like constants lost when
    the patch text was extracted -- restore them from the upstream commit
    before applying.

diff --git a/llvm/lib/Target/PowerPC/PPCMIPeephole.cpp b/llvm/lib/Target/PowerPC/PPCMIPeephole.cpp
index 76a73436d61b54..ac5672bc86a263 100644
--- a/llvm/lib/Target/PowerPC/PPCMIPeephole.cpp
+++ b/llvm/lib/Target/PowerPC/PPCMIPeephole.cpp
@@ -895,8 +895,9 @@ bool PPCMIPeephole::simplifyCode() {
               LLVM_DEBUG(MI.dump());
               LLVM_DEBUG(dbgs() << "Through instruction:\n");
               LLVM_DEBUG(DefMI->dump());
-              RoundInstr->eraseFromParent();
               addRegToUpdate(ConvReg1);
+              addRegToUpdate(FRSPDefines);
+              ToErase = RoundInstr;
             }
           };
 
diff --git a/llvm/test/CodeGen/PowerPC/kill_flag_verification.ll b/llvm/test/CodeGen/PowerPC/kill_flag_verification.ll
new file mode 100644
index 00000000000000..79cc407fc9be97
--- /dev/null
+++ b/llvm/test/CodeGen/PowerPC/kill_flag_verification.ll
@@ -0,0 +1,45 @@
+; RUN: llc < %s -mtriple powerpc64le-unknown-linux-gnu
+; RUN: llc < %s -mtriple powerpc64-unknown-linux-gnu
+; RUN: llc < %s -mtriple powerpc-ibm-aix
+; RUN: llc < %s -mtriple powerpc64-ibm-aix
+
+define void @xvcvdpsp_kill_flag() {
+entry:
+  %call49 = tail call double @sin()
+  %0 = insertelement <2 x double> poison, double %call49, i64 1
+  %1 = fmul <2 x double> %0, zeroinitializer
+  %2 = shufflevector <2 x double> %1, <2 x double> poison, <4 x i32>
+  %3 = insertelement <4 x double> %2, double 0.000000e+00, i64 2
+  %4 = insertelement <4 x double> %3, double poison, i64 3
+  %5 = fptrunc <4 x double> %4 to <4 x float>
+  %6 = shufflevector <4 x float> %5, <4 x float> poison, <4 x i32>
+  %7 = shufflevector <4 x float> %5, <4 x float> poison, <4 x i32>
+  %8 = tail call <4 x float> @llvm.fma.v4f32(<4 x float> %7, <4 x float> , <4 x float> zeroinitializer)
+  br label %if.end1
+
+if.end1: ; preds = %entry
+  br i1 poison, label %for.cond1.preheader, label %if.then2
+
+for.cond1.preheader: ; preds = %if.end1
+  br label %for.body2.preheader
+
+for.body2.preheader: ; preds = %for.cond1.preheader
+  br i1 poison, label %for.loopexit, label %for.body3
+
+for.body3: ; preds = %for.body2.preheader
+  %9 = tail call <4 x float> @llvm.ppc.fnmsub.v4f32(<4 x float> zeroinitializer, <4 x float> %6, <4 x float> zeroinitializer)
+  %10 = tail call <4 x float> @llvm.fma.v4f32(<4 x float> , <4 x float> %8, <4 x float> %9)
+  %11 = tail call <4 x float> @llvm.fma.v4f32(<4 x float> %10, <4 x float> zeroinitializer, <4 x float> zeroinitializer)
+  store <4 x float> %11, ptr poison, align 16
+  unreachable
+
+for.loopexit: ; preds = %for.body2.preheader
+  unreachable
+
+if.then2: ; preds = %if.end1
+  ret void
+}
+
+declare double @sin() local_unnamed_addr #0
+declare <4 x float> @llvm.fma.v4f32(<4 x float>, <4 x float>, <4 x float>)
+declare <4 x float> @llvm.ppc.fnmsub.v4f32(<4 x float>, <4 x float>, <4 x float>)