diff --git a/llvm/lib/CodeGen/PeepholeOptimizer.cpp b/llvm/lib/CodeGen/PeepholeOptimizer.cpp --- a/llvm/lib/CodeGen/PeepholeOptimizer.cpp +++ b/llvm/lib/CodeGen/PeepholeOptimizer.cpp @@ -1853,6 +1853,11 @@ SrcIdx = OpIdx; } + // In some rare case, Def has no input, SrcIdx is out of bound, + // getOperand(SrcIdx) will fail below. + if (SrcIdx >= Def->getNumOperands()) + return ValueTrackerResult(); + // Stop when any user of the bitcast is a SUBREG_TO_REG, replacing with a COPY // will break the assumed guarantees for the upper bits. for (const MachineInstr &UseMI : MRI.use_nodbg_instructions(DefOp.getReg())) { diff --git a/llvm/lib/Target/PowerPC/PPCInstrVSX.td b/llvm/lib/Target/PowerPC/PPCInstrVSX.td --- a/llvm/lib/Target/PowerPC/PPCInstrVSX.td +++ b/llvm/lib/Target/PowerPC/PPCInstrVSX.td @@ -1314,7 +1314,7 @@ isReMaterializable = 1 in { def XXLEQVOnes : XX3Form_SameOp<60, 186, (outs vsrc:$XT), (ins), "xxleqv $XT, $XT, $XT", IIC_VecGeneral, - [(set v4i32:$XT, (v4i32 immAllOnesV))]>; + [(set v4i32:$XT, (bitconvert (v16i8 immAllOnesV)))]>; } def XXLORC : XX3Form<60, 170, @@ -4103,8 +4103,6 @@ } let Predicates = [HasP8Vector] in { - def : Pat<(v4i32 (bitconvert (v16i8 immAllOnesV))), - (XXLEQVOnes)>; def : Pat<(v1i128 (bitconvert (v16i8 immAllOnesV))), (v1i128 (COPY_TO_REGCLASS(XXLEQVOnes), VSRC))>; def : Pat<(v2i64 (bitconvert (v16i8 immAllOnesV))), diff --git a/llvm/test/CodeGen/PowerPC/bitcast-peelhole.ll b/llvm/test/CodeGen/PowerPC/bitcast-peelhole.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/bitcast-peelhole.ll @@ -0,0 +1,13 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; REQUIRES: asserts +; RUN: llc -mcpu=pwr9 -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr \ +; RUN: -mtriple=powerpc64le-unknown-unknown < %s | FileCheck %s + +define < 4 x i32> @bitCast() { +; CHECK-LABEL: bitCast: +; CHECK: # %bb.0: # %entry +; CHECK-NEXT: xxleqv v2, v2, v2 +; CHECK-NEXT: blr +entry: + ret < 4 x i32> +}