Skip to content

Commit 9762b26

Browse files
committedJun 25, 2019
[DAGCombine] combineRepeatedFPDivisors - recognize -1.0 / X as a reciprocal
Fixes issue identified by @nemanjai (Nemanja Ivanovic) in D62963 / rL363040 - infinite loop due to GetNegatedExpression fighting combineRepeatedFPDivisors resulting in fneg(fdiv(x,splat)) -> fneg(fmul(x,1.0/splat)) -> fmul(x,-1.0/splat) -> fmul(x,(-1.0 * 1.0)/splat) ...... llvm-svn: 364326
1 parent 635eb80 commit 9762b26

File tree

2 files changed

+34
-2
lines changed

2 files changed

+34
-2
lines changed
 

‎llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12362,10 +12362,10 @@ SDValue DAGCombiner::combineRepeatedFPDivisors(SDNode *N) {
1236212362
if (!UnsafeMath && !Flags.hasAllowReciprocal())
1236312363
return SDValue();
1236412364

12365-
// Skip if current node is a reciprocal.
12365+
// Skip if current node is a reciprocal/fneg-reciprocal.
1236612366
SDValue N0 = N->getOperand(0);
1236712367
ConstantFPSDNode *N0CFP = isConstOrConstSplatFP(N0, /* AllowUndefs */ true);
12368-
if (N0CFP && N0CFP->isExactlyValue(1.0))
12368+
if (N0CFP && (N0CFP->isExactlyValue(1.0) || N0CFP->isExactlyValue(-1.0)))
1236912369
return SDValue();
1237012370

1237112371
// Exit early if the target does not want this transform or if there can't
Lines changed: 32 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,32 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc < %s -mtriple=powerpc64le-unknown-unknown | FileCheck %s
3+
4+
; Infinite loop identified in D62963.
5+
define <4 x double> @fneg_fdiv_splat(double %a0, <4 x double> %a1) {
6+
; CHECK-LABEL: fneg_fdiv_splat:
7+
; CHECK: # %bb.0: # %entry
8+
; CHECK-NEXT: # kill: def $f1 killed $f1 def $vsl1
9+
; CHECK-NEXT: xxspltd 0, 1, 0
10+
; CHECK-NEXT: addis 3, 2, .LCPI0_0@toc@ha
11+
; CHECK-NEXT: addi 3, 3, .LCPI0_0@toc@l
12+
; CHECK-NEXT: lxvd2x 1, 0, 3
13+
; CHECK-NEXT: addis 3, 2, .LCPI0_1@toc@ha
14+
; CHECK-NEXT: xvredp 2, 0
15+
; CHECK-NEXT: addi 3, 3, .LCPI0_1@toc@l
16+
; CHECK-NEXT: xxswapd 1, 1
17+
; CHECK-NEXT: xvnmsubadp 1, 2, 0
18+
; CHECK-NEXT: xvmaddadp 2, 2, 1
19+
; CHECK-NEXT: lxvd2x 1, 0, 3
20+
; CHECK-NEXT: xxswapd 1, 1
21+
; CHECK-NEXT: xvmaddadp 1, 0, 2
22+
; CHECK-NEXT: xvmsubadp 2, 2, 1
23+
; CHECK-NEXT: xvmuldp 34, 34, 2
24+
; CHECK-NEXT: xvmuldp 35, 35, 2
25+
; CHECK-NEXT: blr
26+
entry:
27+
%splat.splatinsert = insertelement <4 x double> undef, double %a0, i32 0
28+
%splat.splat = shufflevector <4 x double> %splat.splatinsert, <4 x double> undef, <4 x i32> zeroinitializer
29+
%div = fdiv fast <4 x double> %a1, %splat.splat
30+
%sub = fsub fast <4 x double> <double 0.000000e+00, double 0.000000e+00, double 0.000000e+00, double 0.000000e+00>, %div
31+
ret <4 x double> %sub
32+
}

0 commit comments

Comments
 (0)
Please sign in to comment.