Skip to content

Commit bb5c389

Browse files
zjaffalarsenm
andauthored
[InstCombine] Optimise x / sqrt(y / z) with fast-math pattern. (#76737)
Replace the pattern with x * sqrt(z/y) --------- Co-authored-by: Matt Arsenault <[email protected]>
1 parent 2884d04 commit bb5c389

File tree

2 files changed

+39
-9
lines changed

2 files changed

+39
-9
lines changed

llvm/lib/Transforms/InstCombine/InstCombineMulDivRem.cpp

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1709,6 +1709,33 @@ static Instruction *foldFDivPowDivisor(BinaryOperator &I,
17091709
return BinaryOperator::CreateFMulFMF(Op0, Pow, &I);
17101710
}
17111711

1712+
/// Convert div to mul if we have an sqrt divisor iff sqrt's operand is a fdiv
1713+
/// instruction.
1714+
static Instruction *foldFDivSqrtDivisor(BinaryOperator &I,
1715+
InstCombiner::BuilderTy &Builder) {
1716+
// X / sqrt(Y / Z) --> X * sqrt(Z / Y)
1717+
if (!I.hasAllowReassoc() || !I.hasAllowReciprocal())
1718+
return nullptr;
1719+
Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
1720+
auto *II = dyn_cast<IntrinsicInst>(Op1);
1721+
if (!II || II->getIntrinsicID() != Intrinsic::sqrt || !II->hasOneUse() ||
1722+
!II->hasAllowReassoc() || !II->hasAllowReciprocal())
1723+
return nullptr;
1724+
1725+
Value *Y, *Z;
1726+
auto *DivOp = dyn_cast<Instruction>(II->getOperand(0));
1727+
if (!DivOp || !DivOp->hasAllowReassoc() || !I.hasAllowReciprocal() ||
1728+
!DivOp->hasOneUse())
1729+
return nullptr;
1730+
if (match(DivOp, m_FDiv(m_Value(Y), m_Value(Z)))) {
1731+
Value *SwapDiv = Builder.CreateFDivFMF(Z, Y, DivOp);
1732+
Value *NewSqrt =
1733+
Builder.CreateUnaryIntrinsic(II->getIntrinsicID(), SwapDiv, II);
1734+
return BinaryOperator::CreateFMulFMF(Op0, NewSqrt, &I);
1735+
}
1736+
return nullptr;
1737+
}
1738+
17121739
Instruction *InstCombinerImpl::visitFDiv(BinaryOperator &I) {
17131740
Module *M = I.getModule();
17141741

@@ -1816,6 +1843,9 @@ Instruction *InstCombinerImpl::visitFDiv(BinaryOperator &I) {
18161843
if (Instruction *Mul = foldFDivPowDivisor(I, Builder))
18171844
return Mul;
18181845

1846+
if (Instruction *Mul = foldFDivSqrtDivisor(I, Builder))
1847+
return Mul;
1848+
18191849
// pow(X, Y) / X --> pow(X, Y-1)
18201850
if (I.hasAllowReassoc() &&
18211851
match(Op0, m_OneUse(m_Intrinsic<Intrinsic::pow>(m_Specific(Op1),

llvm/test/Transforms/InstCombine/fdiv-sqrt.ll

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -6,9 +6,9 @@ declare double @llvm.sqrt.f64(double)
66
define double @sqrt_div_fast(double %x, double %y, double %z) {
77
; CHECK-LABEL: @sqrt_div_fast(
88
; CHECK-NEXT: entry:
9-
; CHECK-NEXT: [[DIV:%.*]] = fdiv fast double [[Y:%.*]], [[Z:%.*]]
10-
; CHECK-NEXT: [[SQRT:%.*]] = call fast double @llvm.sqrt.f64(double [[DIV]])
11-
; CHECK-NEXT: [[DIV1:%.*]] = fdiv fast double [[X:%.*]], [[SQRT]]
9+
; CHECK-NEXT: [[TMP0:%.*]] = fdiv fast double [[Z:%.*]], [[Y:%.*]]
10+
; CHECK-NEXT: [[TMP1:%.*]] = call fast double @llvm.sqrt.f64(double [[TMP0]])
11+
; CHECK-NEXT: [[DIV1:%.*]] = fmul fast double [[TMP1]], [[X:%.*]]
1212
; CHECK-NEXT: ret double [[DIV1]]
1313
;
1414
entry:
@@ -36,9 +36,9 @@ entry:
3636
define double @sqrt_div_reassoc_arcp(double %x, double %y, double %z) {
3737
; CHECK-LABEL: @sqrt_div_reassoc_arcp(
3838
; CHECK-NEXT: entry:
39-
; CHECK-NEXT: [[DIV:%.*]] = fdiv reassoc arcp double [[Y:%.*]], [[Z:%.*]]
40-
; CHECK-NEXT: [[SQRT:%.*]] = call reassoc arcp double @llvm.sqrt.f64(double [[DIV]])
41-
; CHECK-NEXT: [[DIV1:%.*]] = fdiv reassoc arcp double [[X:%.*]], [[SQRT]]
39+
; CHECK-NEXT: [[TMP0:%.*]] = fdiv reassoc arcp double [[Z:%.*]], [[Y:%.*]]
40+
; CHECK-NEXT: [[TMP1:%.*]] = call reassoc arcp double @llvm.sqrt.f64(double [[TMP0]])
41+
; CHECK-NEXT: [[DIV1:%.*]] = fmul reassoc arcp double [[TMP1]], [[X:%.*]]
4242
; CHECK-NEXT: ret double [[DIV1]]
4343
;
4444
entry:
@@ -96,9 +96,9 @@ entry:
9696
define double @sqrt_div_arcp_missing(double %x, double %y, double %z) {
9797
; CHECK-LABEL: @sqrt_div_arcp_missing(
9898
; CHECK-NEXT: entry:
99-
; CHECK-NEXT: [[DIV:%.*]] = fdiv reassoc double [[Y:%.*]], [[Z:%.*]]
100-
; CHECK-NEXT: [[SQRT:%.*]] = call reassoc arcp double @llvm.sqrt.f64(double [[DIV]])
101-
; CHECK-NEXT: [[DIV1:%.*]] = fdiv reassoc arcp double [[X:%.*]], [[SQRT]]
99+
; CHECK-NEXT: [[TMP0:%.*]] = fdiv reassoc double [[Z:%.*]], [[Y:%.*]]
100+
; CHECK-NEXT: [[TMP1:%.*]] = call reassoc arcp double @llvm.sqrt.f64(double [[TMP0]])
101+
; CHECK-NEXT: [[DIV1:%.*]] = fmul reassoc arcp double [[TMP1]], [[X:%.*]]
102102
; CHECK-NEXT: ret double [[DIV1]]
103103
;
104104
entry:

0 commit comments

Comments
 (0)