[sil-optimizer] Add FP comparison support in constant folder

jkshtj · jkshtj · commit 02c2e0432b2b · 2023-11-13T15:32:02.000-08:00
diff --git a/include/swift/SILOptimizer/Utils/ConstantFolding.h b/include/swift/SILOptimizer/Utils/ConstantFolding.h
@@ -31,10 +31,16 @@ class SILOptFunctionBuilder;
 /// The \p ID must be the ID of a binary bit-operation builtin.
 APInt constantFoldBitOperation(APInt lhs, APInt rhs, BuiltinValueKind ID);
 
+/// Evaluates the constant result of a floating point comparison.
+///
+/// The \p ID must be the ID of a floating point comparison builtin (one of
+/// the FCMP_* kinds); any other ID is treated as unreachable. When either
+/// operand is NaN, the ordered predicates evaluate to false and the unordered
+/// predicates evaluate to true. The result is returned as a 1-bit APInt.
+APInt constantFoldComparisonFloat(APFloat lhs, APFloat rhs,
+                                  BuiltinValueKind ID);
+
 /// Evaluates the constant result of an integer comparison.
 ///
 /// The \p ID must be the ID of an integer builtin operation.
-APInt constantFoldComparison(APInt lhs, APInt rhs, BuiltinValueKind ID);
+APInt constantFoldComparisonInt(APInt lhs, APInt rhs, BuiltinValueKind ID);
 
 /// Evaluates the constant result of a binary operation with overflow.
 ///
diff --git a/lib/SILOptimizer/Utils/ConstantFolding.cpp b/lib/SILOptimizer/Utils/ConstantFolding.cpp
@@ -50,7 +50,66 @@ APInt swift::constantFoldBitOperation(APInt lhs, APInt rhs, BuiltinValueKind ID)
   }
 }
 
-APInt swift::constantFoldComparison(APInt lhs, APInt rhs, BuiltinValueKind ID) {
+APInt swift::constantFoldComparisonFloat(APFloat lhs, APFloat rhs,
+                                         BuiltinValueKind ID) {
+  // A comparison is unordered as soon as either operand is NaN. Ordered
+  // predicates are false in that case, unordered predicates are true.
+  const bool eitherIsNaN = lhs.isNaN() || rhs.isNaN();
+
+  // Wraps a boolean outcome in the 1-bit integer that is returned to callers.
+  auto asBit = [](bool outcome) { return APInt(1, outcome); };
+
+  switch (ID) {
+  // Ordered predicates: no NaN operand and the relation holds.
+  case BuiltinValueKind::FCMP_OEQ:
+    return asBit(!eitherIsNaN && lhs == rhs);
+  case BuiltinValueKind::FCMP_OGT:
+    return asBit(!eitherIsNaN && lhs > rhs);
+  case BuiltinValueKind::FCMP_OGE:
+    return asBit(!eitherIsNaN && lhs >= rhs);
+  case BuiltinValueKind::FCMP_OLT:
+    return asBit(!eitherIsNaN && lhs < rhs);
+  case BuiltinValueKind::FCMP_OLE:
+    return asBit(!eitherIsNaN && lhs <= rhs);
+  case BuiltinValueKind::FCMP_ONE:
+    return asBit(!eitherIsNaN && lhs != rhs);
+  case BuiltinValueKind::FCMP_ORD:
+    return asBit(!eitherIsNaN);
+
+  // Unordered predicates: a NaN operand or the relation holds.
+  case BuiltinValueKind::FCMP_UEQ:
+    return asBit(eitherIsNaN || lhs == rhs);
+  case BuiltinValueKind::FCMP_UGT:
+    return asBit(eitherIsNaN || lhs > rhs);
+  case BuiltinValueKind::FCMP_UGE:
+    return asBit(eitherIsNaN || lhs >= rhs);
+  case BuiltinValueKind::FCMP_ULT:
+    return asBit(eitherIsNaN || lhs < rhs);
+  case BuiltinValueKind::FCMP_ULE:
+    return asBit(eitherIsNaN || lhs <= rhs);
+  case BuiltinValueKind::FCMP_UNE:
+    return asBit(eitherIsNaN || lhs != rhs);
+  case BuiltinValueKind::FCMP_UNO:
+    return asBit(eitherIsNaN);
+
+  default:
+    llvm_unreachable("Invalid float compare kind");
+  }
+}
+
+APInt swift::constantFoldComparisonInt(APInt lhs, APInt rhs,
+                                       BuiltinValueKind ID) {
   bool result;
   switch (ID) {
     default: llvm_unreachable("Invalid integer compare kind");
@@ -351,14 +410,235 @@ static SILValue constantFoldIntrinsic(BuiltinInst *BI, llvm::Intrinsic::ID ID,
   return nullptr;
 }
 
-static SILValue constantFoldCompare(BuiltinInst *BI, BuiltinValueKind ID) {
+/// Tries to fold the floating point comparison builtin \p BI, whose builtin
+/// kind is \p ID, into a 1-bit integer literal.
+///
+/// Returns the folded literal, or a null SILValue when the outcome cannot be
+/// decided at compile time. Only folds that hold for *every* possible value
+/// of the non-constant operand (including NaN and +/-infinity) are performed:
+///   - both operands are float literals, or both are bitcast integer
+///     literals: the comparison is evaluated directly;
+///   - one operand is a NaN constant: ordered predicates are false, unordered
+///     predicates are true;
+///   - one operand is +infinity: `+Inf uge x` / `x ule +Inf` are true and
+///     `x ogt +Inf` / `+Inf olt x` are false.
+/// Comparisons such as `x < +Inf` or `x <= MAX` are deliberately NOT folded:
+/// they are false when x is +Inf (and, for ordered predicates, when x is
+/// NaN), so no constant is correct for them.
+static SILValue constantFoldCompareFloat(BuiltinInst *BI, BuiltinValueKind ID) {
+  OperandValueArrayRef Args = BI->getArguments();
+
+  // Materializes a folded result as an integer literal of the builtin's
+  // result type, placed at the builtin.
+  auto foldTo = [BI](const APInt &value) -> SILValue {
+    SILBuilderWithScope B(BI);
+    return B.createIntegerLiteral(BI->getLoc(), BI->getType(), value);
+  };
+
+  // Fold for floating point constant arguments.
+  auto *LHS = dyn_cast<FloatLiteralInst>(Args[0]);
+  auto *RHS = dyn_cast<FloatLiteralInst>(Args[1]);
+  if (LHS && RHS)
+    return foldTo(
+        constantFoldComparisonFloat(LHS->getValue(), RHS->getValue(), ID));
+
+  // Everything below only applies to the relational float predicates. This
+  // function is also reached for other comparison kinds, which must be left
+  // untouched.
+  bool isOrderedPredicate;
+  switch (ID) {
+  case BuiltinValueKind::FCMP_OEQ:
+  case BuiltinValueKind::FCMP_OGT:
+  case BuiltinValueKind::FCMP_OGE:
+  case BuiltinValueKind::FCMP_OLT:
+  case BuiltinValueKind::FCMP_OLE:
+  case BuiltinValueKind::FCMP_ONE:
+    isOrderedPredicate = true;
+    break;
+  case BuiltinValueKind::FCMP_UEQ:
+  case BuiltinValueKind::FCMP_UGT:
+  case BuiltinValueKind::FCMP_UGE:
+  case BuiltinValueKind::FCMP_ULT:
+  case BuiltinValueKind::FCMP_ULE:
+  case BuiltinValueKind::FCMP_UNE:
+    isOrderedPredicate = false;
+    break;
+  default:
+    return nullptr;
+  }
+
+  using namespace swift::PatternMatch;
+
+  // Look for `bitcast(integer_literal)` on either side of the comparison.
+  SILValue Other;
+  IntegerLiteralInst *lhsBits = nullptr;
+  IntegerLiteralInst *rhsBits = nullptr;
+  if (!match(BI, m_BuiltinInst(ID, m_BitCast(m_IntegerLiteralInst(lhsBits)),
+                               m_SILValue(Other))))
+    lhsBits = nullptr;
+  if (!match(BI, m_BuiltinInst(ID, m_SILValue(Other),
+                               m_BitCast(m_IntegerLiteralInst(rhsBits)))))
+    rhsBits = nullptr;
+
+  // Reinterprets the literal's bits as an IEEE single/double value. Other
+  // widths are not decoded because the float format is ambiguous from the
+  // bit width alone.
+  auto decode = [](IntegerLiteralInst *literal, APFloat &out) -> bool {
+    if (!literal)
+      return false;
+    APInt raw = literal->getValue();
+    switch (raw.getBitWidth()) {
+    case 32:
+      out = APFloat(llvm::APFloatBase::IEEEsingle(), raw);
+      return true;
+    case 64:
+      out = APFloat(llvm::APFloatBase::IEEEdouble(), raw);
+      return true;
+    default:
+      return false;
+    }
+  };
+
+  APFloat lhsValue(0.0);
+  APFloat rhsValue(0.0);
+  const bool hasLHS = decode(lhsBits, lhsValue);
+  const bool hasRHS = decode(rhsBits, rhsValue);
+  if (!hasLHS && !hasRHS)
+    return nullptr;
+
+  // Both operands are known constants of the same format: evaluate directly.
+  if (hasLHS && hasRHS &&
+      &lhsValue.getSemantics() == &rhsValue.getSemantics())
+    return foldTo(constantFoldComparisonFloat(lhsValue, rhsValue, ID));
+
+  // A NaN operand (any payload, either sign) makes the comparison unordered:
+  // ordered predicates are false, unordered predicates are true.
+  if ((hasLHS && lhsValue.isNaN()) || (hasRHS && rhsValue.isNaN()))
+    return foldTo(APInt(1, !isOrderedPredicate));
+
+  const bool lhsIsPosInf =
+      hasLHS && lhsValue.isInfinity() && !lhsValue.isNegative();
+  const bool rhsIsPosInf =
+      hasRHS && rhsValue.isInfinity() && !rhsValue.isNegative();
+
+  if (lhsIsPosInf) {
+    // +Inf >= x holds for every non-NaN x, and NaN makes `uge` true.
+    if (ID == BuiltinValueKind::FCMP_UGE)
+      return foldTo(APInt(1, 1));
+    // +Inf < x never holds, and NaN makes `olt` false.
+    if (ID == BuiltinValueKind::FCMP_OLT)
+      return foldTo(APInt(1, 0));
+  }
+
+  if (rhsIsPosInf) {
+    // x <= +Inf holds for every non-NaN x, and NaN makes `ule` true.
+    if (ID == BuiltinValueKind::FCMP_ULE)
+      return foldTo(APInt(1, 1));
+    // x > +Inf never holds, and NaN makes `ogt` false.
+    if (ID == BuiltinValueKind::FCMP_OGT)
+      return foldTo(APInt(1, 0));
+  }
+
+  return nullptr;
+}
+
+static SILValue constantFoldCompareInt(BuiltinInst *BI, BuiltinValueKind ID) {
   OperandValueArrayRef Args = BI->getArguments();
 
   // Fold for integer constant arguments.
   auto *LHS = dyn_cast<IntegerLiteralInst>(Args[0]);
   auto *RHS = dyn_cast<IntegerLiteralInst>(Args[1]);
   if (LHS && RHS) {
-    APInt Res = constantFoldComparison(LHS->getValue(), RHS->getValue(), ID);
+    APInt Res = constantFoldComparisonInt(LHS->getValue(), RHS->getValue(), ID);
     SILBuilderWithScope B(BI);
     return B.createIntegerLiteral(BI->getLoc(), BI->getType(), Res);
   }
@@ -480,6 +760,17 @@ static SILValue constantFoldCompare(BuiltinInst *BI, BuiltinValueKind ID) {
   return nullptr;
 }
 
+/// Folds a comparison builtin by trying the integer folder first and falling
+/// back to the floating point folder. Yields a null value when neither
+/// folder produces a result.
+static SILValue constantFoldCompare(BuiltinInst *BI, BuiltinValueKind ID) {
+  SILValue folded = constantFoldCompareInt(BI, ID);
+  // Only consult the floating point folder when integer folding gave up.
+  if (!folded)
+    folded = constantFoldCompareFloat(BI, ID);
+  return folded;
+}
+
 static SILValue
 constantFoldAndCheckDivision(BuiltinInst *BI, BuiltinValueKind ID,
                              llvm::Optional<bool> &ResultsInError) {
@@ -1893,6 +2184,12 @@ ConstantFolder::processWorkList() {
           }
         }
 
+        // If the user is a bitcast, we may be able to constant
+        // fold its users.
+        if (isApplyOfBuiltin(*User, BuiltinValueKind::BitCast)) {
+          WorkList.insert(User);
+        }
+
         // Initialize ResultsInError as a None optional.
         //
         // We are essentially using this optional to represent 3 states: true,
diff --git a/lib/SILOptimizer/Utils/PerformanceInlinerUtils.cpp b/lib/SILOptimizer/Utils/PerformanceInlinerUtils.cpp
@@ -190,9 +190,9 @@ case BuiltinValueKind::id:
       IntConst lhs = getIntConst(Args[0], depth);
       IntConst rhs = getIntConst(Args[1], depth);
       if (lhs.isValid && rhs.isValid) {
-        return IntConst(constantFoldComparison(lhs.value, rhs.value,
-                                               Builtin.ID),
-                        lhs.isFromCaller || rhs.isFromCaller);
+        return IntConst(
+            constantFoldComparisonInt(lhs.value, rhs.value, Builtin.ID),
+            lhs.isFromCaller || rhs.isFromCaller);
       }
       break;
     }
diff --git a/test/AutoDiff/SILOptimizer/vjp_and_pullback_inlining.swift b/test/AutoDiff/SILOptimizer/vjp_and_pullback_inlining.swift
@@ -40,7 +40,12 @@ func caller_of_simple_vjp() -> Float {
 @_silgen_name("pb_with_control_flow")
 func pb_with_control_flow(_ x: Float) -> Float {
   if (x > 0) {
-    return sin(x) * cos(x)
+        let a = x * x;
+        let b = x + x;
+        let c = x * a;
+        let d = a + b;
+        let e = b * c;
+        return a * b / c + d - e ;
   } else {
     return sin(x) + cos(x)
   }
@@ -55,7 +60,6 @@ func caller_of_pb_with_control_flow() -> Float {
 // CHECK: decision {{{.*}}, b=70, {{.*}}} pb_with_control_flowTJpSpSr
 // CHECK-NEXT: "pb_with_control_flowTJpSpSr" inlined into "caller_of_pb_with_control_flow"
 
-
 @differentiable(reverse)
 func double(x: Float) -> Float {
     return x + x
diff --git a/test/SILOptimizer/constant_propagation.sil b/test/SILOptimizer/constant_propagation.sil

Original file line number	Diff line number	Diff line change
`@@ -190,9 +190,9 @@ case BuiltinValueKind::id:`
`190`	`190`	`IntConst lhs = getIntConst(Args[0], depth);`
`191`	`191`	`IntConst rhs = getIntConst(Args[1], depth);`
`192`	`192`	`if (lhs.isValid && rhs.isValid) {`
`193`		`- return IntConst(constantFoldComparison(lhs.value, rhs.value,`
`194`		`- Builtin.ID),`
`195`		`- lhs.isFromCaller \|\| rhs.isFromCaller);`
	`193`	`+ return IntConst(`
	`194`	`+ constantFoldComparisonInt(lhs.value, rhs.value, Builtin.ID),`
	`195`	`+ lhs.isFromCaller \|\| rhs.isFromCaller);`
`196`	`196`	`}`
`197`	`197`	`break;`
`198`	`198`	`}`