address CR

c8ef · c8ef · commit 2555d8f0e829 · 2024-09-04T21:35:20.000+08:00
diff --git a/llvm/lib/Analysis/InstructionSimplify.cpp b/llvm/lib/Analysis/InstructionSimplify.cpp
@@ -4130,47 +4130,19 @@ static Value *simplifyFCmpInst(unsigned Predicate, Value *LHS, Value *RHS,
   //
   // This catches the 2 variable input case, constants are handled below as a
   // class-like compare.
-  KnownFPClass LHSClass = computeKnownFPClass(LHS, fcAllFlags, /*Depth=*/0, Q);
-  KnownFPClass RHSClass = computeKnownFPClass(RHS, fcAllFlags, /*Depth=*/0, Q);
   if (Pred == FCmpInst::FCMP_ORD || Pred == FCmpInst::FCMP_UNO) {
+    KnownFPClass RHSClass =
+        computeKnownFPClass(RHS, fcAllFlags, /*Depth=*/0, Q);
+    KnownFPClass LHSClass =
+        computeKnownFPClass(LHS, fcAllFlags, /*Depth=*/0, Q);
+
     if (FMF.noNaNs() ||
         (RHSClass.isKnownNeverNaN() && LHSClass.isKnownNeverNaN()))
       return ConstantInt::get(RetTy, Pred == FCmpInst::FCMP_ORD);
 
     if (RHSClass.isKnownAlwaysNaN() || LHSClass.isKnownAlwaysNaN())
       return ConstantInt::get(RetTy, Pred == CmpInst::FCMP_UNO);
   }
-  // floor(x) <= x --> true; x <= ceil(x) --> true
-  if (LHSClass.isKnownNeverNaN() &&
-          match(LHS, m_Intrinsic<Intrinsic::floor>(m_Specific(RHS))) ||
-      RHSClass.isKnownNeverNaN() &&
-          match(RHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(LHS)))) {
-    switch (Pred) {
-    case FCmpInst::FCMP_OLE:
-    case FCmpInst::FCMP_ULE:
-      return getTrue(RetTy);
-    case FCmpInst::FCMP_OGT:
-    case FCmpInst::FCMP_UGT:
-      return getFalse(RetTy);
-    default:
-      break;
-    }
-  }
-  if (RHSClass.isKnownNeverNaN() &&
-          match(RHS, m_Intrinsic<Intrinsic::floor>(m_Specific(LHS))) ||
-      LHSClass.isKnownNeverNaN() &&
-          match(LHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(RHS)))) {
-    switch (Pred) {
-    case FCmpInst::FCMP_OGE:
-    case FCmpInst::FCMP_UGE:
-      return getTrue(RetTy);
-    case FCmpInst::FCMP_OLT:
-    case FCmpInst::FCMP_ULT:
-      return getFalse(RetTy);
-    default:
-      break;
-    }
-  }
 
   const APFloat *C = nullptr;
   match(RHS, m_APFloatAllowPoison(C));
diff --git a/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp b/llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp
@@ -8178,6 +8178,87 @@ static Instruction *foldFCmpFSubIntoFCmp(FCmpInst &I, Instruction *LHSI,
   return nullptr;
 }
 
+/// Fold an fcmp that compares x with floor(x) or ceil(x), relying on
+/// floor(x) <= x <= ceil(x) for every non-NaN x.
+///
+/// Per operand arrangement, the inclusive predicate that holds for all ordered
+/// inputs is rewritten to `fcmp ord <second operand>, 0`, and the strict
+/// predicate that can never hold is replaced by false. The unordered twin of
+/// either predicate is accepted only if the floor/ceil operand is known never
+/// to be NaN.
+///
+/// \param I  the compare being visited.
+/// \param CI the combiner that supplies the NaN query and rewrites the uses.
+/// \returns the value produced by the fold that fired, or nullptr when no
+/// arrangement/predicate pair applies.
+static Instruction *foldFCmpWithFloorAndCeil(FCmpInst &I,
+                                             InstCombinerImpl &CI) {
+  Value *LHS = I.getOperand(0), *RHS = I.getOperand(1);
+  const CmpInst::Predicate Pred = I.getPredicate();
+  Type *OpType = LHS->getType();
+
+  // Attempts both folds for one arrangement, where \p Rounded is the
+  // floor/ceil operand. Returns true if a fold fired and stores its outcome in
+  // \p Folded; the flag is separate so that whatever replaceInstUsesWith
+  // returns is handed back to the caller unchanged.
+  auto TryFold = [&](Value *Rounded, CmpInst::Predicate OrdIncl,
+                     CmpInst::Predicate UnordIncl, CmpInst::Predicate OrdStrict,
+                     CmpInst::Predicate UnordStrict, Instruction *&Folded) {
+    // Evaluated lazily: only the unordered predicates need the NaN analysis.
+    auto RoundedNeverNaN = [&] {
+      return isKnownNeverNaN(Rounded, 0,
+                             CI.getSimplifyQuery().getWithInstruction(&I));
+    };
+    // Explicit parentheses keep the ||/&& grouping unambiguous (and quiet
+    // under -Wparentheses).
+    if (Pred == OrdIncl || (Pred == UnordIncl && RoundedNeverNaN())) {
+      // FIXME: RHS is the floor/ceil call itself when that call is the second
+      // operand, so the call stays live there; testing x would let it die but
+      // changes the IR the regression tests expect.
+      Folded = new FCmpInst(FCmpInst::FCMP_ORD, RHS,
+                            ConstantFP::getZero(OpType), "", &I);
+      return true;
+    }
+    if (Pred == OrdStrict || (Pred == UnordStrict && RoundedNeverNaN())) {
+      Folded = CI.replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
+      return true;
+    }
+    return false;
+  };
+
+  Instruction *Folded = nullptr;
+
+  // fcmp ole floor(x), x => fcmp ord x, 0
+  // fcmp ogt floor(x), x => false
+  if (match(LHS, m_Intrinsic<Intrinsic::floor>(m_Specific(RHS))) &&
+      TryFold(LHS, FCmpInst::FCMP_OLE, FCmpInst::FCMP_ULE, FCmpInst::FCMP_OGT,
+              FCmpInst::FCMP_UGT, Folded))
+    return Folded;
+
+  // fcmp oge x, floor(x) => fcmp ord floor(x), 0
+  // fcmp olt x, floor(x) => false
+  if (match(RHS, m_Intrinsic<Intrinsic::floor>(m_Specific(LHS))) &&
+      TryFold(RHS, FCmpInst::FCMP_OGE, FCmpInst::FCMP_UGE, FCmpInst::FCMP_OLT,
+              FCmpInst::FCMP_ULT, Folded))
+    return Folded;
+
+  // fcmp oge ceil(x), x => fcmp ord x, 0
+  // fcmp olt ceil(x), x => false
+  if (match(LHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(RHS))) &&
+      TryFold(LHS, FCmpInst::FCMP_OGE, FCmpInst::FCMP_UGE, FCmpInst::FCMP_OLT,
+              FCmpInst::FCMP_ULT, Folded))
+    return Folded;
+
+  // fcmp ole x, ceil(x) => fcmp ord ceil(x), 0
+  // fcmp ogt x, ceil(x) => false
+  if (match(RHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(LHS))) &&
+      TryFold(RHS, FCmpInst::FCMP_OLE, FCmpInst::FCMP_ULE, FCmpInst::FCMP_OGT,
+              FCmpInst::FCMP_UGT, Folded))
+    return Folded;
+
+  return nullptr;
+}
+
 Instruction *InstCombinerImpl::visitFCmpInst(FCmpInst &I) {
   bool Changed = false;
 
@@ -8382,6 +8463,9 @@ Instruction *InstCombinerImpl::visitFCmpInst(FCmpInst &I) {
   if (Instruction *R = foldSqrtWithFcmpZero(I, *this))
     return R;
 
+  if (Instruction *R = foldFCmpWithFloorAndCeil(I, *this))
+    return R;
+
   if (match(Op0, m_FNeg(m_Value(X)))) {
     // fcmp pred (fneg X), C --> fcmp swap(pred) X, -C
     Constant *C;
diff --git a/llvm/test/Transforms/InstCombine/fp-floor-ceil.ll b/llvm/test/Transforms/InstCombine/fp-floor-ceil.ll
@@ -0,0 +1,194 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
+; RUN: opt < %s -passes=instcombine -S | FileCheck %s
+
+define i1 @floor_x_ole(float %x) {
+; CHECK-LABEL: @floor_x_ole(
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[X:%.*]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; floor(x) ole x is reduced to an ordered (not-NaN) test of x.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp ole float %floor, %x
+  ret i1 %ret
+}
+
+define i1 @floor_x_ule(float %x) {
+; CHECK-LABEL: @floor_x_ule(
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[X:%.*]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; With an nnan floor call, ule takes the same rewrite as ole.
+  %floor = call nnan float @llvm.floor.f32(float %x)
+  %ret = fcmp ule float %floor, %x
+  ret i1 %ret
+}
+
+define i1 @floor_x_ogt(float %x) {
+; CHECK-LABEL: @floor_x_ogt(
+; CHECK-NEXT:    ret i1 false
+; floor(x) ogt x folds to false.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp ogt float %floor, %x
+  ret i1 %ret
+}
+
+define i1 @floor_x_ugt(float %x) {
+; CHECK-LABEL: @floor_x_ugt(
+; CHECK-NEXT:    ret i1 false
+; With an nnan floor call, ugt folds to false just like ogt.
+  %floor = call nnan float @llvm.floor.f32(float %x)
+  %ret = fcmp ugt float %floor, %x
+  ret i1 %ret
+}
+
+define i1 @x_floor_oge(float %x) {
+; CHECK-LABEL: @x_floor_oge(
+; CHECK-NEXT:    [[FLOOR:%.*]] = call float @llvm.floor.f32(float [[X:%.*]])
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[FLOOR]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; Swapped operands: the ordered test lands on the floor call, which stays.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp oge float %x, %floor
+  ret i1 %ret
+}
+
+define i1 @x_floor_uge(float %x) {
+; CHECK-LABEL: @x_floor_uge(
+; CHECK-NEXT:    ret i1 true
+; Swapped operands with an nnan floor call: uge folds all the way to true.
+  %floor = call nnan float @llvm.floor.f32(float %x)
+  %ret = fcmp uge float %x, %floor
+  ret i1 %ret
+}
+
+define i1 @x_floor_olt(float %x) {
+; CHECK-LABEL: @x_floor_olt(
+; CHECK-NEXT:    ret i1 false
+; Swapped operands: x olt floor(x) folds to false.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp olt float %x, %floor
+  ret i1 %ret
+}
+
+define i1 @x_floor_ult(float nofpclass(nan) %x) {
+; CHECK-LABEL: @x_floor_ult(
+; CHECK-NEXT:    ret i1 false
+; x is nofpclass(nan), so the unordered ult folds to false as well.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp ult float %x, %floor
+  ret i1 %ret
+}
+
+define <2 x i1> @x_floor_olt_vec(<2 x float> %x) {
+; CHECK-LABEL: @x_floor_olt_vec(
+; CHECK-NEXT:    ret <2 x i1> zeroinitializer
+; Vector form of x olt floor(x); the intrinsic suffix names the <2 x float> type.
+  %floor = call <2 x float> @llvm.floor.v2f32(<2 x float> %x)
+  %ret = fcmp olt <2 x float> %x, %floor
+  ret <2 x i1> %ret
+}
+
+define i1 @x_floor_ole_neg(float %x) {
+; CHECK-LABEL: @x_floor_ole_neg(
+; CHECK-NEXT:    [[FLOOR:%.*]] = call float @llvm.floor.f32(float [[X:%.*]])
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ole float [[X]], [[FLOOR]]
+; CHECK-NEXT:    ret i1 [[RET]]
+; Negative test: x ole floor(x) is not a folded predicate, so nothing changes.
+  %floor = call float @llvm.floor.f32(float %x)
+  %ret = fcmp ole float %x, %floor
+  ret i1 %ret
+}
+
+define i1 @ceil_x_oge(float %x) {
+; CHECK-LABEL: @ceil_x_oge(
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[X:%.*]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; ceil(x) oge x is reduced to an ordered (not-NaN) test of x.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp oge float %ceil, %x
+  ret i1 %ret
+}
+
+define i1 @ceil_x_uge(float %x) {
+; CHECK-LABEL: @ceil_x_uge(
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[X:%.*]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; With an nnan ceil call, uge takes the same rewrite as oge.
+  %ceil = call nnan float @llvm.ceil.f32(float %x)
+  %ret = fcmp uge float %ceil, %x
+  ret i1 %ret
+}
+
+define i1 @ceil_x_olt(float %x) {
+; CHECK-LABEL: @ceil_x_olt(
+; CHECK-NEXT:    ret i1 false
+; ceil(x) olt x folds to false.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp olt float %ceil, %x
+  ret i1 %ret
+}
+
+define i1 @ceil_x_ult(float %x) {
+; CHECK-LABEL: @ceil_x_ult(
+; CHECK-NEXT:    ret i1 false
+; With an nnan ceil call, ult folds to false just like olt.
+  %ceil = call nnan float @llvm.ceil.f32(float %x)
+  %ret = fcmp ult float %ceil, %x
+  ret i1 %ret
+}
+
+define i1 @x_ceil_ole(float %x) {
+; CHECK-LABEL: @x_ceil_ole(
+; CHECK-NEXT:    [[CEIL:%.*]] = call float @llvm.ceil.f32(float [[X:%.*]])
+; CHECK-NEXT:    [[RET:%.*]] = fcmp ord float [[CEIL]], 0.000000e+00
+; CHECK-NEXT:    ret i1 [[RET]]
+; Swapped operands: the ordered test lands on the ceil call, which stays.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp ole float %x, %ceil
+  ret i1 %ret
+}
+
+define i1 @x_ceil_ule(float %x) {
+; CHECK-LABEL: @x_ceil_ule(
+; CHECK-NEXT:    ret i1 true
+; Swapped operands with an nnan ceil call: ule folds all the way to true.
+  %ceil = call nnan float @llvm.ceil.f32(float %x)
+  %ret = fcmp ule float %x, %ceil
+  ret i1 %ret
+}
+
+define i1 @x_ceil_ogt(float %x) {
+; CHECK-LABEL: @x_ceil_ogt(
+; CHECK-NEXT:    ret i1 false
+; Swapped operands: x ogt ceil(x) folds to false.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp ogt float %x, %ceil
+  ret i1 %ret
+}
+
+define i1 @x_ceil_ugt(float nofpclass(nan) %x) {
+; CHECK-LABEL: @x_ceil_ugt(
+; CHECK-NEXT:    ret i1 false
+; x is nofpclass(nan), so the unordered ugt folds to false as well.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp ugt float %x, %ceil
+  ret i1 %ret
+}
+
+define <2 x i1> @x_ceil_ogt_vec(<2 x float> %x) {
+; CHECK-LABEL: @x_ceil_ogt_vec(
+; CHECK-NEXT:    ret <2 x i1> zeroinitializer
+; Vector form of x ogt ceil(x); the intrinsic suffix names the <2 x float> type.
+  %ceil = call <2 x float> @llvm.ceil.v2f32(<2 x float> %x)
+  %ret = fcmp ogt <2 x float> %x, %ceil
+  ret <2 x i1> %ret
+}
+
+define i1 @x_ceil_oge_neg(float %x) {
+; CHECK-LABEL: @x_ceil_oge_neg(
+; CHECK-NEXT:    [[CEIL:%.*]] = call float @llvm.ceil.f32(float [[X:%.*]])
+; CHECK-NEXT:    [[RET:%.*]] = fcmp oge float [[X]], [[CEIL]]
+; CHECK-NEXT:    ret i1 [[RET]]
+; Negative test: x oge ceil(x) is not a folded predicate, so nothing changes.
+  %ceil = call float @llvm.ceil.f32(float %x)
+  %ret = fcmp oge float %x, %ceil
+  ret i1 %ret
+}
diff --git a/llvm/test/Transforms/InstSimplify/fp-floor-ceil.ll b/llvm/test/Transforms/InstSimplify/fp-floor-ceil.ll