llvm
Lines changed: 7 additions & 3 deletions
diff --git a/llvm/lib/Transforms/Vectorize/VPlanTransforms.cpp b/llvm/lib/Transforms/Vectorize/VPlanTransforms.cpp
--- a/llvm/lib/Transforms/Vectorize/VPlanTransforms.cpp
+++ b/llvm/lib/Transforms/Vectorize/VPlanTransforms.cpp
@@ -1105,10 +1105,10 @@ static bool optimizeVectorInductionWidthForTCAndVFUF(VPlan &Plan,
 
   // Calculate the widest type required for known TC, VF and UF.
   auto ComputeBitWidth = [](APInt TC, uint64_t Align) {
-    auto AlignedTC =
+    APInt AlignedTC =
         Align * APIntOps::RoundingUDiv(TC, APInt(TC.getBitWidth(), Align),
                                        APInt::Rounding::UP);
-    auto MaxVal = AlignedTC - 1;
+    APInt MaxVal = AlignedTC - 1;
     return std::max<unsigned>(PowerOf2Ceil(MaxVal.getActiveBits()), 8);
   };
   unsigned NewBitWidth =
@@ -1122,6 +1122,10 @@ static bool optimizeVectorInductionWidthForTCAndVFUF(VPlan &Plan,
   VPBasicBlock *HeaderVPBB = Plan.getVectorLoopRegion()->getEntryBasicBlock();
   for (VPRecipeBase &Phi : HeaderVPBB->phis()) {
     auto *WideIV = dyn_cast<VPWidenIntOrFpInductionRecipe>(&Phi);
+
+    // Currently only handle canonical IVs as it is trivial to replace the start
+    // and stop values, and we only perform the optimisation when the IV is only
+    // used by the comparison controlling loop control-flow.
     if (!WideIV || !WideIV->isCanonical() ||
         WideIV->hasMoreThanOneUniqueUser() ||
         NewIVTy == WideIV->getScalarType())
@@ -1145,7 +1149,7 @@ static bool optimizeVectorInductionWidthForTCAndVFUF(VPlan &Plan,
     auto *NewBTC = new VPWidenCastRecipe(
         Instruction::Trunc, Plan.getOrCreateBackedgeTakenCount(), NewIVTy);
     Plan.getVectorPreheader()->appendRecipe(NewBTC);
-    auto *Cmp = dyn_cast<VPInstruction>(*WideIV->user_begin());
+    auto *Cmp = cast<VPInstruction>(*WideIV->user_begin());
     Cmp->setOperand(1, NewBTC);
 
     MadeChange = true;