llvm
diff --git a/‎llvm/lib/Transforms/Vectorize/LoopVectorize.cpp‎
Lines changed: 3 additions & 4 deletions b/‎llvm/lib/Transforms/Vectorize/LoopVectorize.cpp‎
Lines changed: 3 additions & 4 deletions
diff --git a/‎llvm/test/Transforms/LoopVectorize/Hexagon/maximum-vf-crash.ll‎
Lines changed: 29 additions & 0 deletions b/‎llvm/test/Transforms/LoopVectorize/Hexagon/maximum-vf-crash.ll‎
Lines changed: 29 additions & 0 deletions
@@ -5504,11 +5504,9 @@ LoopVectorizationCostModel::computeMaxVF(ElementCount UserVF, unsigned UserIC) {
  return None;
  }
 
- ElementCount MaxVF = computeFeasibleMaxVF(TC, UserVF);
-
  switch (ScalarEpilogueStatus) {
  case CM_ScalarEpilogueAllowed:
- return MaxVF;
+ return computeFeasibleMaxVF(TC, UserVF);
  case CM_ScalarEpilogueNotAllowedUsePredicate:
  LLVM_FALLTHROUGH;
  case CM_ScalarEpilogueNotNeededUsePredicate:
@@ -5546,7 +5544,7 @@ LoopVectorizationCostModel::computeMaxVF(ElementCount UserVF, unsigned UserIC) {
  LLVM_DEBUG(dbgs() << "LV: Cannot fold tail by masking: vectorize with a "
  "scalar epilogue instead.\n");
  ScalarEpilogueStatus = CM_ScalarEpilogueAllowed;
- return MaxVF;
+ return computeFeasibleMaxVF(TC, UserVF);
  }
  return None;
  }
@@ -5563,6 +5561,7 @@ LoopVectorizationCostModel::computeMaxVF(ElementCount UserVF, unsigned UserIC) {
  InterleaveInfo.invalidateGroupsRequiringScalarEpilogue();
  }
 
+ ElementCount MaxVF = computeFeasibleMaxVF(TC, UserVF);
  assert(!MaxVF.isScalable() &&
  "Scalable vectors do not yet support tail folding");
  assert((UserVF.isNonZero() || isPowerOf2_32(MaxVF.getFixedValue())) &&
 
@@ -0,0 +1,29 @@
+; RUN: opt -march=hexagon -hexagon-autohvx -loop-vectorize -S < %s 2>&1 | FileCheck %s
+
+; Check that running the loop vectorizer on @f doesn't crash and that a vector.body block is emitted.
+
+; CHECK-LABEL: @f
+; CHECK: vector.body
+
+target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
+target triple = "hexagon"
+
+; Function Attrs: optsize -- @f is a single-block loop that returns its accumulated value.
+define i32 @f() #0 {
+entry:
+ br label %loop
+
+loop:
+ %g.016 = phi i32 [ 0, %entry ], [ %g.1.lcssa, %loop ] ; accumulator: 0 on entry, then the previous iteration's sum
+ %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ] ; loop counter: starts at 0, stepped by 1 below
+ %0 = load i8, i8* undef, align 1 ; loaded value is not used anywhere in this function
+ %g.1.lcssa = add i32 %g.016, undef ; adds an undef operand to the accumulator
+ %iv.next = add nsw i32 %iv, 1
+ %exitcond = icmp eq i32 %iv.next, 0 ; exit only when the incremented counter equals 0
+ br i1 %exitcond, label %exit, label %loop
+
+exit:
+ ret i32 %g.1.lcssa ; return the final accumulator value
+}
+
+attributes #0 = { optsize "target-features"="+hvx-length128b" }