Skip to content

Commit 9ba738a

Browse files
authored
[VPlan] Fix assert in store-user in narrowToSingleScalars (llvm#167686)
Follow up on c2d4c7c ([VPlan] Permit more users in narrowToSingleScalars) to fix an assert related to WidenStore users of the recipe being narrowed in narrowToSingleScalars.
1 parent d3a813b commit 9ba738a

File tree

2 files changed

+58
-5
lines changed

2 files changed

+58
-5
lines changed

llvm/lib/Transforms/Vectorize/VPlanTransforms.cpp

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1431,11 +1431,11 @@ static void narrowToSingleScalarRecipes(VPlan &Plan) {
14311431
!all_of(RepOrWidenR->users(), [RepOrWidenR](const VPUser *U) {
14321432
if (auto *Store = dyn_cast<VPWidenStoreRecipe>(U)) {
14331433
// VPWidenStore doesn't have users, and stores are always
1434-
// profitable to widen: hence, permitting single-scalar stored
1435-
// values is an important leaf condition. The assert must hold as
1436-
// we checked the RepOrWidenR operand against
1437-
// vputils::isSingleScalar.
1438-
assert(RepOrWidenR == Store->getAddr() ||
1434+
// profitable to widen: hence, permitting address and mask
1435+
// operands, and single-scalar stored values is an important leaf
1436+
// condition. The assert must hold as we checked the RepOrWidenR
1437+
// operand against vputils::isSingleScalar.
1438+
assert(RepOrWidenR != Store->getStoredValue() ||
14391439
vputils::isSingleScalar(Store->getStoredValue()));
14401440
return true;
14411441
}
Lines changed: 53 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
2+
; RUN: opt -p loop-vectorize -mcpu=skylake -S %s | FileCheck %s
3+
4+
target triple = "x86_64-unknown-linux-gnu"
5+
6+
@p = external global [3952 x i8], align 8
7+
@q = external global [3952 x i8], align 8
8+
9+
define void @narrow_store_user_mask_operand(i32 %x) {
10+
; CHECK-LABEL: define void @narrow_store_user_mask_operand(
11+
; CHECK-SAME: i32 [[X:%.*]]) #[[ATTR0:[0-9]+]] {
12+
; CHECK-NEXT: [[ENTRY:.*]]:
13+
; CHECK-NEXT: br label %[[LOOP_PH:.*]]
14+
; CHECK: [[LOOP_PH]]:
15+
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP_TAIL:.*]] ]
16+
; CHECK-NEXT: [[X_POS:%.*]] = icmp sgt i32 [[X]], 0
17+
; CHECK-NEXT: br i1 [[X_POS]], label %[[LOOP_BODY:.*]], label %[[LOOP_TAIL]]
18+
; CHECK: [[LOOP_BODY]]:
19+
; CHECK-NEXT: [[LD_P:%.*]] = load double, ptr @p, align 8
20+
; CHECK-NEXT: [[GEP_Q_IV:%.*]] = getelementptr double, ptr @q, i64 [[IV]]
21+
; CHECK-NEXT: [[GEP_Q_IV_8:%.*]] = getelementptr i8, ptr [[GEP_Q_IV]], i64 -8
22+
; CHECK-NEXT: store double [[LD_P]], ptr [[GEP_Q_IV_8]], align 8
23+
; CHECK-NEXT: br label %[[LOOP_TAIL]]
24+
; CHECK: [[LOOP_TAIL]]:
25+
; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], 1
26+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV]], 1
27+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT:.*]], label %[[LOOP_PH]]
28+
; CHECK: [[EXIT]]:
29+
; CHECK-NEXT: ret void
30+
;
31+
entry:
32+
br label %loop.ph
33+
34+
loop.ph:
35+
%iv = phi i64 [ 0, %entry ], [ %iv.next, %loop.tail ]
36+
%x.pos = icmp sgt i32 %x, 0
37+
br i1 %x.pos, label %loop.body, label %loop.tail
38+
39+
loop.body:
40+
%ld.p = load double, ptr @p
41+
%gep.q.iv = getelementptr double, ptr @q, i64 %iv
42+
%gep.q.iv.8 = getelementptr i8, ptr %gep.q.iv, i64 -8
43+
store double %ld.p, ptr %gep.q.iv.8
44+
br label %loop.tail
45+
46+
loop.tail:
47+
%iv.next = add i64 %iv, 1
48+
%ec = icmp eq i64 %iv, 1
49+
br i1 %ec, label %exit, label %loop.ph
50+
51+
exit:
52+
ret void
53+
}

0 commit comments

Comments
 (0)