Skip to content

Commit be37f13

Browse files
committed
[SLP]Add an extra test for vectorization of non-pow-2 trees, NFC.
1 parent 68922f7 commit be37f13

File tree

1 file changed

+94
-0
lines changed

1 file changed

+94
-0
lines changed
Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2+
; RUN: opt -slp-vectorizer -S -o - -mtriple=x86_64-unknown-linux -mcpu=haswell < %s | FileCheck %s
3+
@e = dso_local local_unnamed_addr global i32 0, align 4
4+
@f = dso_local local_unnamed_addr global i32 0, align 4
5+
6+
; Function Attrs: nofree norecurse nounwind uwtable
7+
define dso_local i32 @g() local_unnamed_addr {
8+
; CHECK-LABEL: @g(
9+
; CHECK-NEXT: entry:
10+
; CHECK-NEXT: [[TMP0:%.*]] = load i32, i32* @e, align 4
11+
; CHECK-NEXT: [[TOBOOL_NOT19:%.*]] = icmp eq i32 [[TMP0]], 0
12+
; CHECK-NEXT: br i1 [[TOBOOL_NOT19]], label [[WHILE_END:%.*]], label [[WHILE_BODY:%.*]]
13+
; CHECK: while.body:
14+
; CHECK-NEXT: [[C_022:%.*]] = phi i32* [ [[C_022_BE:%.*]], [[WHILE_BODY_BACKEDGE:%.*]] ], [ undef, [[ENTRY:%.*]] ]
15+
; CHECK-NEXT: [[TMP1:%.*]] = phi <2 x i32*> [ [[TMP14:%.*]], [[WHILE_BODY_BACKEDGE]] ], [ undef, [[ENTRY]] ]
16+
; CHECK-NEXT: [[INCDEC_PTR:%.*]] = getelementptr inbounds i32, i32* [[C_022]], i64 1
17+
; CHECK-NEXT: [[TMP2:%.*]] = ptrtoint i32* [[C_022]] to i64
18+
; CHECK-NEXT: [[TMP3:%.*]] = trunc i64 [[TMP2]] to i32
19+
; CHECK-NEXT: [[TMP4:%.*]] = getelementptr i32, <2 x i32*> [[TMP1]], <2 x i64> <i64 1, i64 1>
20+
; CHECK-NEXT: switch i32 [[TMP3]], label [[WHILE_BODY_BACKEDGE]] [
21+
; CHECK-NEXT: i32 2, label [[SW_BB:%.*]]
22+
; CHECK-NEXT: i32 4, label [[SW_BB6:%.*]]
23+
; CHECK-NEXT: ]
24+
; CHECK: sw.bb:
25+
; CHECK-NEXT: [[TMP5:%.*]] = extractelement <2 x i32*> [[TMP4]], i32 0
26+
; CHECK-NEXT: [[TMP6:%.*]] = ptrtoint i32* [[TMP5]] to i64
27+
; CHECK-NEXT: [[TMP7:%.*]] = trunc i64 [[TMP6]] to i32
28+
; CHECK-NEXT: [[TMP8:%.*]] = getelementptr i32, <2 x i32*> [[TMP1]], <2 x i64> <i64 2, i64 2>
29+
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x i32*> [[TMP4]], i32 1
30+
; CHECK-NEXT: store i32 [[TMP7]], i32* [[TMP9]], align 4
31+
; CHECK-NEXT: [[INCDEC_PTR5:%.*]] = getelementptr inbounds i32, i32* [[C_022]], i64 2
32+
; CHECK-NEXT: br label [[WHILE_BODY_BACKEDGE]]
33+
; CHECK: sw.bb6:
34+
; CHECK-NEXT: [[INCDEC_PTR8:%.*]] = getelementptr inbounds i32, i32* [[C_022]], i64 2
35+
; CHECK-NEXT: [[TMP10:%.*]] = ptrtoint i32* [[INCDEC_PTR]] to i64
36+
; CHECK-NEXT: [[TMP11:%.*]] = trunc i64 [[TMP10]] to i32
37+
; CHECK-NEXT: [[TMP12:%.*]] = getelementptr i32, <2 x i32*> [[TMP1]], <2 x i64> <i64 2, i64 2>
38+
; CHECK-NEXT: [[TMP13:%.*]] = extractelement <2 x i32*> [[TMP4]], i32 0
39+
; CHECK-NEXT: store i32 [[TMP11]], i32* [[TMP13]], align 4
40+
; CHECK-NEXT: br label [[WHILE_BODY_BACKEDGE]]
41+
; CHECK: while.body.backedge:
42+
; CHECK-NEXT: [[C_022_BE]] = phi i32* [ [[INCDEC_PTR]], [[WHILE_BODY]] ], [ [[INCDEC_PTR8]], [[SW_BB6]] ], [ [[INCDEC_PTR5]], [[SW_BB]] ]
43+
; CHECK-NEXT: [[TMP14]] = phi <2 x i32*> [ [[TMP4]], [[WHILE_BODY]] ], [ [[TMP12]], [[SW_BB6]] ], [ [[TMP8]], [[SW_BB]] ]
44+
; CHECK-NEXT: br label [[WHILE_BODY]]
45+
; CHECK: while.end:
46+
; CHECK-NEXT: ret i32 undef
47+
;
48+
entry:
49+
%0 = load i32, i32* @e, align 4
50+
%tobool.not19 = icmp eq i32 %0, 0
51+
br i1 %tobool.not19, label %while.end, label %while.body
52+
53+
while.body: ; preds = %entry, %while.body.backedge
54+
%c.022 = phi i32* [ %c.022.be, %while.body.backedge ], [ undef, %entry ]
55+
%b.021 = phi i32* [ %b.021.be, %while.body.backedge ], [ undef, %entry ]
56+
%a.020 = phi i32* [ %a.020.be, %while.body.backedge ], [ undef, %entry ]
57+
%incdec.ptr = getelementptr inbounds i32, i32* %c.022, i64 1
58+
%1 = ptrtoint i32* %c.022 to i64
59+
%2 = trunc i64 %1 to i32
60+
%incdec.ptr1 = getelementptr inbounds i32, i32* %a.020, i64 1
61+
%incdec.ptr2 = getelementptr inbounds i32, i32* %b.021, i64 1
62+
switch i32 %2, label %while.body.backedge [
63+
i32 2, label %sw.bb
64+
i32 4, label %sw.bb6
65+
]
66+
67+
sw.bb: ; preds = %while.body
68+
%incdec.ptr3 = getelementptr inbounds i32, i32* %b.021, i64 2
69+
%3 = ptrtoint i32* %incdec.ptr2 to i64
70+
%4 = trunc i64 %3 to i32
71+
%incdec.ptr4 = getelementptr inbounds i32, i32* %a.020, i64 2
72+
store i32 %4, i32* %incdec.ptr1, align 4
73+
%incdec.ptr5 = getelementptr inbounds i32, i32* %c.022, i64 2
74+
br label %while.body.backedge
75+
76+
sw.bb6: ; preds = %while.body
77+
%incdec.ptr7 = getelementptr inbounds i32, i32* %a.020, i64 2
78+
%incdec.ptr8 = getelementptr inbounds i32, i32* %c.022, i64 2
79+
%5 = ptrtoint i32* %incdec.ptr to i64
80+
%6 = trunc i64 %5 to i32
81+
%incdec.ptr9 = getelementptr inbounds i32, i32* %b.021, i64 2
82+
store i32 %6, i32* %incdec.ptr2, align 4
83+
br label %while.body.backedge
84+
85+
while.body.backedge: ; preds = %sw.bb6, %while.body, %sw.bb
86+
%c.022.be = phi i32* [ %incdec.ptr, %while.body ], [ %incdec.ptr8, %sw.bb6 ], [ %incdec.ptr5, %sw.bb ]
87+
%b.021.be = phi i32* [ %incdec.ptr2, %while.body ], [ %incdec.ptr9, %sw.bb6 ], [ %incdec.ptr3, %sw.bb ]
88+
%a.020.be = phi i32* [ %incdec.ptr1, %while.body ], [ %incdec.ptr7, %sw.bb6 ], [ %incdec.ptr4, %sw.bb ]
89+
br label %while.body
90+
91+
while.end: ; preds = %entry
92+
ret i32 undef
93+
}
94+

0 commit comments

Comments
 (0)