Skip to content

Commit 6a0e5b2

Browse files
committed
[IndVars] Add test for missed optimizations depending on guard order.
The added tests show optimizations that are missed or applied depending on the order of the loop guard conditions.
1 parent 0820266 commit 6a0e5b2

File tree

1 file changed

+201
-0
lines changed

1 file changed

+201
-0
lines changed

llvm/test/Transforms/IndVarSimplify/loop-guard-order.ll

Lines changed: 201 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
22
; RUN: opt -p indvars -S %s | FileCheck %s
33

4+
target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-f80:128-n8:16:32:64-S128"
5+
46
declare void @foo()
57

68
define void @narrow_iv_precondition_order_1(ptr %start, i32 %base, i8 %n) {
@@ -96,3 +98,202 @@ loop:
9698
exit:
9799
ret void
98100
}
101+
102+
; Guard order 1 for the urem case: the loop is entered only after checking
; first that %n is a multiple of 3 (%n urem 3 == 0) and then that %n is
; non-zero. The loop counts %iv up from 0 in steps of 3 and exits once
; %iv.next equals %n. The function returns 1, 2 or 3 depending on which block
; branched to %exit (the entry guard, the ph guard, or the loop).
; With this guard order the expected output keeps a plain `add` for the IV
; increment; @urem_order2 checks the same two guards in the opposite order and
; expects `add nuw` there.
define i32 @urem_order1(i32 %n) {
103+
; CHECK-LABEL: define i32 @urem_order1(
104+
; CHECK-SAME: i32 [[N:%.*]]) {
105+
; CHECK-NEXT: [[ENTRY:.*]]:
106+
; CHECK-NEXT: [[UREM:%.*]] = urem i32 [[N]], 3
107+
; CHECK-NEXT: [[UREM_ZERO:%.*]] = icmp eq i32 [[UREM]], 0
108+
; CHECK-NEXT: br i1 [[UREM_ZERO]], label %[[PH:.*]], label %[[EXIT:.*]]
109+
; CHECK: [[PH]]:
110+
; CHECK-NEXT: [[N_NON_ZERO:%.*]] = icmp ne i32 [[N]], 0
111+
; CHECK-NEXT: br i1 [[N_NON_ZERO]], label %[[LOOP_PREHEADER:.*]], label %[[EXIT]]
112+
; CHECK: [[LOOP_PREHEADER]]:
113+
; CHECK-NEXT: br label %[[LOOP:.*]]
114+
; CHECK: [[LOOP]]:
115+
; CHECK-NEXT: [[IV:%.*]] = phi i32 [ [[IV_NEXT:%.*]], %[[LOOP]] ], [ 0, %[[LOOP_PREHEADER]] ]
116+
; CHECK-NEXT: call void @foo()
117+
; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 3
118+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], [[N]]
119+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT_LOOPEXIT:.*]], label %[[LOOP]]
120+
; CHECK: [[EXIT_LOOPEXIT]]:
121+
; CHECK-NEXT: br label %[[EXIT]]
122+
; CHECK: [[EXIT]]:
123+
; CHECK-NEXT: [[RES:%.*]] = phi i32 [ 1, %[[ENTRY]] ], [ 2, %[[PH]] ], [ 3, %[[EXIT_LOOPEXIT]] ]
124+
; CHECK-NEXT: ret i32 [[RES]]
125+
;
126+
entry:
127+
; First guard: go to %exit unless %n is divisible by 3.
%urem = urem i32 %n, 3
128+
%urem.zero = icmp eq i32 %urem, 0
129+
br i1 %urem.zero, label %ph, label %exit
130+
131+
ph:
132+
; Second guard: go to %exit when %n is 0.
%n.non.zero = icmp ne i32 %n, 0
133+
br i1 %n.non.zero, label %loop, label %exit
134+
135+
loop:
136+
%iv = phi i32 [ 0, %ph ], [ %iv.next, %loop ]
137+
call void @foo()
138+
%iv.next = add i32 %iv, 3
139+
; Leave the loop once the incremented IV is exactly equal to %n.
%ec = icmp eq i32 %iv.next, %n
140+
br i1 %ec, label %exit, label %loop
141+
142+
exit:
143+
; The result identifies which predecessor reached %exit.
%res = phi i32 [ 1, %entry ], [ 2, %ph ], [ 3, %loop ]
144+
ret i32 %res
145+
}
146+
147+
; Guard order 2 for the urem case: the loop is entered only after checking
; first that %n is non-zero and then that %n is a multiple of 3
; (%n urem 3 == 0). The loop counts %iv up from 0 in steps of 3 and exits once
; %iv.next equals %n. The function returns 1, 2 or 3 depending on which block
; branched to %exit (the entry guard, the ph guard, or the loop).
; With this guard order the expected output has `add nuw` on the IV increment;
; @urem_order1 checks the same two guards in the opposite order and expects a
; plain `add` there.
define i32 @urem_order2(i32 %n) {
148+
; CHECK-LABEL: define i32 @urem_order2(
149+
; CHECK-SAME: i32 [[N:%.*]]) {
150+
; CHECK-NEXT: [[ENTRY:.*]]:
151+
; CHECK-NEXT: [[N_NON_ZERO:%.*]] = icmp ne i32 [[N]], 0
152+
; CHECK-NEXT: br i1 [[N_NON_ZERO]], label %[[PH:.*]], label %[[EXIT:.*]]
153+
; CHECK: [[PH]]:
154+
; CHECK-NEXT: [[UREM:%.*]] = urem i32 [[N]], 3
155+
; CHECK-NEXT: [[UREM_ZERO:%.*]] = icmp eq i32 [[UREM]], 0
156+
; CHECK-NEXT: br i1 [[UREM_ZERO]], label %[[LOOP_PREHEADER:.*]], label %[[EXIT]]
157+
; CHECK: [[LOOP_PREHEADER]]:
158+
; CHECK-NEXT: br label %[[LOOP:.*]]
159+
; CHECK: [[LOOP]]:
160+
; CHECK-NEXT: [[IV:%.*]] = phi i32 [ [[IV_NEXT:%.*]], %[[LOOP]] ], [ 0, %[[LOOP_PREHEADER]] ]
161+
; CHECK-NEXT: call void @foo()
162+
; CHECK-NEXT: [[IV_NEXT]] = add nuw i32 [[IV]], 3
163+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], [[N]]
164+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT_LOOPEXIT:.*]], label %[[LOOP]]
165+
; CHECK: [[EXIT_LOOPEXIT]]:
166+
; CHECK-NEXT: br label %[[EXIT]]
167+
; CHECK: [[EXIT]]:
168+
; CHECK-NEXT: [[RES:%.*]] = phi i32 [ 1, %[[ENTRY]] ], [ 2, %[[PH]] ], [ 3, %[[EXIT_LOOPEXIT]] ]
169+
; CHECK-NEXT: ret i32 [[RES]]
170+
;
171+
entry:
172+
; First guard: go to %exit when %n is 0.
%n.non.zero = icmp ne i32 %n, 0
173+
br i1 %n.non.zero, label %ph, label %exit
174+
175+
ph:
176+
; Second guard: go to %exit unless %n is divisible by 3.
%urem = urem i32 %n, 3
177+
%urem.zero = icmp eq i32 %urem, 0
178+
br i1 %urem.zero, label %loop, label %exit
179+
180+
loop:
181+
%iv = phi i32 [ 0, %ph ], [ %iv.next, %loop ]
182+
call void @foo()
183+
%iv.next = add i32 %iv, 3
184+
; Leave the loop once the incremented IV is exactly equal to %n.
%ec = icmp eq i32 %iv.next, %n
185+
br i1 %ec, label %exit, label %loop
186+
187+
exit:
188+
; The result identifies which predecessor reached %exit.
%res = phi i32 [ 1, %entry ], [ 2, %ph ], [ 3, %loop ]
189+
ret i32 %res
190+
}
191+
192+
; Guard order 1 for the shift-derived loop bound. The guards run as
;   1. %n != 0,
;   2. (%n + 63) is not unsigned-less-than 64,
;   3. bit 0 of %n is clear,
; before a loop that increments %iv by 1 from 0 and keeps going while
; %iv_next u< %upper_bound, where %upper_bound = (%n + 63) lshr 6.
; The function always returns 0.
; With this order the expected output computes umax(%upper_bound, 1) in the
; preheader and compares the IV against that; @test_loop_with_div_order_2
; swaps the first two guards and expects the exit compare to use %upper_bound
; directly.
define i64 @test_loop_with_div_order_1(i64 %n) {
193+
; CHECK-LABEL: define i64 @test_loop_with_div_order_1(
194+
; CHECK-SAME: i64 [[N:%.*]]) {
195+
; CHECK-NEXT: [[ENTRY:.*:]]
196+
; CHECK-NEXT: [[IS_ZERO:%.*]] = icmp eq i64 [[N]], 0
197+
; CHECK-NEXT: br i1 [[IS_ZERO]], label %[[EXIT:.*]], label %[[CHECK_BOUNDS:.*]]
198+
; CHECK: [[CHECK_BOUNDS]]:
199+
; CHECK-NEXT: [[N_PLUS_63:%.*]] = add i64 [[N]], 63
200+
; CHECK-NEXT: [[UPPER_BOUND:%.*]] = lshr i64 [[N_PLUS_63]], 6
201+
; CHECK-NEXT: [[BOUNDS_CHECK:%.*]] = icmp ult i64 [[N_PLUS_63]], 64
202+
; CHECK-NEXT: br i1 [[BOUNDS_CHECK]], label %[[EXIT]], label %[[CHECK_PARITY:.*]]
203+
; CHECK: [[CHECK_PARITY]]:
204+
; CHECK-NEXT: [[IS_ODD:%.*]] = and i64 [[N]], 1
205+
; CHECK-NEXT: [[PARITY_CHECK:%.*]] = icmp eq i64 [[IS_ODD]], 0
206+
; CHECK-NEXT: br i1 [[PARITY_CHECK]], label %[[LOOP_PREHEADER:.*]], label %[[EXIT]]
207+
; CHECK: [[LOOP_PREHEADER]]:
208+
; CHECK-NEXT: [[UMAX:%.*]] = call i64 @llvm.umax.i64(i64 [[UPPER_BOUND]], i64 1)
209+
; CHECK-NEXT: br label %[[LOOP:.*]]
210+
; CHECK: [[LOOP]]:
211+
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[IV_NEXT:%.*]], %[[LOOP]] ], [ 0, %[[LOOP_PREHEADER]] ]
212+
; CHECK-NEXT: [[DUMMY:%.*]] = load volatile i64, ptr null, align 8
213+
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
214+
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i64 [[IV_NEXT]], [[UMAX]]
215+
; CHECK-NEXT: br i1 [[EXITCOND]], label %[[LOOP]], label %[[EXIT_LOOPEXIT:.*]]
216+
; CHECK: [[EXIT_LOOPEXIT]]:
217+
; CHECK-NEXT: br label %[[EXIT]]
218+
; CHECK: [[EXIT]]:
219+
; CHECK-NEXT: ret i64 0
220+
;
221+
entry:
222+
; Guard 1: go to %exit when %n is 0.
%is_zero = icmp eq i64 %n, 0
223+
br i1 %is_zero, label %exit, label %check_bounds
224+
225+
check_bounds:
226+
; %upper_bound = (%n + 63) lshr 6; it is the loop limit used in %loop.
%n_plus_63 = add i64 %n, 63
227+
%upper_bound = lshr i64 %n_plus_63, 6
228+
; Guard 2: go to %exit when %n + 63 is unsigned-less-than 64.
%bounds_check = icmp ult i64 %n_plus_63, 64
229+
br i1 %bounds_check, label %exit, label %check_parity
230+
231+
check_parity:
232+
; Guard 3: enter the loop only when the low bit of %n is clear.
%is_odd = and i64 %n, 1
233+
%parity_check = icmp eq i64 %is_odd, 0
234+
br i1 %parity_check, label %loop, label %exit
235+
236+
loop:
237+
%iv = phi i64 [ %iv_next, %loop ], [ 0, %check_parity ]
238+
; Volatile load from null; %dummy has no other use in this function.
%dummy = load volatile i64, ptr null, align 8
239+
%iv_next = add i64 %iv, 1
240+
; Keep looping while the incremented IV is unsigned-below %upper_bound.
%exit_cond = icmp ult i64 %iv_next, %upper_bound
241+
br i1 %exit_cond, label %loop, label %exit
242+
243+
exit:
244+
ret i64 0
245+
}
246+
247+
; Guard order 2 for the shift-derived loop bound. The guards run as
;   1. (%n + 63) is not unsigned-less-than 64,
;   2. %n != 0,
;   3. bit 0 of %n is clear,
; before a loop that increments %iv by 1 from 0 and keeps going while
; %iv_next u< %upper_bound, where %upper_bound = (%n + 63) lshr 6.
; The function always returns 0.
; With this order the expected output compares the IV against %upper_bound
; directly; @test_loop_with_div_order_1 swaps the first two guards and expects
; a umax(%upper_bound, 1) clamp in the preheader instead.
define i64 @test_loop_with_div_order_2(i64 %n) {
248+
; CHECK-LABEL: define i64 @test_loop_with_div_order_2(
249+
; CHECK-SAME: i64 [[N:%.*]]) {
250+
; CHECK-NEXT: [[ENTRY:.*:]]
251+
; CHECK-NEXT: [[N_PLUS_63:%.*]] = add i64 [[N]], 63
252+
; CHECK-NEXT: [[UPPER_BOUND:%.*]] = lshr i64 [[N_PLUS_63]], 6
253+
; CHECK-NEXT: [[BOUNDS_CHECK:%.*]] = icmp ult i64 [[N_PLUS_63]], 64
254+
; CHECK-NEXT: br i1 [[BOUNDS_CHECK]], label %[[EXIT:.*]], label %[[CHECK_BOUNDS:.*]]
255+
; CHECK: [[CHECK_BOUNDS]]:
256+
; CHECK-NEXT: [[IS_ZERO:%.*]] = icmp eq i64 [[N]], 0
257+
; CHECK-NEXT: br i1 [[IS_ZERO]], label %[[EXIT]], label %[[CHECK_PARITY:.*]]
258+
; CHECK: [[CHECK_PARITY]]:
259+
; CHECK-NEXT: [[IS_ODD:%.*]] = and i64 [[N]], 1
260+
; CHECK-NEXT: [[PARITY_CHECK:%.*]] = icmp eq i64 [[IS_ODD]], 0
261+
; CHECK-NEXT: br i1 [[PARITY_CHECK]], label %[[LOOP_PREHEADER:.*]], label %[[EXIT]]
262+
; CHECK: [[LOOP_PREHEADER]]:
263+
; CHECK-NEXT: br label %[[LOOP:.*]]
264+
; CHECK: [[LOOP]]:
265+
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[IV_NEXT:%.*]], %[[LOOP]] ], [ 0, %[[LOOP_PREHEADER]] ]
266+
; CHECK-NEXT: [[DUMMY:%.*]] = load volatile i64, ptr null, align 8
267+
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
268+
; CHECK-NEXT: [[EXITCOND:%.*]] = icmp ne i64 [[IV_NEXT]], [[UPPER_BOUND]]
269+
; CHECK-NEXT: br i1 [[EXITCOND]], label %[[LOOP]], label %[[EXIT_LOOPEXIT:.*]]
270+
; CHECK: [[EXIT_LOOPEXIT]]:
271+
; CHECK-NEXT: br label %[[EXIT]]
272+
; CHECK: [[EXIT]]:
273+
; CHECK-NEXT: ret i64 0
274+
;
275+
entry:
276+
; %upper_bound = (%n + 63) lshr 6; it is the loop limit used in %loop.
%n_plus_63 = add i64 %n, 63
277+
%upper_bound = lshr i64 %n_plus_63, 6
278+
; Guard 1: go to %exit when %n + 63 is unsigned-less-than 64.
%bounds_check = icmp ult i64 %n_plus_63, 64
279+
br i1 %bounds_check, label %exit, label %check_bounds
280+
281+
check_bounds:
282+
; Guard 2: go to %exit when %n is 0. Despite the block's name, this variant
; performs the zero check here; the bounds check is in %entry.
%is_zero = icmp eq i64 %n, 0
283+
br i1 %is_zero, label %exit, label %check_parity
284+
285+
check_parity:
286+
; Guard 3: enter the loop only when the low bit of %n is clear.
%is_odd = and i64 %n, 1
287+
%parity_check = icmp eq i64 %is_odd, 0
288+
br i1 %parity_check, label %loop, label %exit
289+
290+
loop:
291+
%iv = phi i64 [ %iv_next, %loop ], [ 0, %check_parity ]
292+
; Volatile load from null; %dummy has no other use in this function.
%dummy = load volatile i64, ptr null, align 8
293+
%iv_next = add i64 %iv, 1
294+
; Keep looping while the incremented IV is unsigned-below %upper_bound.
%exit_cond = icmp ult i64 %iv_next, %upper_bound
295+
br i1 %exit_cond, label %loop, label %exit
296+
297+
exit:
298+
ret i64 0
299+
}

0 commit comments

Comments
 (0)