1; RUN: opt < %s -indvars -S | FileCheck %s
2target triple = "aarch64--linux-gnu"
3
4; Provide legal integer types.
5target datalayout = "n8:16:32:64"
6
7
8; Check that the loop-exit i32 compare instruction and its operands are widened
9; to i64, rather than the IV being truncated before its use in the i32 compare.
10
; Globals used by @test1: @idx receives the result index, @e is loaded as the
; loop bound, and @ptr holds the base pointer of the i32 array that is scanned.
11@idx = common global i32 0, align 4
12@e = common global i32 0, align 4
13@ptr = common global i32* null, align 8
14
15; CHECK-LABEL: @test1
16; CHECK: for.body.lr.ph:
17; CHECK: sext i32
18; CHECK: for.cond:
19; CHECK: icmp slt i64
20; CHECK: for.body:
21; CHECK: phi i64
22
; @test1: search loop over the i32 array pointed to by @ptr.
; Stores -1 to @idx up front, then walks i = 0, 1, ... and stores i to @idx
; when ptr[i] == 0 is found. Returns the final value loaded from @idx.
; The i32 IV %i.05 is used both as a sign-extended GEP index and in the
; signed i32 exit compare against the value loaded from @e.
23define i32 @test1() {
24entry:
25  store i32 -1, i32* @idx, align 4
26  %0 = load i32, i32* @e, align 4
27  %cmp4 = icmp slt i32 %0, 0
; Skip the loop entirely when the value loaded from @e is negative.
28  br i1 %cmp4, label %for.end.loopexit, label %for.body.lr.ph
29
30for.body.lr.ph:
; Loop preheader: load the array base and reload @e as the loop bound (%2).
31  %1 = load i32*, i32** @ptr, align 8
32  %2 = load i32, i32* @e, align 4
33  br label %for.body
34
35for.cond:
36  %inc = add nsw i32 %i.05, 1
; Note: the exit test compares the current IV value %i.05 (not %inc) with %2.
37  %cmp = icmp slt i32 %i.05, %2
38  br i1 %cmp, label %for.body, label %for.cond.for.end.loopexit_crit_edge
39
40for.body:
41  %i.05 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.cond ]
; Sign-extended use of the IV as an array index.
42  %idxprom = sext i32 %i.05 to i64
43  %arrayidx = getelementptr inbounds i32, i32* %1, i64 %idxprom
44  %3 = load i32, i32* %arrayidx, align 4
45  %tobool = icmp eq i32 %3, 0
; A zero element leaves the loop through if.then; otherwise continue in for.cond.
46  br i1 %tobool, label %if.then, label %for.cond
47
48if.then:
; Single-entry phi carrying the IV value out of the loop.
49  %i.05.lcssa = phi i32 [ %i.05, %for.body ]
50  store i32 %i.05.lcssa, i32* @idx, align 4
51  br label %for.end
52
53for.cond.for.end.loopexit_crit_edge:
54  br label %for.end.loopexit
55
56for.end.loopexit:
57  br label %for.end
58
59for.end:
60  %4 = load i32, i32* @idx, align 4
61  ret i32 %4
62}
63
64; CHECK-LABEL: @test2
65; CHECK: for.body4.us
66; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
67; CHECK: %cmp2.us = icmp slt i64
68; CHECK-NOT: %2 = trunc i64 %indvars.iv.next to i32
69; CHECK-NOT: %cmp2.us = icmp slt i32
70
; @test2: two-level loop nest over %a, an array of [8 x i8] rows.
; The ".us" blocks form a nest whose outer IV %storemerge5.us runs while the
; incremented value is < 4 and whose inner IV %storemerge14.us runs while the
; incremented value is < zext(%limit). The inner body performs
;   a[outer][inner] = b[a[outer][inner]].
; The blocks without the ".us" suffix form a second outer loop with no inner
; body. Which of the two is entered depends on an undef branch condition.
71define void @test2([8 x i8]* %a, i8* %b, i8 %limit) {
72entry:
; Inner-loop bound: %limit zero-extended to i32.
73  %conv = zext i8 %limit to i32
74  br i1 undef, label %for.cond1.preheader, label %for.cond1.preheader.us
75
76for.cond1.preheader.us:
77  %storemerge5.us = phi i32 [ 0, %entry ], [ %inc14.us, %for.inc13.us ]
; Constant-true condition: the inner-loop preheader is always taken.
78  br i1 true, label %for.body4.lr.ph.us, label %for.inc13.us
79
80for.inc13.us:
; Outer-loop latch.
81  %inc14.us = add nsw i32 %storemerge5.us, 1
82  %cmp.us = icmp slt i32 %inc14.us, 4
83  br i1 %cmp.us, label %for.cond1.preheader.us, label %for.end
84
85for.body4.us:
86  %storemerge14.us = phi i32 [ 0, %for.body4.lr.ph.us ], [ %inc.us, %for.body4.us ]
; Sign-extended use of the inner IV as the column index.
87  %idxprom.us = sext i32 %storemerge14.us to i64
88  %arrayidx6.us = getelementptr inbounds [8 x i8], [8 x i8]* %a, i64 %idxprom5.us, i64 %idxprom.us
89  %0 = load i8, i8* %arrayidx6.us, align 1
; The loaded byte, zero-extended, indexes into %b.
90  %idxprom7.us = zext i8 %0 to i64
91  %arrayidx8.us = getelementptr inbounds i8, i8* %b, i64 %idxprom7.us
92  %1 = load i8, i8* %arrayidx8.us, align 1
93  store i8 %1, i8* %arrayidx6.us, align 1
94  %inc.us = add nsw i32 %storemerge14.us, 1
; Inner-loop exit test: signed i32 compare of the incremented IV with %conv.
95  %cmp2.us = icmp slt i32 %inc.us, %conv
96  br i1 %cmp2.us, label %for.body4.us, label %for.inc13.us
97
98for.body4.lr.ph.us:
; Inner-loop preheader: sign-extend the outer IV once for use as the row index.
99  %idxprom5.us = sext i32 %storemerge5.us to i64
100  br label %for.body4.us
101
102for.cond1.preheader:
103  %storemerge5 = phi i32 [ 0, %entry ], [ %inc14, %for.inc13 ]
; Both successors are the latch, so this variant has no inner-loop body.
104  br i1 false, label %for.inc13, label %for.inc13
105
106for.inc13:
107  %inc14 = add nsw i32 %storemerge5, 1
108  %cmp = icmp slt i32 %inc14, 4
109  br i1 %cmp, label %for.cond1.preheader, label %for.end
110
111for.end:
112  ret void
113}
114
115; CHECK-LABEL: @test3
116; CHECK: sext i32 %b
117; CHECK: for.cond:
118; CHECK: phi i64
119; CHECK: icmp slt i64
120
; @test3: returns the i32 sum of a[i] for i = 0, 1, ... while i < %b (signed).
; The i32 IV %i.0 is used in a signed compare against the loop-invariant %b
; and as a sign-extended GEP index.
121define i32 @test3(i32* %a, i32 %b) {
122entry:
123  br label %for.cond
124
125for.cond:
; Loop header: running sum and IV, followed by the signed exit test.
126  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
127  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
128  %cmp = icmp slt i32 %i.0, %b
129  br i1 %cmp, label %for.body, label %for.end
130
131for.body:
; Sign-extended use of the IV as an array index.
132  %idxprom = sext i32 %i.0 to i64
133  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
134  %0 = load i32, i32* %arrayidx, align 4
135  %add = add nsw i32 %sum.0, %0
136  %inc = add nsw i32 %i.0, 1
137  br label %for.cond
138
139for.end:
140  ret i32 %sum.0
141}
142
; External function called from the loop body of @test4; it takes a
; sign-extended i8 argument.
143declare i32 @fn1(i8 signext)
144
145; PR21030
146; CHECK-LABEL: @test4
147; CHECK: for.body:
148; CHECK: phi i32
149; CHECK: icmp sgt i8
150
; @test4: loop with an i8 IV %c.07 that starts at -3 and is decremented by 1
; each iteration, running while the decremented value is > -14 (signed i8).
; Each iteration zero-extends the IV to i32, ORs it with %a, truncates the
; result back to i8 and passes it to @fn1. Always returns 0.
151define i32 @test4(i32 %a) {
152entry:
153  br label %for.body
154
155for.body:
156  %c.07 = phi i8 [ -3, %entry ], [ %dec, %for.body ]
; Zero-extended use of the i8 IV.
157  %conv6 = zext i8 %c.07 to i32
158  %or = or i32 %a, %conv6
159  %conv3 = trunc i32 %or to i8
160  %call = call i32 @fn1(i8 signext %conv3)
161  %dec = add i8 %c.07, -1
; Signed i8 compare on the decremented IV controls the back edge.
162  %cmp = icmp sgt i8 %dec, -14
163  br i1 %cmp, label %for.body, label %for.end
164
165for.end:
166  ret i32 0
167}
168
169; CHECK-LABEL: @test5
170; CHECK: zext i32 %b
171; CHECK: for.cond:
172; CHECK: phi i64
173; CHECK: icmp ule i64
174
; @test5: returns the i32 sum of a[i] for i = 0, 1, ... while i <= %b
; (unsigned). The i32 IV %i.0 is used in an unsigned compare against the
; loop-invariant %b and as a zero-extended GEP index.
175define i32 @test5(i32* %a, i32 %b) {
176entry:
177  br label %for.cond
178
179for.cond:
; Loop header: running sum and IV, followed by the unsigned exit test.
180  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
181  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
182  %cmp = icmp ule i32 %i.0, %b
183  br i1 %cmp, label %for.body, label %for.end
184
185for.body:
; Zero-extended use of the IV as an array index.
186  %idxprom = zext i32 %i.0 to i64
187  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
188  %0 = load i32, i32* %arrayidx, align 4
189  %add = add nsw i32 %sum.0, %0
190  %inc = add nsw i32 %i.0, 1
191  br label %for.cond
192
193for.end:
194  ret i32 %sum.0
195}
196
; @test6: returns the i32 sum of a[i] for i = 0, 1, ... while i <= %b (signed).
; Unlike @test5, the exit compare is signed (sle) while the GEP index use of
; the IV is a zero extension, so the compare and the extension differ in
; signedness.
197define i32 @test6(i32* %a, i32 %b) {
198; CHECK-LABEL: @test6(
199; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
200; CHECK: for.cond:
201; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]
202
203entry:
204  br label %for.cond
205
206for.cond:
; Loop header: running sum and IV, followed by the signed exit test.
207  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
208  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
209  %cmp = icmp sle i32 %i.0, %b
210  br i1 %cmp, label %for.body, label %for.end
211
212for.body:
; Zero-extended use of the IV as an array index.
213  %idxprom = zext i32 %i.0 to i64
214  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
215  %0 = load i32, i32* %arrayidx, align 4
216  %add = add nsw i32 %sum.0, %0
217  %inc = add nsw i32 %i.0, 1
218  br label %for.cond
219
220for.end:
221  ret i32 %sum.0
222}
223
; @test7: summing loop with two exits that compare the same i32 IV against %b
; with different signedness: an unsigned (ule) test in the header and a signed
; (sle) test at the end of the body. The GEP index use of the IV is a sign
; extension. Returns the running sum as seen in the header.
224define i32 @test7(i32* %a, i32 %b) {
225; CHECK-LABEL: @test7(
226; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
227; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
228; CHECK: for.cond:
229; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]
230; CHECK: for.body:
231; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]
232
233entry:
234  br label %for.cond
235
236for.cond:
237  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
238  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
; First exit: unsigned compare of the IV with %b.
239  %cmp = icmp ule i32 %i.0, %b
240  br i1 %cmp, label %for.body, label %for.end
241
242for.body:
; Sign-extended use of the IV as an array index.
243  %idxprom = sext i32 %i.0 to i64
244  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
245  %0 = load i32, i32* %arrayidx, align 4
246  %add = add nsw i32 %sum.0, %0
247  %inc = add nsw i32 %i.0, 1
; Second exit: signed compare of the (pre-increment) IV with %b.
248  %cmp2 = icmp sle i32 %i.0, %b
249  br i1 %cmp2, label %for.cond, label %for.end
250
251for.end:
252  ret i32 %sum.0
253}
254
; @test8: summing loop whose IV starts at the argument %init rather than 0.
; The loop is entered only when %init > 0 (signed); otherwise the function
; returns 0 via "leave". The header exit test is unsigned (ule against %b),
; the GEP index use of the IV is a sign extension, and the body has a second
; exit taken when 0 < %inc (signed) is false.
255define i32 @test8(i32* %a, i32 %b, i32 %init) {
256; CHECK-LABEL: @test8(
257; CHECK: [[INIT_SEXT:%[a-z0-9]+]] = sext i32 %init to i64
258; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
259; CHECK: for.cond:
260;     Note: %indvars.iv is the sign extension of %i.0
261; CHECK: %indvars.iv = phi i64 [ [[INIT_SEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
262; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]
263
264entry:
; Guard: only enter the loop when %init is strictly positive.
265  %e = icmp sgt i32 %init, 0
266  br i1 %e, label %for.cond, label %leave
267
268for.cond:
269  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
270  %i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
; Header exit: unsigned compare of the IV with %b.
271  %cmp = icmp ule i32 %i.0, %b
272  br i1 %cmp, label %for.body, label %for.end
273
274for.body:
; Sign-extended use of the IV as an array index.
275  %idxprom = sext i32 %i.0 to i64
276  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
277  %0 = load i32, i32* %arrayidx, align 4
278  %add = add nsw i32 %sum.0, %0
279  %inc = add nsw i32 %i.0, 1
; Latch exit: continue only while the incremented IV is still positive.
280  %cmp2 = icmp slt i32 0, %inc
281  br i1 %cmp2, label %for.cond, label %for.end
282
283for.end:
284  ret i32 %sum.0
285
286leave:
287  ret i32 0
288}
289
; @test9: counterpart of @test8 with the signedness roles swapped.
; The loop is entered only when %init > 0 (signed); otherwise the function
; returns 0 via "leave". The header exit test is signed (slt against %b),
; the GEP index use of the IV is a zero extension, and the body has a second
; exit taken when 0 < %inc (signed) is false.
290define i32 @test9(i32* %a, i32 %b, i32 %init) {
291; CHECK-LABEL: @test9(
292; CHECK: [[INIT_ZEXT:%[a-z0-9]+]] = zext i32 %init to i64
293; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
294; CHECK: for.cond:
295;     Note: %indvars.iv is the zero extension of %i.0
296; CHECK: %indvars.iv = phi i64 [ [[INIT_ZEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
297; CHECK: icmp slt i64 %indvars.iv, [[B_SEXT]]
298
299entry:
; Guard: only enter the loop when %init is strictly positive.
300  %e = icmp sgt i32 %init, 0
301  br i1 %e, label %for.cond, label %leave
302
303for.cond:
304  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
305  %i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
; Header exit: signed compare of the IV with %b.
306  %cmp = icmp slt i32 %i.0, %b
307  br i1 %cmp, label %for.body, label %for.end
308
309for.body:
; Zero-extended use of the IV as an array index.
310  %idxprom = zext i32 %i.0 to i64
311  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
312  %0 = load i32, i32* %arrayidx, align 4
313  %add = add nsw i32 %sum.0, %0
314  %inc = add nsw i32 %i.0, 1
; Latch exit: continue only while the incremented IV is still positive.
315  %cmp2 = icmp slt i32 0, %inc
316  br i1 %cmp2, label %for.cond, label %for.end
317
318for.end:
319  ret i32 %sum.0
320
321leave:
322  ret i32 0
323}
324
; External sinks called from @test10 so that the i64 and i1 values passed to
; them have a use.
325declare void @consume.i64(i64)
326declare void @consume.i1(i1)
327
; @test10: single-block loop with i32 IV %i starting at 0 and running while
; the incremented value is < 11 (signed). Each iteration computes
; %iv = %i * -1, compares it for equality with the argument %v (result passed
; to @consume.i1), and passes the sign extension of %iv to @consume.i64.
; Always returns 22.
328define i32 @test10(i32 %v) {
329; CHECK-LABEL: @test10(
330 entry:
331; CHECK-NOT: zext
332  br label %loop
333
334 loop:
335; CHECK: loop:
336; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %loop ], [ 0, %entry ]
337; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
338; CHECK: [[MUL:%[a-z0-9]+]] = mul nsw i64 %indvars.iv, -1
339; CHECK: [[MUL_TRUNC:%[a-z0-9]+]] = trunc i64 [[MUL]] to i32
340; CHECK: [[CMP:%[a-z0-9]+]] = icmp eq i32 [[MUL_TRUNC]], %v
341; CHECK: call void @consume.i1(i1 [[CMP]])
342
343  %i = phi i32 [ 0, %entry ], [ %i.inc, %loop ]
344  %i.inc = add i32 %i, 1
; Negated IV; it feeds both the i32 equality compare and the sext below.
345  %iv = mul i32 %i, -1
346  %cmp = icmp eq i32 %iv, %v
347  call void @consume.i1(i1 %cmp)
; Back-edge condition on the incremented IV.
348  %be.cond = icmp slt i32 %i.inc, 11
; Sign-extended use of the negated IV.
349  %ext = sext i32 %iv to i64
350  call void @consume.i64(i64 %ext)
351  br i1 %be.cond, label %loop, label %leave
352
353 leave:
354  ret i32 22
355}
356