1; RUN: llc -O3 -mtriple arm64-apple-ios3 -aarch64-enable-gep-opt=false %s -o - | FileCheck %s
2; <rdar://problem/13621857>
3
4@block = common global i8* null, align 8
5
6define i32 @fct(i32 %i1, i32 %i2) {
7; CHECK: @fct
8; Sign extension is used more than once, thus it should not be folded.
9; CodeGenPrepare is not sharing sext across uses, thus this is folded because
10; of that.
11; _CHECK-NOT: , sxtw]
12entry:
13  %idxprom = sext i32 %i1 to i64
14  %0 = load i8*, i8** @block, align 8
15  %arrayidx = getelementptr inbounds i8, i8* %0, i64 %idxprom
16  %1 = load i8, i8* %arrayidx, align 1
17  %idxprom1 = sext i32 %i2 to i64
18  %arrayidx2 = getelementptr inbounds i8, i8* %0, i64 %idxprom1
19  %2 = load i8, i8* %arrayidx2, align 1
20  %cmp = icmp eq i8 %1, %2
21  br i1 %cmp, label %if.end, label %if.then
22
23if.then:                                          ; preds = %entry
24  %cmp7 = icmp ugt i8 %1, %2
25  %conv8 = zext i1 %cmp7 to i32
26  br label %return
27
28if.end:                                           ; preds = %entry
29  %inc = add nsw i32 %i1, 1
30  %inc9 = add nsw i32 %i2, 1
31  %idxprom10 = sext i32 %inc to i64
32  %arrayidx11 = getelementptr inbounds i8, i8* %0, i64 %idxprom10
33  %3 = load i8, i8* %arrayidx11, align 1
34  %idxprom12 = sext i32 %inc9 to i64
35  %arrayidx13 = getelementptr inbounds i8, i8* %0, i64 %idxprom12
36  %4 = load i8, i8* %arrayidx13, align 1
37  %cmp16 = icmp eq i8 %3, %4
38  br i1 %cmp16, label %if.end23, label %if.then18
39
40if.then18:                                        ; preds = %if.end
41  %cmp21 = icmp ugt i8 %3, %4
42  %conv22 = zext i1 %cmp21 to i32
43  br label %return
44
45if.end23:                                         ; preds = %if.end
46  %inc24 = add nsw i32 %i1, 2
47  %inc25 = add nsw i32 %i2, 2
48  %idxprom26 = sext i32 %inc24 to i64
49  %arrayidx27 = getelementptr inbounds i8, i8* %0, i64 %idxprom26
50  %5 = load i8, i8* %arrayidx27, align 1
51  %idxprom28 = sext i32 %inc25 to i64
52  %arrayidx29 = getelementptr inbounds i8, i8* %0, i64 %idxprom28
53  %6 = load i8, i8* %arrayidx29, align 1
54  %cmp32 = icmp eq i8 %5, %6
55  br i1 %cmp32, label %return, label %if.then34
56
57if.then34:                                        ; preds = %if.end23
58  %cmp37 = icmp ugt i8 %5, %6
59  %conv38 = zext i1 %cmp37 to i32
60  br label %return
61
62return:                                           ; preds = %if.end23, %if.then34, %if.then18, %if.then
63  %retval.0 = phi i32 [ %conv8, %if.then ], [ %conv22, %if.then18 ], [ %conv38, %if.then34 ], [ 1, %if.end23 ]
64  ret i32 %retval.0
65}
66
67define i32 @fct1(i32 %i1, i32 %i2) optsize {
68; CHECK: @fct1
69; Addressing are folded when optimizing for code size.
70; CHECK: , sxtw]
71; CHECK: , sxtw]
72entry:
73  %idxprom = sext i32 %i1 to i64
74  %0 = load i8*, i8** @block, align 8
75  %arrayidx = getelementptr inbounds i8, i8* %0, i64 %idxprom
76  %1 = load i8, i8* %arrayidx, align 1
77  %idxprom1 = sext i32 %i2 to i64
78  %arrayidx2 = getelementptr inbounds i8, i8* %0, i64 %idxprom1
79  %2 = load i8, i8* %arrayidx2, align 1
80  %cmp = icmp eq i8 %1, %2
81  br i1 %cmp, label %if.end, label %if.then
82
83if.then:                                          ; preds = %entry
84  %cmp7 = icmp ugt i8 %1, %2
85  %conv8 = zext i1 %cmp7 to i32
86  br label %return
87
88if.end:                                           ; preds = %entry
89  %inc = add nsw i32 %i1, 1
90  %inc9 = add nsw i32 %i2, 1
91  %idxprom10 = sext i32 %inc to i64
92  %arrayidx11 = getelementptr inbounds i8, i8* %0, i64 %idxprom10
93  %3 = load i8, i8* %arrayidx11, align 1
94  %idxprom12 = sext i32 %inc9 to i64
95  %arrayidx13 = getelementptr inbounds i8, i8* %0, i64 %idxprom12
96  %4 = load i8, i8* %arrayidx13, align 1
97  %cmp16 = icmp eq i8 %3, %4
98  br i1 %cmp16, label %if.end23, label %if.then18
99
100if.then18:                                        ; preds = %if.end
101  %cmp21 = icmp ugt i8 %3, %4
102  %conv22 = zext i1 %cmp21 to i32
103  br label %return
104
105if.end23:                                         ; preds = %if.end
106  %inc24 = add nsw i32 %i1, 2
107  %inc25 = add nsw i32 %i2, 2
108  %idxprom26 = sext i32 %inc24 to i64
109  %arrayidx27 = getelementptr inbounds i8, i8* %0, i64 %idxprom26
110  %5 = load i8, i8* %arrayidx27, align 1
111  %idxprom28 = sext i32 %inc25 to i64
112  %arrayidx29 = getelementptr inbounds i8, i8* %0, i64 %idxprom28
113  %6 = load i8, i8* %arrayidx29, align 1
114  %cmp32 = icmp eq i8 %5, %6
115  br i1 %cmp32, label %return, label %if.then34
116
117if.then34:                                        ; preds = %if.end23
118  %cmp37 = icmp ugt i8 %5, %6
119  %conv38 = zext i1 %cmp37 to i32
120  br label %return
121
122return:                                           ; preds = %if.end23, %if.then34, %if.then18, %if.then
123  %retval.0 = phi i32 [ %conv8, %if.then ], [ %conv22, %if.then18 ], [ %conv38, %if.then34 ], [ 1, %if.end23 ]
124  ret i32 %retval.0
125}
126
127; CHECK: @test
128; CHECK-NOT: , uxtw #2]
129define i32 @test(i32* %array, i8 zeroext %c, i32 %arg) {
130entry:
131  %conv = zext i8 %c to i32
132  %add = sub i32 0, %arg
133  %tobool = icmp eq i32 %conv, %add
134  br i1 %tobool, label %if.end, label %if.then
135
136if.then:                                          ; preds = %entry
137  %idxprom = zext i8 %c to i64
138  %arrayidx = getelementptr inbounds i32, i32* %array, i64 %idxprom
139  %0 = load volatile i32, i32* %arrayidx, align 4
140  %1 = load volatile i32, i32* %arrayidx, align 4
141  %add3 = add nsw i32 %1, %0
142  br label %if.end
143
144if.end:                                           ; preds = %entry, %if.then
145  %res.0 = phi i32 [ %add3, %if.then ], [ 0, %entry ]
146  ret i32 %res.0
147}
148
149
150; CHECK: @test2
151; CHECK: , uxtw #2]
152; CHECK: , uxtw #2]
153define i32 @test2(i32* %array, i8 zeroext %c, i32 %arg) optsize {
154entry:
155  %conv = zext i8 %c to i32
156  %add = sub i32 0, %arg
157  %tobool = icmp eq i32 %conv, %add
158  br i1 %tobool, label %if.end, label %if.then
159
160if.then:                                          ; preds = %entry
161  %idxprom = zext i8 %c to i64
162  %arrayidx = getelementptr inbounds i32, i32* %array, i64 %idxprom
163  %0 = load volatile i32, i32* %arrayidx, align 4
164  %1 = load volatile i32, i32* %arrayidx, align 4
165  %add3 = add nsw i32 %1, %0
166  br label %if.end
167
168if.end:                                           ; preds = %entry, %if.then
169  %res.0 = phi i32 [ %add3, %if.then ], [ 0, %entry ]
170  ret i32 %res.0
171}
172