1; RUN: llc < %s -march=arm64 -asm-verbose=false | FileCheck %s
2
3define i32 @t1(i32 %a, i32 %b) nounwind readnone ssp {
4entry:
5; CHECK-LABEL: t1:
6; CHECK: add w0, w1, w0
7; CHECK: ret
8  %add = add i32 %b, %a
9  ret i32 %add
10}
11
12define i32 @t2(i32 %a, i32 %b) nounwind readnone ssp {
13entry:
14; CHECK-LABEL: t2:
15; CHECK: udiv w0, w0, w1
16; CHECK: ret
17  %udiv = udiv i32 %a, %b
18  ret i32 %udiv
19}
20
21define i64 @t3(i64 %a, i64 %b) nounwind readnone ssp {
22entry:
23; CHECK-LABEL: t3:
24; CHECK: udiv x0, x0, x1
25; CHECK: ret
26  %udiv = udiv i64 %a, %b
27  ret i64 %udiv
28}
29
30define i32 @t4(i32 %a, i32 %b) nounwind readnone ssp {
31entry:
32; CHECK-LABEL: t4:
33; CHECK: sdiv w0, w0, w1
34; CHECK: ret
35  %sdiv = sdiv i32 %a, %b
36  ret i32 %sdiv
37}
38
39define i64 @t5(i64 %a, i64 %b) nounwind readnone ssp {
40entry:
41; CHECK-LABEL: t5:
42; CHECK: sdiv x0, x0, x1
43; CHECK: ret
44  %sdiv = sdiv i64 %a, %b
45  ret i64 %sdiv
46}
47
48define i32 @t6(i32 %a, i32 %b) nounwind readnone ssp {
49entry:
50; CHECK-LABEL: t6:
51; CHECK: lsl w0, w0, w1
52; CHECK: ret
53  %shl = shl i32 %a, %b
54  ret i32 %shl
55}
56
57define i64 @t7(i64 %a, i64 %b) nounwind readnone ssp {
58entry:
59; CHECK-LABEL: t7:
60; CHECK: lsl x0, x0, x1
61; CHECK: ret
62  %shl = shl i64 %a, %b
63  ret i64 %shl
64}
65
66define i32 @t8(i32 %a, i32 %b) nounwind readnone ssp {
67entry:
68; CHECK-LABEL: t8:
69; CHECK: lsr w0, w0, w1
70; CHECK: ret
71  %lshr = lshr i32 %a, %b
72  ret i32 %lshr
73}
74
75define i64 @t9(i64 %a, i64 %b) nounwind readnone ssp {
76entry:
77; CHECK-LABEL: t9:
78; CHECK: lsr x0, x0, x1
79; CHECK: ret
80  %lshr = lshr i64 %a, %b
81  ret i64 %lshr
82}
83
84define i32 @t10(i32 %a, i32 %b) nounwind readnone ssp {
85entry:
86; CHECK-LABEL: t10:
87; CHECK: asr w0, w0, w1
88; CHECK: ret
89  %ashr = ashr i32 %a, %b
90  ret i32 %ashr
91}
92
93define i64 @t11(i64 %a, i64 %b) nounwind readnone ssp {
94entry:
95; CHECK-LABEL: t11:
96; CHECK: asr x0, x0, x1
97; CHECK: ret
98  %ashr = ashr i64 %a, %b
99  ret i64 %ashr
100}
101
102define i32 @t12(i16 %a, i32 %x) nounwind ssp {
103entry:
104; CHECK-LABEL: t12:
105; CHECK: add	w0, w1, w0, sxth
106; CHECK: ret
107  %c = sext i16 %a to i32
108  %e = add i32 %x, %c
109  ret i32 %e
110}
111
112define i32 @t13(i16 %a, i32 %x) nounwind ssp {
113entry:
114; CHECK-LABEL: t13:
115; CHECK: add	w0, w1, w0, sxth #2
116; CHECK: ret
117  %c = sext i16 %a to i32
118  %d = shl i32 %c, 2
119  %e = add i32 %x, %d
120  ret i32 %e
121}
122
123define i64 @t14(i16 %a, i64 %x) nounwind ssp {
124entry:
125; CHECK-LABEL: t14:
126; CHECK: and	w8, w0, #0xffff
127; CHECK: add	x0, x1, w8, uxtw #3
128; CHECK: ret
129  %c = zext i16 %a to i64
130  %d = shl i64 %c, 3
131  %e = add i64 %x, %d
132  ret i64 %e
133}
134
135; rdar://9160598
136define i64 @t15(i64 %a, i64 %x) nounwind ssp {
137entry:
138; CHECK-LABEL: t15:
139; CHECK: add x0, x1, w0, uxtw
140; CHECK: ret
141  %b = and i64 %a, 4294967295
142  %c = add i64 %x, %b
143  ret i64 %c
144}
145
146define i64 @t16(i64 %x) nounwind ssp {
147entry:
148; CHECK-LABEL: t16:
149; CHECK: lsl x0, x0, #1
150; CHECK: ret
151  %a = shl i64 %x, 1
152  ret i64 %a
153}
154
155; rdar://9166974
156define i64 @t17(i16 %a, i64 %x) nounwind ssp {
157entry:
158; CHECK-LABEL: t17:
159; CHECK: sxth [[REG:x[0-9]+]], w0
160; CHECK: neg x0, [[REG]], lsl #32
161; CHECK: ret
162  %tmp16 = sext i16 %a to i64
163  %tmp17 = mul i64 %tmp16, -4294967296
164  ret i64 %tmp17
165}
166
167define i32 @t18(i32 %a, i32 %b) nounwind readnone ssp {
168entry:
169; CHECK-LABEL: t18:
170; CHECK: sdiv w0, w0, w1
171; CHECK: ret
172  %sdiv = call i32 @llvm.aarch64.sdiv.i32(i32 %a, i32 %b)
173  ret i32 %sdiv
174}
175
176define i64 @t19(i64 %a, i64 %b) nounwind readnone ssp {
177entry:
178; CHECK-LABEL: t19:
179; CHECK: sdiv x0, x0, x1
180; CHECK: ret
181  %sdiv = call i64 @llvm.aarch64.sdiv.i64(i64 %a, i64 %b)
182  ret i64 %sdiv
183}
184
185define i32 @t20(i32 %a, i32 %b) nounwind readnone ssp {
186entry:
187; CHECK-LABEL: t20:
188; CHECK: udiv w0, w0, w1
189; CHECK: ret
190  %udiv = call i32 @llvm.aarch64.udiv.i32(i32 %a, i32 %b)
191  ret i32 %udiv
192}
193
194define i64 @t21(i64 %a, i64 %b) nounwind readnone ssp {
195entry:
196; CHECK-LABEL: t21:
197; CHECK: udiv x0, x0, x1
198; CHECK: ret
199  %udiv = call i64 @llvm.aarch64.udiv.i64(i64 %a, i64 %b)
200  ret i64 %udiv
201}
202
203declare i32 @llvm.aarch64.sdiv.i32(i32, i32) nounwind readnone
204declare i64 @llvm.aarch64.sdiv.i64(i64, i64) nounwind readnone
205declare i32 @llvm.aarch64.udiv.i32(i32, i32) nounwind readnone
206declare i64 @llvm.aarch64.udiv.i64(i64, i64) nounwind readnone
207
208; 32-bit not.
209define i32 @inv_32(i32 %x) nounwind ssp {
210entry:
211; CHECK: inv_32
212; CHECK: mvn w0, w0
213; CHECK: ret
214  %inv = xor i32 %x, -1
215  ret i32 %inv
216}
217
218; 64-bit not.
219define i64 @inv_64(i64 %x) nounwind ssp {
220entry:
221; CHECK: inv_64
222; CHECK: mvn x0, x0
223; CHECK: ret
224  %inv = xor i64 %x, -1
225  ret i64 %inv
226}
227
228; Multiplying by a power of two plus or minus one is better done via shift
229; and add/sub rather than the madd/msub instructions. The latter are 4+ cycles,
230; and the former are two (total for the two instruction sequence for subtract).
231define i32 @f0(i32 %a) nounwind readnone ssp {
232; CHECK-LABEL: f0:
233; CHECK-NEXT: add w0, w0, w0, lsl #3
234; CHECK-NEXT: ret
235  %res = mul i32 %a, 9
236  ret i32 %res
237}
238
239define i64 @f1(i64 %a) nounwind readnone ssp {
240; CHECK-LABEL: f1:
241; CHECK-NEXT: lsl x8, x0, #4
242; CHECK-NEXT: sub x0, x8, x0
243; CHECK-NEXT: ret
244  %res = mul i64 %a, 15
245  ret i64 %res
246}
247
248define i32 @f2(i32 %a) nounwind readnone ssp {
249; CHECK-LABEL: f2:
250; CHECK-NEXT: lsl w8, w0, #3
251; CHECK-NEXT: sub w0, w8, w0
252; CHECK-NEXT: ret
253  %res = mul nsw i32 %a, 7
254  ret i32 %res
255}
256
257define i64 @f3(i64 %a) nounwind readnone ssp {
258; CHECK-LABEL: f3:
259; CHECK-NEXT: add x0, x0, x0, lsl #4
260; CHECK-NEXT: ret
261  %res = mul nsw i64 %a, 17
262  ret i64 %res
263}
264
265define i32 @f4(i32 %a) nounwind readnone ssp {
266; CHECK-LABEL: f4:
267; CHECK-NEXT: add w0, w0, w0, lsl #1
268; CHECK-NEXT: ret
269  %res = mul i32 %a, 3
270  ret i32 %res
271}
272