; Codegen regression test. The lit command on the next line compiles this
; module with llc for the Cortex-A53 CPU and pipes the resulting assembly into
; FileCheck, which matches it against the directives embedded in @main.
1; RUN: llc -mcpu cortex-a53 < %s | FileCheck %s
; Data layout: little-endian (e), ELF name mangling (m:e), i64 aligned to 64
; bits, i128 aligned to 128 bits, native integer widths 8/16/32/64, and a
; 128-bit natural stack alignment (S128).
2target datalayout = "e-m:e-i64:64-i128:128-n8:16:32:64-S128"
3target triple = "aarch64--linux-gnu"
4
; External functions with no body in this file. @main calls exactly one of
; @f / @f2 with i8* views of its two stack arrays.
5declare void @f(i8*, i8*)
6declare void @f2(i8*, i8*)
; Called once at the top of @main. The name looks like the Itanium mangling of
; `setup()` -- presumably a C++ origin; its behaviour is not visible here.
7declare void @_Z5setupv()
; memset intrinsic (i8* destination, i64 length) used by @main to zero part of
; %b1. Attribute group #3 is referenced, but no definition of it is visible in
; this file.
8declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1) #3
9
; @main writes a sequence of partially overlapping stores into the stack array
; %b1 (a 16-byte zeroing followed by stores of 1 that overlap it), reloads
; element 0, and calls @f or @f2 depending on whether that element equals 1.
; It takes no arguments and returns 0 on both paths. Attribute group #1 is
; referenced, but no definition of it is visible in this file.
10define i32 @main() local_unnamed_addr #1 {
11; Make sure the stores happen in the correct order (the exact instructions could change).
; The directives below pin the relative order of the zeroing store pair, the
; scalar store, the two 128-bit stores and the reload in the emitted assembly.
; NOTE(review): the offsets look consistent with %b1 living at sp+48, i.e.
; sp+72 = element 6 (memset), sp+80 = element 8, sp+48 = element 0 and
; sp+64 = element 4 -- confirm against actual llc output before relying on it.
12; CHECK-LABEL: main:
13; CHECK: stp xzr, xzr, [sp, #72]
14; CHECK: str w9, [sp, #80]
15; CHECK: str q0, [sp, #48]
16; CHECK: ldr w8, [sp, #48]
17; CHECK: str q0, [sp, #64]
18
19for.body.lr.ph.i.i.i.i.i.i63:
; Two [10 x i32] (40-byte) stack arrays, each 16-byte aligned. %x0 and %x1 are
; their i8* views, passed to @f / @f2 at the end. Only %b1 is written here.
20  %b1 = alloca [10 x i32], align 16
21  %x0 = bitcast [10 x i32]* %b1 to i8*
22  %b2 = alloca [10 x i32], align 16
23  %x1 = bitcast [10 x i32]* %b2 to i8*
24  tail call void @_Z5setupv()
; Zero 16 bytes starting at %b1[6], i.e. elements 6..9 (bytes 24..39).
25  %x2 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 6
26  %x3 = bitcast i32* %x2 to i8*
27  call void @llvm.memset.p0i8.i64(i8* align 8 %x3, i8 0, i64 16, i1 false)
; %arraydecay2 points at element 0; it is used by the reload further down.
28  %arraydecay2 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 0
; Store <1,1,1,1> to elements 0..3 (bytes 0..15). No overlap with the memset.
29  %x4 = bitcast [10 x i32]* %b1 to <4 x i32>*
30  store <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32>* %x4, align 16
; Store <1,1,1,1> to elements 4..7 (bytes 16..31). Elements 6 and 7 were just
; zeroed by the memset, so this store must take effect after the zeroing.
31  %incdec.ptr.i7.i.i.i.i.i.i64.3 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 4
32  %x5 = bitcast i32* %incdec.ptr.i7.i.i.i.i.i.i64.3 to <4 x i32>*
33  store <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32>* %x5, align 16
; Store 1 to element 8 (bytes 32..35), which also lies inside the zeroed range.
; Element 9 is the only one left holding the memset's zero.
34  %incdec.ptr.i7.i.i.i.i.i.i64.7 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 8
35  store i32 1, i32* %incdec.ptr.i7.i.i.i.i.i.i64.7, align 16
; Reload element 0 (written by the first vector store) and branch on == 1.
36  %x6 = load i32, i32* %arraydecay2, align 16
37  %cmp6 = icmp eq i32 %x6, 1
38  br i1 %cmp6, label %for.inc, label %if.then
39
; Taken when element 0 equals 1.
40for.inc:
41  call void @f(i8* %x0, i8* %x1)
42  ret i32 0
43
; Taken when element 0 differs from 1.
44if.then:
45  call void @f2(i8* %x0, i8* %x1)
46  ret i32 0
47}
48