; Checks the alignment directives that llc emits for function entries and
; loop bodies on 64-bit PowerPC under a range of -mcpu settings.
;
; Every invocation below selects exactly one FileCheck prefix:
;   GENERIC - ppc64
;   BASIC   - a2, e500mc, e5500
;   PWR     - 970, pwr4, pwr5, pwr5x, pwr6, pwr6x, pwr7, pwr8
;
; RUN: llc -mcpu=ppc64 < %s | FileCheck %s -check-prefix=GENERIC
; RUN: llc -mcpu=970 < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=a2 < %s | FileCheck %s -check-prefix=BASIC
; RUN: llc -mcpu=e500mc < %s | FileCheck %s -check-prefix=BASIC
; RUN: llc -mcpu=e5500 < %s | FileCheck %s -check-prefix=BASIC
; RUN: llc -mcpu=pwr4 < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr5 < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr5x < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr6 < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr6x < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr7 < %s | FileCheck %s -check-prefix=PWR
; RUN: llc -mcpu=pwr8 < %s | FileCheck %s -check-prefix=PWR
target datalayout = "E-m:e-i64:64-n32:64"
target triple = "powerpc64-unknown-linux-gnu"
15
; @foo: minimal straight-line function (returns %x shifted left by one) used
; to check the alignment directive emitted for a function entry.
; The directives below expect, between the `.globl foo` line and the `@foo`
; marker, `.p2align 2` for the GENERIC run and `.p2align 4` for the BASIC and
; PWR runs.
; Function Attrs: nounwind readnone
define signext i32 @foo(i32 signext %x) #0 {
entry:
  %mul = shl nsw i32 %x, 1
  ret i32 %mul

; GENERIC-LABEL: .globl  foo
; BASIC-LABEL: .globl  foo
; PWR-LABEL: .globl  foo
; GENERIC: .p2align  2
; BASIC: .p2align  4
; PWR: .p2align  4
; GENERIC: @foo
; BASIC: @foo
; PWR: @foo
}
32
; @loop: counted loop that handles two adjacent i32 elements of %a per
; iteration (indices %index and %index | 1), replacing each element v with
; (v + 4) * 3, and stepping %index by 2 until it reaches 2048. %x is unused.
; The directives below expect the sequence mtctr, lwzu, bdnz for every run.
; Between mtctr and lwzu the GENERIC run must not contain any `.p2align`,
; while the BASIC and PWR runs must contain `.p2align 4`.
; Function Attrs: nounwind
define void @loop(i32 signext %x, i32* nocapture %a) #1 {
entry:
  br label %vector.body

; GENERIC-LABEL: @loop
; BASIC-LABEL: @loop
; PWR-LABEL: @loop
; GENERIC: mtctr
; BASIC: mtctr
; PWR: mtctr
; GENERIC-NOT: .p2align
; BASIC: .p2align  4
; PWR: .p2align  4
; GENERIC: lwzu
; BASIC: lwzu
; PWR: lwzu
; GENERIC: bdnz
; BASIC: bdnz
; PWR: bdnz

vector.body:                                      ; preds = %vector.body, %entry
  %index = phi i64 [ 0, %entry ], [ %index.next, %vector.body ]
  %induction45 = or i64 %index, 1
  %0 = getelementptr inbounds i32, i32* %a, i64 %index
  %1 = getelementptr inbounds i32, i32* %a, i64 %induction45
  %2 = load i32, i32* %0, align 4
  %3 = load i32, i32* %1, align 4
  %4 = add nsw i32 %2, 4
  %5 = add nsw i32 %3, 4
  %6 = mul nsw i32 %4, 3
  %7 = mul nsw i32 %5, 3
  store i32 %6, i32* %0, align 4
  store i32 %7, i32* %1, align 4
  %index.next = add i64 %index, 2
  %8 = icmp eq i64 %index.next, 2048
  br i1 %8, label %for.end, label %vector.body

for.end:                                          ; preds = %vector.body
  ret void
}
74
; @sloop: counted loop that handles one i32 element of %a per iteration,
; replacing each element v with (v + 4) * 3, for indices 0 through 2047.
; %x is unused.
; The directives below expect mtctr followed by bdnz for every run. Between
; them the GENERIC run must not contain any `.p2align`, the BASIC run must
; contain `.p2align 4`, and the PWR run must contain `.p2align 5` (a larger
; alignment than the PWR expectation in @loop).
; Function Attrs: nounwind
define void @sloop(i32 signext %x, i32* nocapture %a) #1 {
entry:
  br label %for.body

; GENERIC-LABEL: @sloop
; BASIC-LABEL: @sloop
; PWR-LABEL: @sloop
; GENERIC: mtctr
; BASIC: mtctr
; PWR: mtctr
; GENERIC-NOT: .p2align
; BASIC: .p2align  4
; PWR: .p2align  5
; GENERIC: bdnz
; BASIC: bdnz
; PWR: bdnz

for.body:                                         ; preds = %for.body, %entry
  %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %0, 4
  %mul = mul nsw i32 %add, 3
  store i32 %mul, i32* %arrayidx, align 4
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  %exitcond = icmp eq i64 %indvars.iv.next, 2048
  br i1 %exitcond, label %for.end, label %for.body

for.end:                                          ; preds = %for.body
  ret void
}
107
; @test_minsize: same loop body as @loop (two adjacent i32 elements of %a per
; iteration, each v replaced with (v + 4) * 3, %index stepping by 2 up to
; 2048), but the function uses attribute group #2 instead of #1. %x is unused.
; The directives below expect the sequence mtctr, lwzu, bdnz for every run,
; and no `.p2align` between mtctr and lwzu under any of the three prefixes.
; Function Attrs: nounwind
define void @test_minsize(i32 signext %x, i32* nocapture %a) #2 {
entry:
  br label %vector.body

; GENERIC-LABEL: @test_minsize
; BASIC-LABEL: @test_minsize
; PWR-LABEL: @test_minsize
; GENERIC: mtctr
; BASIC: mtctr
; PWR: mtctr
; GENERIC-NOT: .p2align
; BASIC-NOT: .p2align
; PWR-NOT: .p2align
; GENERIC: lwzu
; BASIC: lwzu
; PWR: lwzu
; GENERIC: bdnz
; BASIC: bdnz
; PWR: bdnz

vector.body:                                      ; preds = %vector.body, %entry
  %index = phi i64 [ 0, %entry ], [ %index.next, %vector.body ]
  %induction45 = or i64 %index, 1
  %0 = getelementptr inbounds i32, i32* %a, i64 %index
  %1 = getelementptr inbounds i32, i32* %a, i64 %induction45
  %2 = load i32, i32* %0, align 4
  %3 = load i32, i32* %1, align 4
  %4 = add nsw i32 %2, 4
  %5 = add nsw i32 %3, 4
  %6 = mul nsw i32 %4, 3
  %7 = mul nsw i32 %5, 3
  store i32 %6, i32* %0, align 4
  store i32 %7, i32* %1, align 4
  %index.next = add i64 %index, 2
  %8 = icmp eq i64 %index.next, 2048
  br i1 %8, label %for.end, label %vector.body

for.end:                                          ; preds = %vector.body
  ret void
}
; Attribute groups referenced by the functions in this file:
;   #0 - @foo
;   #1 - @loop and @sloop
;   #2 - @test_minsize (adds minsize on top of nounwind)
attributes #0 = { nounwind readnone }
attributes #1 = { nounwind }
attributes #2 = { nounwind minsize }
152
153