; RUN: opt -basicaa -memcpyopt -S %s | FileCheck %s

; Exercises -memcpyopt on a memset that is followed by a memcpy into the same
; destination. The expectations in this file look for the memset being shrunk
; to the bytes that lie past the copied prefix, and for the pair being left
; untouched when the destinations differ or when the destination is accessed
; between the two calls.

target datalayout = "e-m:o-i64:64-f80:128-n8:16:32:64-S128"

; Basic case: the memset fills %dst_size bytes of %dst and the memcpy then
; writes %src_size bytes at the same address. The expected output starts the
; memset at %dst + %src_size and gives it the length
; (dst_size <= src_size) ? 0 : dst_size - src_size, followed by the original
; memcpy.
; CHECK-LABEL: define void @test
; CHECK: [[ULE:%[0-9]+]] = icmp ule i64 %dst_size, %src_size
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i64 %dst_size, %src_size
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i64 0, i64 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i64 %src_size
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 1 [[DST]], i8 %c, i64 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test(i8* %src, i64 %src_size, i8* %dst, i64 %dst_size, i8 %c) {
  call void @llvm.memset.p0i8.i64(i8* %dst, i8 %c, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
  ret void
}

; Mixed length types: the memset length is i32 and the memcpy length is i64.
; The expected output zero-extends the memset length to i64 before the
; compare/subtract/select sequence and emits the shrunken memset with an i64
; length.
; CHECK-LABEL: define void @test_different_types_i32_i64
; CHECK: [[DSTSIZE:%[0-9]+]] = zext i32 %dst_size to i64
; CHECK: [[ULE:%[0-9]+]] = icmp ule i64 [[DSTSIZE]], %src_size
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i64 [[DSTSIZE]], %src_size
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i64 0, i64 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i64 %src_size
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 1 [[DST]], i8 %c, i64 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_different_types_i32_i64(i8* %dst, i8* %src, i32 %dst_size, i64 %src_size, i8 %c) {
  call void @llvm.memset.p0i8.i32(i8* %dst, i8 %c, i32 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
  ret void
}

; Mixed length types: the memset length is i128 and the memcpy length is i32.
; The expected output zero-extends the memcpy length to i128 for the size
; arithmetic and the pointer offset, while the memcpy itself keeps its i32
; length operand.
; CHECK-LABEL: define void @test_different_types_i128_i32
; CHECK: [[SRCSIZE:%[0-9]+]] = zext i32 %src_size to i128
; CHECK: [[ULE:%[0-9]+]] = icmp ule i128 %dst_size, [[SRCSIZE]]
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i128 %dst_size, [[SRCSIZE]]
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i128 0, i128 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i128 [[SRCSIZE]]
; CHECK-NEXT: call void @llvm.memset.p0i8.i128(i8* align 1 [[DST]], i8 %c, i128 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_different_types_i128_i32(i8* %dst, i8* %src, i128 %dst_size, i32 %src_size, i8 %c) {
  call void @llvm.memset.p0i8.i128(i8* %dst, i8 %c, i128 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %src_size, i1 false)
  ret void
}

; Mixed length types: the memset length is i32 and the memcpy length is i128.
; The expected output zero-extends the memset length to i128 and emits the
; shrunken memset through the i128-length intrinsic.
; CHECK-LABEL: define void @test_different_types_i32_i128
; CHECK: [[DSTSIZE:%[0-9]+]] = zext i32 %dst_size to i128
; CHECK: [[ULE:%[0-9]+]] = icmp ule i128 [[DSTSIZE]], %src_size
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i128 [[DSTSIZE]], %src_size
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i128 0, i128 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i128 %src_size
; CHECK-NEXT: call void @llvm.memset.p0i8.i128(i8* align 1 [[DST]], i8 %c, i128 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i128(i8* %dst, i8* %src, i128 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_different_types_i32_i128(i8* %dst, i8* %src, i32 %dst_size, i128 %src_size, i8 %c) {
  call void @llvm.memset.p0i8.i32(i8* %dst, i8 %c, i32 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i128(i8* %dst, i8* %src, i128 %src_size, i1 false)
  ret void
}

; Mixed length types: the memset length is i64 and the memcpy length is i32.
; The expected output zero-extends the memcpy length to i64 for the size
; arithmetic and the pointer offset, while the memcpy itself keeps its i32
; length operand.
; CHECK-LABEL: define void @test_different_types_i64_i32
; CHECK: [[SRCSIZE:%[0-9]+]] = zext i32 %src_size to i64
; CHECK: [[ULE:%[0-9]+]] = icmp ule i64 %dst_size, [[SRCSIZE]]
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i64 %dst_size, [[SRCSIZE]]
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i64 0, i64 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i64 [[SRCSIZE]]
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 1 [[DST]], i8 %c, i64 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_different_types_i64_i32(i8* %dst, i8* %src, i64 %dst_size, i32 %src_size, i8 %c) {
  call void @llvm.memset.p0i8.i64(i8* %dst, i8 %c, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %src, i32 %src_size, i1 false)
  ret void
}

; Alignment case: the memset destination is align 8 and the memcpy copies a
; constant 80 bytes. The resulting memset is expected to carry align 8.
; CHECK-LABEL: define void @test_align_same
; CHECK: call void @llvm.memset.p0i8.i64(i8* align 8 {{.*}}, i8 0, i64 {{.*}}, i1 false)
define void @test_align_same(i8* %src, i8* %dst, i64 %dst_size) {
  call void @llvm.memset.p0i8.i64(i8* align 8 %dst, i8 0, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 80, i1 false)
  ret void
}

; Alignment case: the memset destination is align 8 but the memcpy copies a
; constant 36 bytes (a multiple of 4, not of 8). The resulting memset is
; expected to carry align 4.
; CHECK-LABEL: define void @test_align_min
; CHECK: call void @llvm.memset.p0i8.i64(i8* align 4 {{.*}}, i8 0, i64 {{.*}}, i1 false)
define void @test_align_min(i8* %src, i8* %dst, i64 %dst_size) {
  call void @llvm.memset.p0i8.i64(i8* align 8 %dst, i8 0, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 36, i1 false)
  ret void
}

; Alignment case: the memset carries no alignment, while the memcpy marks its
; destination align 8 and copies a constant 80 bytes. The resulting memset is
; expected to carry align 8.
; CHECK-LABEL: define void @test_align_memcpy
; CHECK: call void @llvm.memset.p0i8.i64(i8* align 8 {{.*}}, i8 0, i64 {{.*}}, i1 false)
define void @test_align_memcpy(i8* %src, i8* %dst, i64 %dst_size) {
  call void @llvm.memset.p0i8.i64(i8* %dst, i8 0, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 %dst, i8* align 8 %src, i64 80, i1 false)
  ret void
}

; The destination starts out as an i64* and reaches both calls through a
; bitcast to i8*. The expected output keeps the bitcast as the first
; instruction and then shows the same shrunken-memset sequence as @test.
; CHECK-LABEL: define void @test_non_i8_dst_type
; CHECK-NEXT: %dst = bitcast i64* %dst_pi64 to i8*
; CHECK: [[ULE:%[0-9]+]] = icmp ule i64 %dst_size, %src_size
; CHECK: [[SIZEDIFF:%[0-9]+]] = sub i64 %dst_size, %src_size
; CHECK: [[SIZE:%[0-9]+]] = select i1 [[ULE]], i64 0, i64 [[SIZEDIFF]]
; CHECK: [[DST:%[0-9]+]] = getelementptr i8, i8* %dst, i64 %src_size
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 1 [[DST]], i8 %c, i64 [[SIZE]], i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_non_i8_dst_type(i8* %src, i64 %src_size, i64* %dst_pi64, i64 %dst_size, i8 %c) {
  %dst = bitcast i64* %dst_pi64 to i8*
  call void @llvm.memset.p0i8.i64(i8* %dst, i8 %c, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, i64 %src_size, i1 false)
  ret void
}

; Negative case: the memset writes %dst but the memcpy writes %dst2. Both
; calls are expected to come out unchanged.
; CHECK-LABEL: define void @test_different_dst
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* %dst, i8 0, i64 %dst_size, i1 false)
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst2, i8* %src, i64 %src_size, i1 false)
; CHECK-NEXT: ret void
define void @test_different_dst(i8* %dst2, i8* %src, i64 %src_size, i8* %dst, i64 %dst_size) {
  call void @llvm.memset.p0i8.i64(i8* %dst, i8 0, i64 %dst_size, i1 false)
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst2, i8* %src, i64 %src_size, i1 false)
  ret void
}

; Make sure we also take into account dependencies on the destination.

; Negative case: a load from %a sits between the memset of %a and the memcpy
; into %a. All three instructions are expected to come out unchanged and in
; the same order.
; CHECK-LABEL: define i8 @test_intermediate_read
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* %a, i8 0, i64 64, i1 false)
; CHECK-NEXT: %r = load i8, i8* %a
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 24, i1 false)
; CHECK-NEXT: ret i8 %r
define i8 @test_intermediate_read(i8* %a, i8* %b) #0 {
  call void @llvm.memset.p0i8.i64(i8* %a, i8 0, i64 64, i1 false)
  %r = load i8, i8* %a
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 24, i1 false)
  ret i8 %r
}

; Two adjacent 8-byte arrays; @test_intermediate_write allocates one of these
; and addresses the first byte of each field.
%struct = type { [8 x i8], [8 x i8] }

; Negative case: %a0 and %a1 point at the first byte of the first and second
; field of a stack %struct. The memset clears 16 bytes from %a0, a store then
; writes 1 through %a1, and the memcpy overwrites 8 bytes at %a0. Every
; instruction is expected to come out unchanged and in the same order.
; CHECK-LABEL: define void @test_intermediate_write
; CHECK-NEXT: %a = alloca %struct
; CHECK-NEXT: %a0 = getelementptr %struct, %struct* %a, i32 0, i32 0, i32 0
; CHECK-NEXT: %a1 = getelementptr %struct, %struct* %a, i32 0, i32 1, i32 0
; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* %a0, i8 0, i64 16, i1 false)
; CHECK-NEXT: store i8 1, i8* %a1
; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a0, i8* %b, i64 8, i1 false)
; CHECK-NEXT: ret void
define void @test_intermediate_write(i8* %b) #0 {
  %a = alloca %struct
  %a0 = getelementptr %struct, %struct* %a, i32 0, i32 0, i32 0
  %a1 = getelementptr %struct, %struct* %a, i32 0, i32 1, i32 0
  call void @llvm.memset.p0i8.i64(i8* %a0, i8 0, i64 16, i1 false)
  store i8 1, i8* %a1
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a0, i8* %b, i64 8, i1 false)
  ret void
}

; Declarations of the memset/memcpy intrinsic overloads used in this file, one
; pair per length type (i64, i32, i128).
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1)
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture readonly, i64, i1)
declare void @llvm.memset.p0i8.i32(i8* nocapture, i8, i32, i1)
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture readonly, i32, i1)
declare void @llvm.memset.p0i8.i128(i8* nocapture, i8, i128, i1)
declare void @llvm.memcpy.p0i8.p0i8.i128(i8* nocapture, i8* nocapture readonly, i128, i1)
