1; RUN: opt < %s -S -early-cse | FileCheck %s 2; RUN: opt < %s -S -passes=early-cse | FileCheck %s 3 4declare void @llvm.assume(i1) nounwind 5 6; CHECK-LABEL: @test1( 7define void @test1(i8 %V, i32 *%P) { 8 %A = bitcast i64 42 to double ;; dead 9 %B = add i32 4, 19 ;; constant folds 10 store i32 %B, i32* %P 11 ; CHECK-NEXT: store i32 23, i32* %P 12 13 %C = zext i8 %V to i32 14 %D = zext i8 %V to i32 ;; CSE 15 store volatile i32 %C, i32* %P 16 store volatile i32 %D, i32* %P 17 ; CHECK-NEXT: %C = zext i8 %V to i32 18 ; CHECK-NEXT: store volatile i32 %C 19 ; CHECK-NEXT: store volatile i32 %C 20 21 %E = add i32 %C, %C 22 %F = add i32 %C, %C 23 store volatile i32 %E, i32* %P 24 store volatile i32 %F, i32* %P 25 ; CHECK-NEXT: %E = add i32 %C, %C 26 ; CHECK-NEXT: store volatile i32 %E 27 ; CHECK-NEXT: store volatile i32 %E 28 29 %G = add nuw i32 %C, %C 30 store volatile i32 %G, i32* %P 31 ; CHECK-NEXT: store volatile i32 %E 32 ret void 33} 34 35 36;; Simple load value numbering. 37; CHECK-LABEL: @test2( 38define i32 @test2(i32 *%P) { 39 %V1 = load i32, i32* %P 40 %V2 = load i32, i32* %P 41 %Diff = sub i32 %V1, %V2 42 ret i32 %Diff 43 ; CHECK: ret i32 0 44} 45 46; CHECK-LABEL: @test2a( 47define i32 @test2a(i32 *%P, i1 %b) { 48 %V1 = load i32, i32* %P 49 tail call void @llvm.assume(i1 %b) 50 %V2 = load i32, i32* %P 51 %Diff = sub i32 %V1, %V2 52 ret i32 %Diff 53 ; CHECK: ret i32 0 54} 55 56;; Cross block load value numbering. 57; CHECK-LABEL: @test3( 58define i32 @test3(i32 *%P, i1 %Cond) { 59 %V1 = load i32, i32* %P 60 br i1 %Cond, label %T, label %F 61T: 62 store i32 4, i32* %P 63 ret i32 42 64F: 65 %V2 = load i32, i32* %P 66 %Diff = sub i32 %V1, %V2 67 ret i32 %Diff 68 ; CHECK: F: 69 ; CHECK: ret i32 0 70} 71 72; CHECK-LABEL: @test3a( 73define i32 @test3a(i32 *%P, i1 %Cond, i1 %b) { 74 %V1 = load i32, i32* %P 75 br i1 %Cond, label %T, label %F 76T: 77 store i32 4, i32* %P 78 ret i32 42 79F: 80 tail call void @llvm.assume(i1 %b) 81 %V2 = load i32, i32* %P 82 %Diff = sub i32 %V1, %V2 83 ret i32 %Diff 84 ; CHECK: F: 85 ; CHECK: ret i32 0 86} 87 88;; Cross block load value numbering stops when stores happen. 89; CHECK-LABEL: @test4( 90define i32 @test4(i32 *%P, i1 %Cond) { 91 %V1 = load i32, i32* %P 92 br i1 %Cond, label %T, label %F 93T: 94 ret i32 42 95F: 96 ; Clobbers V1 97 store i32 42, i32* %P 98 99 %V2 = load i32, i32* %P 100 %Diff = sub i32 %V1, %V2 101 ret i32 %Diff 102 ; CHECK: F: 103 ; CHECK: ret i32 %Diff 104} 105 106declare i32 @func(i32 *%P) readonly 107 108;; Simple call CSE'ing. 109; CHECK-LABEL: @test5( 110define i32 @test5(i32 *%P) { 111 %V1 = call i32 @func(i32* %P) 112 %V2 = call i32 @func(i32* %P) 113 %Diff = sub i32 %V1, %V2 114 ret i32 %Diff 115 ; CHECK: ret i32 0 116} 117 118;; Trivial Store->load forwarding 119; CHECK-LABEL: @test6( 120define i32 @test6(i32 *%P) { 121 store i32 42, i32* %P 122 %V1 = load i32, i32* %P 123 ret i32 %V1 124 ; CHECK: ret i32 42 125} 126 127; CHECK-LABEL: @test6a( 128define i32 @test6a(i32 *%P, i1 %b) { 129 store i32 42, i32* %P 130 tail call void @llvm.assume(i1 %b) 131 %V1 = load i32, i32* %P 132 ret i32 %V1 133 ; CHECK: ret i32 42 134} 135 136;; Trivial dead store elimination. 137; CHECK-LABEL: @test7( 138define void @test7(i32 *%P) { 139 store i32 42, i32* %P 140 store i32 45, i32* %P 141 ret void 142 ; CHECK-NEXT: store i32 45 143 ; CHECK-NEXT: ret void 144} 145 146;; Readnone functions aren't invalidated by stores. 147; CHECK-LABEL: @test8( 148define i32 @test8(i32 *%P) { 149 %V1 = call i32 @func(i32* %P) readnone 150 store i32 4, i32* %P 151 %V2 = call i32 @func(i32* %P) readnone 152 %Diff = sub i32 %V1, %V2 153 ret i32 %Diff 154 ; CHECK: ret i32 0 155} 156 157;; Trivial DSE can't be performed across a readonly call. The call 158;; can observe the earlier write. 159; CHECK-LABEL: @test9( 160define i32 @test9(i32 *%P) { 161 store i32 4, i32* %P 162 %V1 = call i32 @func(i32* %P) readonly 163 store i32 5, i32* %P 164 ret i32 %V1 165 ; CHECK: store i32 4, i32* %P 166 ; CHECK-NEXT: %V1 = call i32 @func(i32* %P) 167 ; CHECK-NEXT: store i32 5, i32* %P 168 ; CHECK-NEXT: ret i32 %V1 169} 170 171;; Trivial DSE can be performed across a readnone call. 172; CHECK-LABEL: @test10 173define i32 @test10(i32 *%P) { 174 store i32 4, i32* %P 175 %V1 = call i32 @func(i32* %P) readnone 176 store i32 5, i32* %P 177 ret i32 %V1 178 ; CHECK-NEXT: %V1 = call i32 @func(i32* %P) 179 ; CHECK-NEXT: store i32 5, i32* %P 180 ; CHECK-NEXT: ret i32 %V1 181} 182 183;; Trivial dead store elimination - should work for an entire series of dead stores too. 184; CHECK-LABEL: @test11( 185define void @test11(i32 *%P) { 186 store i32 42, i32* %P 187 store i32 43, i32* %P 188 store i32 44, i32* %P 189 store i32 45, i32* %P 190 ret void 191 ; CHECK-NEXT: store i32 45 192 ; CHECK-NEXT: ret void 193} 194 195; CHECK-LABEL: @test12( 196define i32 @test12(i1 %B, i32* %P1, i32* %P2) { 197 %load0 = load i32, i32* %P1 198 %1 = load atomic i32, i32* %P2 seq_cst, align 4 199 %load1 = load i32, i32* %P1 200 %sel = select i1 %B, i32 %load0, i32 %load1 201 ret i32 %sel 202 ; CHECK: load i32, i32* %P1 203 ; CHECK: load i32, i32* %P1 204} 205 206define void @dse1(i32 *%P) { 207; CHECK-LABEL: @dse1 208; CHECK-NOT: store 209 %v = load i32, i32* %P 210 store i32 %v, i32* %P 211 ret void 212} 213 214define void @dse2(i32 *%P) { 215; CHECK-LABEL: @dse2 216; CHECK-NOT: store 217 %v = load atomic i32, i32* %P seq_cst, align 4 218 store i32 %v, i32* %P 219 ret void 220} 221 222define void @dse3(i32 *%P) { 223; CHECK-LABEL: @dse3 224; CHECK-NOT: store 225 %v = load atomic i32, i32* %P seq_cst, align 4 226 store atomic i32 %v, i32* %P unordered, align 4 227 ret void 228} 229 230define i32 @dse4(i32 *%P, i32 *%Q) { 231; CHECK-LABEL: @dse4 232; CHECK-NOT: store 233; CHECK: ret i32 0 234 %a = load i32, i32* %Q 235 %v = load atomic i32, i32* %P unordered, align 4 236 store atomic i32 %v, i32* %P unordered, align 4 237 %b = load i32, i32* %Q 238 %res = sub i32 %a, %b 239 ret i32 %res 240} 241 242; Note that in this example, %P and %Q could in fact be the same 243; pointer. %v could be different than the value observed for %a 244; and that's okay because we're using relaxed memory ordering. 245; The only guarantee we have to provide is that each of the loads 246; has to observe some value written to that location. We do 247; not have to respect the order in which those writes were done. 248define i32 @dse5(i32 *%P, i32 *%Q) { 249; CHECK-LABEL: @dse5 250; CHECK-NOT: store 251; CHECK: ret i32 0 252 %v = load atomic i32, i32* %P unordered, align 4 253 %a = load atomic i32, i32* %Q unordered, align 4 254 store atomic i32 %v, i32* %P unordered, align 4 255 %b = load atomic i32, i32* %Q unordered, align 4 256 %res = sub i32 %a, %b 257 ret i32 %res 258} 259 260 261define void @dse_neg1(i32 *%P) { 262; CHECK-LABEL: @dse_neg1 263; CHECK: store 264 %v = load i32, i32* %P 265 store i32 5, i32* %P 266 ret void 267} 268 269; Could remove the store, but only if ordering was somehow 270; encoded. 271define void @dse_neg2(i32 *%P) { 272; CHECK-LABEL: @dse_neg2 273; CHECK: store 274 %v = load i32, i32* %P 275 store atomic i32 %v, i32* %P seq_cst, align 4 276 ret void 277} 278 279