; RUN: opt < %s -sroa -S | FileCheck %s
;
; Exercises SROA on allocas whose addresses flow through PHI nodes and select
; instructions before being loaded from or stored to.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-n8:16:32:64"

; A PHI of two element pointers into one alloca is loaded. The patterns below
; expect the alloca, stores and loads to disappear and the PHI to carry the
; stored constants directly.
define i32 @test1() {
; CHECK-LABEL: @test1(
entry:
  %a = alloca [2 x i32]
; CHECK-NOT: alloca

  %a0 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 0
  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 0, i32* %a0
  store i32 1, i32* %a1
  %v0 = load i32, i32* %a0
  %v1 = load i32, i32* %a1
; CHECK-NOT: store
; CHECK-NOT: load

  %cond = icmp sle i32 %v0, %v1
  br i1 %cond, label %then, label %exit

then:
  br label %exit

exit:
  %phi = phi i32* [ %a1, %then ], [ %a0, %entry ]
; CHECK: phi i32 [ 1, %{{.*}} ], [ 0, %{{.*}} ]

  %result = load i32, i32* %phi
  ret i32 %result
}

; Same shape as @test1, using a select instead of a PHI.
define i32 @test2() {
; CHECK-LABEL: @test2(
entry:
  %a = alloca [2 x i32]
; CHECK-NOT: alloca

  %a0 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 0
  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 0, i32* %a0
  store i32 1, i32* %a1
  %v0 = load i32, i32* %a0
  %v1 = load i32, i32* %a1
; CHECK-NOT: store
; CHECK-NOT: load

  %cond = icmp sle i32 %v0, %v1
  %select = select i1 %cond, i32* %a1, i32* %a0
; CHECK: select i1 %{{.*}}, i32 1, i32 0

  %result = load i32, i32* %select
  ret i32 %result
}

; A switch feeds an eight-way PHI over redundant GEPs into the same alloca.
define i32 @test3(i32 %x) {
; CHECK-LABEL: @test3(
entry:
  %a = alloca [2 x i32]
; CHECK-NOT: alloca

  ; Note that we build redundant GEPs here to ensure that having different GEPs
  ; into the same alloca partition continues to work with PHI speculation. This
  ; was the underlying cause of PR13926.
  %a0 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 0
  %a0b = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 0
  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  %a1b = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 0, i32* %a0
  store i32 1, i32* %a1
; CHECK-NOT: store

  switch i32 %x, label %bb0 [ i32 1, label %bb1
                              i32 2, label %bb2
                              i32 3, label %bb3
                              i32 4, label %bb4
                              i32 5, label %bb5
                              i32 6, label %bb6
                              i32 7, label %bb7 ]

bb0:
  br label %exit
bb1:
  br label %exit
bb2:
  br label %exit
bb3:
  br label %exit
bb4:
  br label %exit
bb5:
  br label %exit
bb6:
  br label %exit
bb7:
  br label %exit

exit:
  %phi = phi i32* [ %a1, %bb0 ], [ %a0, %bb1 ], [ %a0, %bb2 ], [ %a1, %bb3 ],
                  [ %a1b, %bb4 ], [ %a0b, %bb5 ], [ %a0b, %bb6 ], [ %a1b, %bb7 ]
; CHECK: phi i32 [ 1, %{{.*}} ], [ 0, %{{.*}} ], [ 0, %{{.*}} ], [ 1, %{{.*}} ], [ 1, %{{.*}} ], [ 0, %{{.*}} ], [ 0, %{{.*}} ], [ 1, %{{.*}} ]

  %result = load i32, i32* %phi
  ret i32 %result
}

; Both select operands are the same pointer. The patterns expect the select to
; vanish and the stored 0 to be returned.
define i32 @test4() {
; CHECK-LABEL: @test4(
entry:
  %a = alloca [2 x i32]
; CHECK-NOT: alloca

  %a0 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 0
  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 0, i32* %a0
  store i32 1, i32* %a1
  %v0 = load i32, i32* %a0
  %v1 = load i32, i32* %a1
; CHECK-NOT: store
; CHECK-NOT: load

  %cond = icmp sle i32 %v0, %v1
  %select = select i1 %cond, i32* %a0, i32* %a0
; CHECK-NOT: select

  %result = load i32, i32* %select
  ret i32 %result
; CHECK: ret i32 0
}

; The select condition is the constant true, choosing the alloca element over
; the argument %b. The patterns expect the stored 1 to be returned.
define i32 @test5(i32* %b) {
; CHECK-LABEL: @test5(
entry:
  %a = alloca [2 x i32]
; CHECK-NOT: alloca

  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 1, i32* %a1
; CHECK-NOT: store

  %select = select i1 true, i32* %a1, i32* %b
; CHECK-NOT: select

  %result = load i32, i32* %select
; CHECK-NOT: load

  ret i32 %result
; CHECK: ret i32 1
}

declare void @f(i32*, i32*)

; Selects with constant conditions, two of which are passed to @f. The patterns
; expect the alloca operand of those two selects to be replaced by undef.
define i32 @test6(i32* %b) {
; CHECK-LABEL: @test6(
entry:
  %a = alloca [2 x i32]
  %c = alloca i32
; CHECK-NOT: alloca

  %a1 = getelementptr [2 x i32], [2 x i32]* %a, i64 0, i32 1
  store i32 1, i32* %a1

  %select = select i1 true, i32* %a1, i32* %b
  %select2 = select i1 false, i32* %a1, i32* %b
  %select3 = select i1 false, i32* %c, i32* %b
; CHECK: %[[select2:.*]] = select i1 false, i32* undef, i32* %b
; CHECK: %[[select3:.*]] = select i1 false, i32* undef, i32* %b

  ; Note, this would potentially escape the alloca pointer except for the
  ; constant folding of the select.
  call void @f(i32* %select2, i32* %select3)
; CHECK: call void @f(i32* %[[select2]], i32* %[[select3]])


  %result = load i32, i32* %select
; CHECK-NOT: load

  %dead = load i32, i32* %c

  ret i32 %result
; CHECK: ret i32 1
}

; PHI over two GEPs off a single i32 alloca, at element indices 0 and 1. The
; patterns expect the alloca to be removed and a PHI of i32 whose %good value
; is 0.
define i32 @test7() {
; CHECK-LABEL: @test7(
; CHECK-NOT: alloca

entry:
  %X = alloca i32
  br i1 undef, label %good, label %bad

good:
  %Y1 = getelementptr i32, i32* %X, i64 0
  store i32 0, i32* %Y1
  br label %exit

bad:
  %Y2 = getelementptr i32, i32* %X, i64 1
  store i32 0, i32* %Y2
  br label %exit

exit:
  %P = phi i32* [ %Y1, %good ], [ %Y2, %bad ]
; CHECK: %[[phi:.*]] = phi i32 [ 0, %good ],
  %Z2 = load i32, i32* %P
  ret i32 %Z2
; CHECK: ret i32 %[[phi]]
}

define i32 @test8(i32 %b, i32* %ptr) {
; Ensure that we rewrite allocas to the used type when that use is hidden by
; a PHI that can be speculated.
; CHECK-LABEL: @test8(
; CHECK-NOT: alloca
; CHECK-NOT: load
; CHECK: %[[value:.*]] = load i32, i32* %ptr
; CHECK-NOT: load
; CHECK: %[[result:.*]] = phi i32 [ undef, %else ], [ %[[value]], %then ]
; CHECK-NEXT: ret i32 %[[result]]

entry:
  %f = alloca float
  %test = icmp ne i32 %b, 0
  br i1 %test, label %then, label %else

then:
  br label %exit

else:
  %bitcast = bitcast float* %f to i32*
  br label %exit

exit:
  %phi = phi i32* [ %bitcast, %else ], [ %ptr, %then ]
  %loaded = load i32, i32* %phi, align 4
  ret i32 %loaded
}

define i32 @test9(i32 %b, i32* %ptr) {
; Same as @test8 but for a select rather than a PHI node.
; CHECK-LABEL: @test9(
; CHECK-NOT: alloca
; CHECK-NOT: load
; CHECK: %[[value:.*]] = load i32, i32* %ptr
; CHECK-NOT: load
; CHECK: %[[result:.*]] = select i1 %{{.*}}, i32 undef, i32 %[[value]]
; CHECK-NEXT: ret i32 %[[result]]

entry:
  %f = alloca float
  store i32 0, i32* %ptr
  %test = icmp ne i32 %b, 0
  %bitcast = bitcast float* %f to i32*
  %select = select i1 %test, i32* %bitcast, i32* %ptr
  %loaded = load i32, i32* %select, align 4
  ret i32 %loaded
}

define float @test10(i32 %b, float* %ptr) {
; Don't try to promote allocas which are not eligible for it even after
; rewriting due to the necessity of inserting bitcasts when speculating a PHI
; node.
; CHECK-LABEL: @test10(
; CHECK: %[[alloca:.*]] = alloca
; CHECK: %[[argvalue:.*]] = load float, float* %ptr
; CHECK: %[[cast:.*]] = bitcast double* %[[alloca]] to float*
; CHECK: %[[allocavalue:.*]] = load float, float* %[[cast]]
; CHECK: %[[result:.*]] = phi float [ %[[allocavalue]], %else ], [ %[[argvalue]], %then ]
; CHECK-NEXT: ret float %[[result]]

entry:
  %f = alloca double
  store double 0.0, double* %f
  %test = icmp ne i32 %b, 0
  br i1 %test, label %then, label %else

then:
  br label %exit

else:
  %bitcast = bitcast double* %f to float*
  br label %exit

exit:
  %phi = phi float* [ %bitcast, %else ], [ %ptr, %then ]
  %loaded = load float, float* %phi, align 4
  ret float %loaded
}

define float @test11(i32 %b, float* %ptr) {
; Same as @test10 but for a select rather than a PHI node.
; CHECK-LABEL: @test11(
; CHECK: %[[alloca:.*]] = alloca
; CHECK: %[[cast:.*]] = bitcast double* %[[alloca]] to float*
; CHECK: %[[allocavalue:.*]] = load float, float* %[[cast]]
; CHECK: %[[argvalue:.*]] = load float, float* %ptr
; CHECK: %[[result:.*]] = select i1 %{{.*}}, float %[[allocavalue]], float %[[argvalue]]
; CHECK-NEXT: ret float %[[result]]

entry:
  %f = alloca double
  store double 0.0, double* %f
  store float 0.0, float* %ptr
  %test = icmp ne i32 %b, 0
  %bitcast = bitcast double* %f to float*
  %select = select i1 %test, float* %bitcast, float* %ptr
  %loaded = load float, float* %select, align 4
  ret float %loaded
}

define i32 @test12(i32 %x, i32* %p) {
; Ensure we don't crash or fail to nuke dead selects of allocas if no load is
; ever found.
; CHECK-LABEL: @test12(
; CHECK-NOT: alloca
; CHECK-NOT: select
; CHECK: ret i32 %x

entry:
  %a = alloca i32
  store i32 %x, i32* %a
  %dead = select i1 undef, i32* %a, i32* %p
  %load = load i32, i32* %a
  ret i32 %load
}

define i32 @test13(i32 %x, i32* %p) {
; Ensure we don't crash or fail to nuke dead phis of allocas if no load is ever
; found.
; CHECK-LABEL: @test13(
; CHECK-NOT: alloca
; CHECK-NOT: phi
; CHECK: ret i32 %x

entry:
  %a = alloca i32
  store i32 %x, i32* %a
  br label %loop

loop:
  %phi = phi i32* [ %p, %entry ], [ %a, %loop ]
  br i1 undef, label %loop, label %exit

exit:
  %load = load i32, i32* %a
  ret i32 %load
}

define i32 @test14(i1 %b1, i1 %b2, i32* %ptr) {
; Check for problems when there are both selects and phis and one is
; speculatable toward promotion but the other is not. That should block all of
; the speculation.
; CHECK-LABEL: @test14(
; CHECK: alloca
; CHECK: alloca
; CHECK: select
; CHECK: phi
; CHECK: phi
; CHECK: select
; CHECK: ret i32

entry:
  %f = alloca i32
  %g = alloca i32
  store i32 0, i32* %f
  store i32 0, i32* %g
  %f.select = select i1 %b1, i32* %f, i32* %ptr
  br i1 %b2, label %then, label %else

then:
  br label %exit

else:
  br label %exit

exit:
  %f.phi = phi i32* [ %f, %then ], [ %f.select, %else ]
  %g.phi = phi i32* [ %g, %then ], [ %ptr, %else ]
  %f.loaded = load i32, i32* %f.phi
  %g.select = select i1 %b1, i32* %g, i32* %g.phi
  %g.loaded = load i32, i32* %g.select
  %result = add i32 %f.loaded, %g.loaded
  ret i32 %result
}

define i32 @PR13905() {
; Check a pattern where we have a chain of dead phi nodes to ensure they are
; deleted and promotion can proceed.
; CHECK-LABEL: @PR13905(
; CHECK-NOT: alloca i32
; CHECK: ret i32 undef

entry:
  %h = alloca i32
  store i32 0, i32* %h
  br i1 undef, label %loop1, label %exit

loop1:
  %phi1 = phi i32* [ null, %entry ], [ %h, %loop1 ], [ %h, %loop2 ]
  br i1 undef, label %loop1, label %loop2

loop2:
  br i1 undef, label %loop1, label %exit

exit:
  %phi2 = phi i32* [ %phi1, %loop2 ], [ null, %entry ]
  ret i32 undef
}

define i32 @PR13906() {
; Another pattern which can lead to crashes due to failing to clear out dead
; PHI nodes or select nodes. This triggers subtly differently from the above
; cases because the PHI node is (recursively) alive, but the select is dead.
; CHECK-LABEL: @PR13906(
; CHECK-NOT: alloca

entry:
  %c = alloca i32
  store i32 0, i32* %c
  br label %for.cond

for.cond:
  %d.0 = phi i32* [ undef, %entry ], [ %c, %if.then ], [ %d.0, %for.cond ]
  br i1 undef, label %if.then, label %for.cond

if.then:
  %tmpcast.d.0 = select i1 undef, i32* %c, i32* %d.0
  br label %for.cond
}

define i64 @PR14132(i1 %flag) {
; CHECK-LABEL: @PR14132(
; Here we form a PHI-node by promoting the pointer alloca first, and then in
; order to promote the other two allocas, we speculate the load of the
; now-phi-node-pointer. In doing so we end up loading a 64-bit value from an i8
; alloca. While this is a bit dubious, we were asserting on trying to
; rewrite it. The trick is that the code using the value may carefully take
; steps to only use the not-undef bits, and so we need to at least loosely
; support this.
entry:
  %a = alloca i64, align 8
  %b = alloca i8, align 8
  %ptr = alloca i64*, align 8
; CHECK-NOT: alloca

  %ptr.cast = bitcast i64** %ptr to i8**
  store i64 0, i64* %a, align 8
  store i8 1, i8* %b, align 8
  store i64* %a, i64** %ptr, align 8
  br i1 %flag, label %if.then, label %if.end

if.then:
  store i8* %b, i8** %ptr.cast, align 8
  br label %if.end
; CHECK-NOT: store
; CHECK: %[[ext:.*]] = zext i8 1 to i64

if.end:
  %tmp = load i64*, i64** %ptr, align 8
  %result = load i64, i64* %tmp, align 8
; CHECK-NOT: load
; CHECK: %[[result:.*]] = phi i64 [ %[[ext]], %if.then ], [ 0, %entry ]

  ret i64 %result
; CHECK-NEXT: ret i64 %[[result]]
}

define float @PR16687(i64 %x, i1 %flag) {
; CHECK-LABEL: @PR16687(
; Check that even when we try to speculate the same phi twice (in two slices)
; on an otherwise promotable construct, we don't get ahead of ourselves and try
; to promote one of the slices prior to speculating it.

entry:
  %a = alloca i64, align 8
  store i64 %x, i64* %a
  br i1 %flag, label %then, label %else
; CHECK-NOT: alloca
; CHECK-NOT: store
; CHECK: %[[lo:.*]] = trunc i64 %x to i32
; CHECK: %[[shift:.*]] = lshr i64 %x, 32
; CHECK: %[[hi:.*]] = trunc i64 %[[shift]] to i32

then:
  %a.f = bitcast i64* %a to float*
  br label %end
; CHECK: %[[lo_cast:.*]] = bitcast i32 %[[lo]] to float

else:
  %a.raw = bitcast i64* %a to i8*
  %a.raw.4 = getelementptr i8, i8* %a.raw, i64 4
  %a.raw.4.f = bitcast i8* %a.raw.4 to float*
  br label %end
; CHECK: %[[hi_cast:.*]] = bitcast i32 %[[hi]] to float

end:
  %a.phi.f = phi float* [ %a.f, %then ], [ %a.raw.4.f, %else ]
  %f = load float, float* %a.phi.f
  ret float %f
; CHECK: %[[phi:.*]] = phi float [ %[[lo_cast]], %then ], [ %[[hi_cast]], %else ]
; CHECK-NOT: load
; CHECK: ret float %[[phi]]
}

; Verifies we fixed PR20425. We should be able to promote all allocas to
; registers in this test.
;
; %0 = slice
; %1 = slice
; %2 = phi(%0, %1) // == slice
define float @simplify_phi_nodes_that_equal_slice(i1 %cond, float* %temp) {
; CHECK-LABEL: @simplify_phi_nodes_that_equal_slice(
entry:
  %arr = alloca [4 x float], align 4
; CHECK-NOT: alloca
  br i1 %cond, label %then, label %else

then:
  %0 = getelementptr inbounds [4 x float], [4 x float]* %arr, i64 0, i64 3
  store float 1.000000e+00, float* %0, align 4
  br label %merge

else:
  %1 = getelementptr inbounds [4 x float], [4 x float]* %arr, i64 0, i64 3
  store float 2.000000e+00, float* %1, align 4
  br label %merge

merge:
  %2 = phi float* [ %0, %then ], [ %1, %else ]
  store float 0.000000e+00, float* %temp, align 4
  %3 = load float, float* %2, align 4
  ret float %3
}

; A slightly complicated example for PR20425.
;
; %0 = slice
; %1 = phi(%0) // == slice
; %2 = slice
; %3 = phi(%1, %2) // == slice
define float @simplify_phi_nodes_that_equal_slice_2(i1 %cond, float* %temp) {
; CHECK-LABEL: @simplify_phi_nodes_that_equal_slice_2(
entry:
  %arr = alloca [4 x float], align 4
; CHECK-NOT: alloca
  br i1 %cond, label %then, label %else

then:
  %0 = getelementptr inbounds [4 x float], [4 x float]* %arr, i64 0, i64 3
  store float 1.000000e+00, float* %0, align 4
  br label %then2

then2:
  %1 = phi float* [ %0, %then ]
  store float 2.000000e+00, float* %1, align 4
  br label %merge

else:
  %2 = getelementptr inbounds [4 x float], [4 x float]* %arr, i64 0, i64 3
  store float 3.000000e+00, float* %2, align 4
  br label %merge

merge:
  %3 = phi float* [ %1, %then2 ], [ %2, %else ]
  store float 0.000000e+00, float* %temp, align 4
  %4 = load float, float* %3, align 4
  ret float %4
}

%struct.S = type { i32 }

; Verifies we fixed PR20822. We have a foldable PHI feeding a speculatable PHI
; which requires the rewriting of the speculated PHI to handle insertion
; when the incoming pointer is itself from a PHI node. We would previously
; insert a bitcast instruction *before* a PHI, producing an invalid module;
; make sure we insert *after* the first non-PHI instruction.
define void @PR20822() {
; CHECK-LABEL: @PR20822(
entry:
  %f = alloca %struct.S, align 4
; CHECK: %[[alloca:.*]] = alloca
  br i1 undef, label %if.end, label %for.cond

for.cond:                                         ; preds = %entry
  br label %if.end

if.end:                                           ; preds = %for.cond, %entry
  %f2 = phi %struct.S* [ %f, %entry ], [ %f, %for.cond ]
; CHECK: phi i32
; CHECK: %[[cast:.*]] = bitcast i32* %[[alloca]] to %struct.S*
  phi i32 [ undef, %entry ], [ undef, %for.cond ]
  br i1 undef, label %if.then5, label %if.then2

if.then2:                                         ; preds = %if.end
  br label %if.then5

if.then5:                                         ; preds = %if.then2, %if.end
  %f1 = phi %struct.S* [ undef, %if.then2 ], [ %f2, %if.end ]
; CHECK: phi {{.*}} %[[cast]]
  store %struct.S undef, %struct.S* %f1, align 4
  ret void
}

; Pointers at byte offsets 1 and 4 of an align-8 [8 x i8] alloca are stored to
; and loaded from, and one of them reaches a PHI that also takes the argument
; %z. The patterns expect a [7 x i8] alloca and align 1 on the rewritten stores
; and loads, including the load through the PHI.
define i32 @phi_align(i32* %z) {
; CHECK-LABEL: @phi_align(
entry:
  %a = alloca [8 x i8], align 8
; CHECK: alloca [7 x i8]

  %a0x = getelementptr [8 x i8], [8 x i8]* %a, i64 0, i32 1
  %a0 = bitcast i8* %a0x to i32*
  %a1x = getelementptr [8 x i8], [8 x i8]* %a, i64 0, i32 4
  %a1 = bitcast i8* %a1x to i32*
; CHECK: store i32 0, {{.*}}, align 1
  store i32 0, i32* %a0, align 1
; CHECK: store i32 1, {{.*}}, align 1
  store i32 1, i32* %a1, align 4
; CHECK: load {{.*}}, align 1
  %v0 = load i32, i32* %a0, align 1
; CHECK: load {{.*}}, align 1
  %v1 = load i32, i32* %a1, align 4
  %cond = icmp sle i32 %v0, %v1
  br i1 %cond, label %then, label %exit

then:
  br label %exit

exit:
; CHECK: %phi = phi i32* [ {{.*}}, %then ], [ %z, %entry ]
; CHECK-NEXT: %result = load i32, i32* %phi, align 1
  %phi = phi i32* [ %a1, %then ], [ %z, %entry ]
  %result = load i32, i32* %phi, align 4
  ret i32 %result
}