; Codegen test for the llvm.fma.f32 intrinsic on powerpc64le (pwr8, +vsx).
; Every function below issues several FMAs that all use %b as the first
; multiplicand and stores each result through the pointer %d.  The output of
; the first llc invocation is matched against the CHECK prefix; the output of
; the second one (fast-isel at -O0) is matched against the CHECK-FISL prefix.
;
; Background on the two FMA encodings named in the expectations (per the
; Power ISA): xsmaddasp ("A-form") computes T = A*B + T, so the target
; register starts out holding the addend; xsmaddmsp ("M-form") computes
; T = A*T + B, so the target register starts out holding a multiplicand.
;
; The XFAIL marker tells lit that the whole file is expected to fail.
; NOTE(review): the reason is not recorded in this file - confirm that the
; marker is still needed before relying on the expectations below.
; RUN: llc < %s -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 -mattr=+vsx | FileCheck %s
; RUN: llc < %s -mtriple=powerpc64le-unknown-linux-gnu -mcpu=pwr8 -mattr=+vsx -fast-isel -O0 | FileCheck -check-prefix=CHECK-FISL %s
; XFAIL: *

; test1sp: two FMAs with the same addend, %b*%c + %a and %b*%e + %a, stored to
; %d[0] and %d[1] respectively.
define void @test1sp(float %a, float %b, float %c, float %e, float* nocapture %d) #0 {
entry:
  %0 = tail call float @llvm.fma.f32(float %b, float %c, float %a)
  store float %0, float* %d, align 4
  %1 = tail call float @llvm.fma.f32(float %b, float %e, float %a)
  %arrayidx1 = getelementptr inbounds float, float* %d, i64 1
  store float %1, float* %arrayidx1, align 4
  ret void

; Default pipeline: one M-form FMA (target is register 3) and one A-form FMA
; (target is register 1), followed by the two stores.
; CHECK-LABEL: @test1sp
; CHECK-DAG: li [[C1:[0-9]+]], 4
; CHECK-DAG: xsmaddmsp 3, 2, 1
; CHECK-DAG: xsmaddasp 1, 2, 4
; CHECK-DAG: stxsspx 3, 0, 7
; CHECK-DAG: stxsspx 1, 7, [[C1]]
; CHECK: blr

; Fast-isel: register 1 is first copied to register 0 with fmr, and both FMAs
; are A-form.
; CHECK-FISL-LABEL: @test1sp
; CHECK-FISL-DAG: fmr 0, 1
; CHECK-FISL-DAG: xsmaddasp 0, 2, 3
; CHECK-FISL-DAG: stxsspx 0, 0, 7
; CHECK-FISL-DAG: xsmaddasp 1, 2, 4
; CHECK-FISL-DAG: li [[C1:[0-9]+]], 4
; CHECK-FISL-DAG: stxsspx 1, 7, [[C1]]
; CHECK-FISL: blr
}

; test2sp: three FMAs with the same addend %a (second multiplicands %c, %e and
; %f), stored to %d[0], %d[1] and %d[2].
define void @test2sp(float %a, float %b, float %c, float %e, float %f, float* nocapture %d) #0 {
entry:
  %0 = tail call float @llvm.fma.f32(float %b, float %c, float %a)
  store float %0, float* %d, align 4
  %1 = tail call float @llvm.fma.f32(float %b, float %e, float %a)
  %arrayidx1 = getelementptr inbounds float, float* %d, i64 1
  store float %1, float* %arrayidx1, align 4
  %2 = tail call float @llvm.fma.f32(float %b, float %f, float %a)
  %arrayidx2 = getelementptr inbounds float, float* %d, i64 2
  store float %2, float* %arrayidx2, align 4
  ret void

; CHECK-LABEL: @test2sp
; CHECK-DAG: li [[C1:[0-9]+]], 4
; CHECK-DAG: li [[C2:[0-9]+]], 8
; FIXME: We now miss this because of copy ordering at the MI level.
; (The CHECX-DAG spelling matches neither FileCheck prefix used by this file,
; so the six lines below are inert; for the default pipeline only the two li
; instructions and the blr are actually matched.)
; CHECX-DAG: xsmaddmsp 3, 2, 1
; CHECX-DAG: xsmaddmsp 4, 2, 1
; CHECX-DAG: xsmaddasp 1, 2, 5
; CHECX-DAG: stxsspx 3, 0, 8
; CHECX-DAG: stxsspx 4, 8, [[C1]]
; CHECX-DAG: stxsspx 1, 8, [[C2]]
; CHECK: blr

; Fast-isel: all three FMAs are A-form; the first two each work on a copy of
; register 1 made with fmr, and the last one targets register 1 itself.
; CHECK-FISL-LABEL: @test2sp
; CHECK-FISL-DAG: fmr 0, 1
; CHECK-FISL-DAG: xsmaddasp 0, 2, 3
; CHECK-FISL-DAG: stxsspx 0, 0, 8
; CHECK-FISL-DAG: fmr 0, 1
; CHECK-FISL-DAG: xsmaddasp 0, 2, 4
; CHECK-FISL-DAG: li [[C1:[0-9]+]], 4
; CHECK-FISL-DAG: stxsspx 0, 8, [[C1]]
; CHECK-FISL-DAG: xsmaddasp 1, 2, 5
; CHECK-FISL-DAG: li [[C2:[0-9]+]], 8
; CHECK-FISL-DAG: stxsspx 1, 8, [[C2]]
; CHECK-FISL: blr
}

; test3sp: four FMAs.  %2 is chained: it uses the result %1 as its addend
; instead of %a.  Results are stored out of order: %0 to %d[0], %2 to %d[3],
; %3 to %d[2], and finally %1 to %d[1].
define void @test3sp(float %a, float %b, float %c, float %e, float %f, float* nocapture %d) #0 {
entry:
  %0 = tail call float @llvm.fma.f32(float %b, float %c, float %a)
  store float %0, float* %d, align 4
  %1 = tail call float @llvm.fma.f32(float %b, float %e, float %a)
  %2 = tail call float @llvm.fma.f32(float %b, float %c, float %1)
  %arrayidx1 = getelementptr inbounds float, float* %d, i64 3
  store float %2, float* %arrayidx1, align 4
  %3 = tail call float @llvm.fma.f32(float %b, float %f, float %a)
  %arrayidx2 = getelementptr inbounds float, float* %d, i64 2
  store float %3, float* %arrayidx2, align 4
  %arrayidx3 = getelementptr inbounds float, float* %d, i64 1
  store float %1, float* %arrayidx3, align 4
  ret void

; Default pipeline: register 1 is copied once (captured as F1); two FMAs are
; M-form and two are A-form.
; CHECK-LABEL: @test3sp
; CHECK-DAG: fmr [[F1:[0-9]+]], 1
; CHECK-DAG: li [[C1:[0-9]+]], 12
; CHECK-DAG: li [[C2:[0-9]+]], 8
; CHECK-DAG: li [[C3:[0-9]+]], 4
; CHECK-DAG: xsmaddmsp 4, 2, 1
; CHECK-DAG: xsmaddasp 1, 2, 5

; Note: We could convert this next FMA to M-type as well, but it would require
; re-ordering the instructions.
; CHECK-DAG: xsmaddasp [[F1]], 2, 3

; CHECK-DAG: xsmaddmsp 3, 2, 4
; CHECK-DAG: stxsspx [[F1]], 0, 8
; CHECK-DAG: stxsspx 3, 8, [[C1]]
; CHECK-DAG: stxsspx 1, 8, [[C2]]
; CHECK-DAG: stxsspx 4, 8, [[C3]]
; CHECK: blr

; Fast-isel: every FMA is A-form, with fmr copies providing the addend.
; CHECK-FISL-LABEL: @test3sp
; CHECK-FISL-DAG: fmr [[F1:[0-9]+]], 1
; CHECK-FISL-DAG: xsmaddasp [[F1]], 2, 4
; CHECK-FISL-DAG: fmr 4, [[F1]]
; CHECK-FISL-DAG: xsmaddasp 4, 2, 3
; CHECK-FISL-DAG: li [[C1:[0-9]+]], 12
; CHECK-FISL-DAG: stxsspx 4, 8, [[C1]]
; CHECK-FISL-DAG: xsmaddasp 1, 2, 5
; CHECK-FISL-DAG: li [[C2:[0-9]+]], 8
; CHECK-FISL-DAG: stxsspx 1, 8, [[C2]]
; CHECK-FISL-DAG: li [[C3:[0-9]+]], 4
; CHECK-FISL-DAG: stxsspx 0, 8, [[C3]]
; CHECK-FISL: blr
}

; test4sp: the same four FMAs as test3sp, but %1 is stored to %d[1] right
; after it is computed, i.e. before the chained FMA %2 that consumes it.
define void @test4sp(float %a, float %b, float %c, float %e, float %f, float* nocapture %d) #0 {
entry:
  %0 = tail call float @llvm.fma.f32(float %b, float %c, float %a)
  store float %0, float* %d, align 4
  %1 = tail call float @llvm.fma.f32(float %b, float %e, float %a)
  %arrayidx1 = getelementptr inbounds float, float* %d, i64 1
  store float %1, float* %arrayidx1, align 4
  %2 = tail call float @llvm.fma.f32(float %b, float %c, float %1)
  %arrayidx3 = getelementptr inbounds float, float* %d, i64 3
  store float %2, float* %arrayidx3, align 4
  %3 = tail call float @llvm.fma.f32(float %b, float %f, float %a)
  %arrayidx4 = getelementptr inbounds float, float* %d, i64 2
  store float %3, float* %arrayidx4, align 4
  ret void

; Default pipeline: only the first FMA listed is M-form; the remaining three
; are A-form.
; CHECK-LABEL: @test4sp
; CHECK-DAG: fmr [[F1:[0-9]+]], 1
; CHECK-DAG: li [[C1:[0-9]+]], 4
; CHECK-DAG: li [[C2:[0-9]+]], 8
; CHECK-DAG: xsmaddmsp 4, 2, 1

; Note: We could convert this next FMA to M-type as well, but it would require
; re-ordering the instructions.
; CHECK-DAG: xsmaddasp 1, 2, 5

; CHECK-DAG: xsmaddasp [[F1]], 2, 3
; CHECK-DAG: stxsspx [[F1]], 0, 8
; CHECK-DAG: stxsspx 4, 8, [[C1]]
; CHECK-DAG: li [[C3:[0-9]+]], 12
; CHECK-DAG: xsmaddasp 4, 2, 3
; CHECK-DAG: stxsspx 4, 8, [[C3]]
; CHECK-DAG: stxsspx 1, 8, [[C2]]
; CHECK: blr

; Fast-isel: every FMA is A-form.  Note that the offset captures are numbered
; differently from the default-pipeline expectations above: here C3 holds 4
; and C1 holds 12.
; CHECK-FISL-LABEL: @test4sp
; CHECK-FISL-DAG: fmr [[F1:[0-9]+]], 1
; CHECK-FISL-DAG: xsmaddasp [[F1]], 2, 3
; CHECK-FISL-DAG: stxsspx 0, 0, 8
; CHECK-FISL-DAG: fmr [[F1]], 1
; CHECK-FISL-DAG: xsmaddasp [[F1]], 2, 4
; CHECK-FISL-DAG: li [[C3:[0-9]+]], 4
; CHECK-FISL-DAG: stxsspx 0, 8, [[C3]]
; CHECK-FISL-DAG: xsmaddasp 0, 2, 3
; CHECK-FISL-DAG: li [[C1:[0-9]+]], 12
; CHECK-FISL-DAG: stxsspx 0, 8, [[C1]]
; CHECK-FISL-DAG: xsmaddasp 1, 2, 5
; CHECK-FISL-DAG: li [[C2:[0-9]+]], 8
; CHECK-FISL-DAG: stxsspx 1, 8, [[C2]]
; CHECK-FISL: blr
}

; Declaration of the single-precision FMA intrinsic called by every test.
; NOTE(review): attribute group #0 is referenced here and on each function;
; confirm that its definition is present elsewhere in this file.
declare float @llvm.fma.f32(float, float, float) #0
