1; RUN: llc -mtriple=x86_64-unknown-unknown -mattr=+mmx,+fma,+f16c,+avx512f -stop-after finalize-isel -o - %s | FileCheck %s 2; This test ensures that the MXCSR is implicitly used by MMX FP instructions. 3 4define x86_mmx @mxcsr_mmx(<4 x float> %a0) { 5; CHECK: MMX_CVTPS2PIirr %{{[0-9]}}, implicit $mxcsr 6; CHECK: MMX_CVTPI2PSirr %{{[0-9]}}, killed %{{[0-9]}}, implicit $mxcsr 7; CHECK: MMX_CVTTPS2PIirr killed %{{[0-9]}}, implicit $mxcsr 8; CHECK: MMX_CVTPI2PDirr killed %{{[0-9]$}} 9; CHECK: MMX_CVTPD2PIirr killed %{{[0-9]}}, implicit $mxcsr 10 %1 = call x86_mmx @llvm.x86.sse.cvtps2pi(<4 x float> %a0) 11 %2 = call <4 x float> @llvm.x86.sse.cvtpi2ps(<4 x float> %a0, x86_mmx %1) 12 %3 = call x86_mmx @llvm.x86.sse.cvttps2pi(<4 x float> %2) 13 %4 = call <2 x double> @llvm.x86.sse.cvtpi2pd(x86_mmx %3) 14 %5 = call x86_mmx @llvm.x86.sse.cvtpd2pi(<2 x double> %4) 15 ret x86_mmx %5 16} 17 18define half @mxcsr_f16c(float %a) { 19; CHECK: VCVTPS2PH{{.*}}mxcsr 20 %res = fptrunc float %a to half 21 ret half %res 22} 23 24define <4 x float> @mxcsr_fma_ss(<4 x float> %a, <4 x float> %b) { 25; CHECK: VFMADD{{.*}}mxcsr 26 %res = call <4 x float> @llvm.x86.fma.vfmadd.ss(<4 x float> %b, <4 x float> %a, <4 x float> 27%a) 28 ret <4 x float> %res 29} 30 31define <4 x float> @mxcsr_fma_ps(<4 x float> %a, <4 x float> %b) { 32; CHECK: VFMADD{{.*}}mxcsr 33 %res = call <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float> %b, <4 x float> %a, <4 x float> 34%a) 35 ret <4 x float> %res 36} 37 38define <8 x double> @mxcsr_fma_sae(<8 x double> %a, <8 x double> %b, <8 x double> %c) { 39; CHECK: VFMADD{{.*}}mxcsr 40 %res = call <8 x double> @llvm.x86.avx512.mask.vfmadd.pd.512(<8 x double> %a, <8 x double> %b, <8 x double> %c, i8 -1, i32 10) 41 ret <8 x double> %res 42} 43 44declare x86_mmx @llvm.x86.sse.cvtps2pi(<4 x float>) 45declare<4 x float> @llvm.x86.sse.cvtpi2ps(<4 x float>, x86_mmx) 46declare x86_mmx @llvm.x86.sse.cvttps2pi(<4 x float>) 47declare <2 x double> @llvm.x86.sse.cvtpi2pd(x86_mmx) 48declare x86_mmx @llvm.x86.sse.cvtpd2pi(<2 x double>) 49declare <4 x float> @llvm.x86.fma.vfmadd.ss(<4 x float>, <4 x float>, <4 x float>) 50declare <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float>, <4 x float>, <4 x float>) 51declare <8 x double> @llvm.x86.avx512.mask.vfmadd.pd.512(<8 x double>, <8 x double>, <8 x double>, i8, i32) 52