1//===-- X86Instr3DNow.td - The 3DNow! Instruction Set ------*- tablegen -*-===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file describes the 3DNow! instruction set, which extends MMX to support 11// floating point and also adds a few more random instructions for good measure. 12// 13//===----------------------------------------------------------------------===// 14 15class I3DNow<bits<8> o, Format F, dag outs, dag ins, string asm, list<dag> pat> 16 : I<o, F, outs, ins, asm, pat>, Requires<[Has3DNow]> { 17} 18 19class I3DNow_binop<bits<8> o, Format F, dag ins, string Mnemonic, list<dag> pat> 20 : I3DNow<o, F, (outs VR64:$dst), ins, 21 !strconcat(Mnemonic, "\t{$src2, $dst|$dst, $src2}"), pat>, ThreeDNow { 22 let Constraints = "$src1 = $dst"; 23} 24 25class I3DNow_conv<bits<8> o, Format F, dag ins, string Mnemonic, list<dag> pat> 26 : I3DNow<o, F, (outs VR64:$dst), ins, 27 !strconcat(Mnemonic, "\t{$src, $dst|$dst, $src}"), pat>, ThreeDNow; 28 29multiclass I3DNow_binop_rm_int<bits<8> opc, string Mn, 30 X86FoldableSchedWrite sched, bit Commutable = 0, 31 string Ver = ""> { 32 let isCommutable = Commutable in 33 def rr : I3DNow_binop<opc, MRMSrcReg, (ins VR64:$src1, VR64:$src2), Mn, 34 [(set VR64:$dst, (!cast<Intrinsic>( 35 !strconcat("int_x86_3dnow", Ver, "_", Mn)) VR64:$src1, VR64:$src2))]>, 36 Sched<[sched]>; 37 def rm : I3DNow_binop<opc, MRMSrcMem, (ins VR64:$src1, i64mem:$src2), Mn, 38 [(set VR64:$dst, (!cast<Intrinsic>( 39 !strconcat("int_x86_3dnow", Ver, "_", Mn)) VR64:$src1, 40 (bitconvert (load_mmx addr:$src2))))]>, 41 Sched<[sched.Folded, ReadAfterLd]>; 42} 43 44multiclass I3DNow_conv_rm_int<bits<8> opc, string Mn, 45 X86FoldableSchedWrite sched, string Ver = ""> { 46 def rr : I3DNow_conv<opc, MRMSrcReg, (ins VR64:$src), Mn, 47 [(set VR64:$dst, (!cast<Intrinsic>( 48 !strconcat("int_x86_3dnow", Ver, "_", Mn)) VR64:$src))]>, 49 Sched<[sched]>; 50 def rm : I3DNow_conv<opc, MRMSrcMem, (ins i64mem:$src), Mn, 51 [(set VR64:$dst, (!cast<Intrinsic>( 52 !strconcat("int_x86_3dnow", Ver, "_", Mn)) 53 (bitconvert (load_mmx addr:$src))))]>, 54 Sched<[sched.Folded, ReadAfterLd]>; 55} 56 57defm PAVGUSB : I3DNow_binop_rm_int<0xBF, "pavgusb", SchedWriteVecALU.MMX, 1>; 58defm PF2ID : I3DNow_conv_rm_int<0x1D, "pf2id", WriteCvtPS2I>; 59defm PFACC : I3DNow_binop_rm_int<0xAE, "pfacc", WriteFAdd>; 60defm PFADD : I3DNow_binop_rm_int<0x9E, "pfadd", WriteFAdd, 1>; 61defm PFCMPEQ : I3DNow_binop_rm_int<0xB0, "pfcmpeq", WriteFAdd, 1>; 62defm PFCMPGE : I3DNow_binop_rm_int<0x90, "pfcmpge", WriteFAdd>; 63defm PFCMPGT : I3DNow_binop_rm_int<0xA0, "pfcmpgt", WriteFAdd>; 64defm PFMAX : I3DNow_binop_rm_int<0xA4, "pfmax", WriteFAdd>; 65defm PFMIN : I3DNow_binop_rm_int<0x94, "pfmin", WriteFAdd>; 66defm PFMUL : I3DNow_binop_rm_int<0xB4, "pfmul", WriteFAdd, 1>; 67defm PFRCP : I3DNow_conv_rm_int<0x96, "pfrcp", WriteFAdd>; 68defm PFRCPIT1 : I3DNow_binop_rm_int<0xA6, "pfrcpit1", WriteFAdd>; 69defm PFRCPIT2 : I3DNow_binop_rm_int<0xB6, "pfrcpit2", WriteFAdd>; 70defm PFRSQIT1 : I3DNow_binop_rm_int<0xA7, "pfrsqit1", WriteFAdd>; 71defm PFRSQRT : I3DNow_conv_rm_int<0x97, "pfrsqrt", WriteFAdd>; 72defm PFSUB : I3DNow_binop_rm_int<0x9A, "pfsub", WriteFAdd, 1>; 73defm PFSUBR : I3DNow_binop_rm_int<0xAA, "pfsubr", WriteFAdd, 1>; 74defm PI2FD : I3DNow_conv_rm_int<0x0D, "pi2fd", WriteCvtI2PS>; 75defm PMULHRW : I3DNow_binop_rm_int<0xB7, "pmulhrw", SchedWriteVecIMul.MMX, 1>; 76 77let SchedRW = [WriteEMMS] in 78def FEMMS : I3DNow<0x0E, RawFrm, (outs), (ins), "femms", 79 [(int_x86_mmx_femms)]>, TB; 80 81// PREFETCHWT1 is supported we want to use it for everything but T0. 82def PrefetchWLevel : PatFrag<(ops), (i32 imm), [{ 83 return N->getSExtValue() == 3 || !Subtarget->hasPREFETCHWT1(); 84}]>; 85 86// Use PREFETCHWT1 for NTA, T2, T1. 87def PrefetchWT1Level : ImmLeaf<i32, [{ 88 return Imm < 3; 89}]>; 90 91let SchedRW = [WriteLoad] in { 92let Predicates = [Has3DNow, NoSSEPrefetch] in 93def PREFETCH : I3DNow<0x0D, MRM0m, (outs), (ins i8mem:$addr), 94 "prefetch\t$addr", 95 [(prefetch addr:$addr, imm, imm, (i32 1))]>, TB; 96 97def PREFETCHW : I<0x0D, MRM1m, (outs), (ins i8mem:$addr), "prefetchw\t$addr", 98 [(prefetch addr:$addr, (i32 1), (i32 PrefetchWLevel), (i32 1))]>, 99 TB, Requires<[HasPrefetchW]>; 100 101def PREFETCHWT1 : I<0x0D, MRM2m, (outs), (ins i8mem:$addr), "prefetchwt1\t$addr", 102 [(prefetch addr:$addr, (i32 1), (i32 PrefetchWT1Level), (i32 1))]>, 103 TB, Requires<[HasPREFETCHWT1]>; 104} 105 106// "3DNowA" instructions 107defm PF2IW : I3DNow_conv_rm_int<0x1C, "pf2iw", WriteCvtPS2I, "a">; 108defm PI2FW : I3DNow_conv_rm_int<0x0C, "pi2fw", WriteCvtI2PS, "a">; 109defm PFNACC : I3DNow_binop_rm_int<0x8A, "pfnacc", WriteFAdd, 0, "a">; 110defm PFPNACC : I3DNow_binop_rm_int<0x8E, "pfpnacc", WriteFAdd, 0, "a">; 111defm PSWAPD : I3DNow_conv_rm_int<0xBB, "pswapd", SchedWriteShuffle.MMX, "a">; 112