//===-- AMDGPUInstPrinter.cpp - AMDGPU MC Inst -> ASM ---------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // // \file //===----------------------------------------------------------------------===// #include "AMDGPUInstPrinter.h" #include "MCTargetDesc/AMDGPUMCTargetDesc.h" #include "SIDefines.h" #include "llvm/MC/MCExpr.h" #include "llvm/MC/MCInst.h" #include "llvm/MC/MCInstrInfo.h" #include "llvm/MC/MCRegisterInfo.h" #include "llvm/Support/MathExtras.h" using namespace llvm; void AMDGPUInstPrinter::printInst(const MCInst *MI, raw_ostream &OS, StringRef Annot, const MCSubtargetInfo &STI) { OS.flush(); printInstruction(MI, OS); printAnnotation(OS, Annot); } void AMDGPUInstPrinter::printU8ImmOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { O << formatHex(MI->getOperand(OpNo).getImm() & 0xff); } void AMDGPUInstPrinter::printU16ImmOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { O << formatHex(MI->getOperand(OpNo).getImm() & 0xffff); } void AMDGPUInstPrinter::printU32ImmOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { O << formatHex(MI->getOperand(OpNo).getImm() & 0xffffffff); } void AMDGPUInstPrinter::printU8ImmDecOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { O << formatDec(MI->getOperand(OpNo).getImm() & 0xff); } void AMDGPUInstPrinter::printU16ImmDecOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { O << formatDec(MI->getOperand(OpNo).getImm() & 0xffff); } void AMDGPUInstPrinter::printOffen(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " offen"; } void AMDGPUInstPrinter::printIdxen(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " idxen"; } void AMDGPUInstPrinter::printAddr64(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " addr64"; } void AMDGPUInstPrinter::printMBUFOffset(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) { O << " offset:"; printU16ImmDecOperand(MI, OpNo, O); } } void AMDGPUInstPrinter::printDSOffset(const MCInst *MI, unsigned OpNo, raw_ostream &O) { uint16_t Imm = MI->getOperand(OpNo).getImm(); if (Imm != 0) { O << " offset:"; printU16ImmDecOperand(MI, OpNo, O); } } void AMDGPUInstPrinter::printDSOffset0(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) { O << " offset0:"; printU8ImmDecOperand(MI, OpNo, O); } } void AMDGPUInstPrinter::printDSOffset1(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) { O << " offset1:"; printU8ImmDecOperand(MI, OpNo, O); } } void AMDGPUInstPrinter::printGDS(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " gds"; } void AMDGPUInstPrinter::printGLC(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " glc"; } void AMDGPUInstPrinter::printSLC(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " slc"; } void AMDGPUInstPrinter::printTFE(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " tfe"; } void AMDGPUInstPrinter::printRegOperand(unsigned reg, raw_ostream &O, const MCRegisterInfo &MRI) { switch (reg) { case AMDGPU::VCC: O << "vcc"; return; case AMDGPU::SCC: O << "scc"; return; case AMDGPU::EXEC: O << "exec"; return; case AMDGPU::M0: O << "m0"; return; case AMDGPU::FLAT_SCR: O << "flat_scratch"; return; case AMDGPU::VCC_LO: O << "vcc_lo"; return; case AMDGPU::VCC_HI: O << "vcc_hi"; return; case AMDGPU::EXEC_LO: O << "exec_lo"; return; case AMDGPU::EXEC_HI: O << "exec_hi"; return; case AMDGPU::FLAT_SCR_LO: O << "flat_scratch_lo"; return; case AMDGPU::FLAT_SCR_HI: O << "flat_scratch_hi"; return; default: break; } char Type; unsigned NumRegs; if (MRI.getRegClass(AMDGPU::VGPR_32RegClassID).contains(reg)) { Type = 'v'; NumRegs = 1; } else if (MRI.getRegClass(AMDGPU::SGPR_32RegClassID).contains(reg)) { Type = 's'; NumRegs = 1; } else if (MRI.getRegClass(AMDGPU::VReg_64RegClassID).contains(reg)) { Type = 'v'; NumRegs = 2; } else if (MRI.getRegClass(AMDGPU::SReg_64RegClassID).contains(reg)) { Type = 's'; NumRegs = 2; } else if (MRI.getRegClass(AMDGPU::VReg_128RegClassID).contains(reg)) { Type = 'v'; NumRegs = 4; } else if (MRI.getRegClass(AMDGPU::SReg_128RegClassID).contains(reg)) { Type = 's'; NumRegs = 4; } else if (MRI.getRegClass(AMDGPU::VReg_96RegClassID).contains(reg)) { Type = 'v'; NumRegs = 3; } else if (MRI.getRegClass(AMDGPU::VReg_256RegClassID).contains(reg)) { Type = 'v'; NumRegs = 8; } else if (MRI.getRegClass(AMDGPU::SReg_256RegClassID).contains(reg)) { Type = 's'; NumRegs = 8; } else if (MRI.getRegClass(AMDGPU::VReg_512RegClassID).contains(reg)) { Type = 'v'; NumRegs = 16; } else if (MRI.getRegClass(AMDGPU::SReg_512RegClassID).contains(reg)) { Type = 's'; NumRegs = 16; } else { O << getRegisterName(reg); return; } // The low 8 bits of the encoding value is the register index, for both VGPRs // and SGPRs. unsigned RegIdx = MRI.getEncodingValue(reg) & ((1 << 8) - 1); if (NumRegs == 1) { O << Type << RegIdx; return; } O << Type << '[' << RegIdx << ':' << (RegIdx + NumRegs - 1) << ']'; } void AMDGPUInstPrinter::printVOPDst(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3) O << "_e64 "; else O << "_e32 "; printOperand(MI, OpNo, O); } void AMDGPUInstPrinter::printImmediate32(uint32_t Imm, raw_ostream &O) { int32_t SImm = static_cast(Imm); if (SImm >= -16 && SImm <= 64) { O << SImm; return; } if (Imm == FloatToBits(0.0f)) O << "0.0"; else if (Imm == FloatToBits(1.0f)) O << "1.0"; else if (Imm == FloatToBits(-1.0f)) O << "-1.0"; else if (Imm == FloatToBits(0.5f)) O << "0.5"; else if (Imm == FloatToBits(-0.5f)) O << "-0.5"; else if (Imm == FloatToBits(2.0f)) O << "2.0"; else if (Imm == FloatToBits(-2.0f)) O << "-2.0"; else if (Imm == FloatToBits(4.0f)) O << "4.0"; else if (Imm == FloatToBits(-4.0f)) O << "-4.0"; else O << formatHex(static_cast(Imm)); } void AMDGPUInstPrinter::printImmediate64(uint64_t Imm, raw_ostream &O) { int64_t SImm = static_cast(Imm); if (SImm >= -16 && SImm <= 64) { O << SImm; return; } if (Imm == DoubleToBits(0.0)) O << "0.0"; else if (Imm == DoubleToBits(1.0)) O << "1.0"; else if (Imm == DoubleToBits(-1.0)) O << "-1.0"; else if (Imm == DoubleToBits(0.5)) O << "0.5"; else if (Imm == DoubleToBits(-0.5)) O << "-0.5"; else if (Imm == DoubleToBits(2.0)) O << "2.0"; else if (Imm == DoubleToBits(-2.0)) O << "-2.0"; else if (Imm == DoubleToBits(4.0)) O << "4.0"; else if (Imm == DoubleToBits(-4.0)) O << "-4.0"; else { assert(isUInt<32>(Imm)); // In rare situations, we will have a 32-bit literal in a 64-bit // operand. This is technically allowed for the encoding of s_mov_b64. O << formatHex(static_cast(Imm)); } } void AMDGPUInstPrinter::printOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { const MCOperand &Op = MI->getOperand(OpNo); if (Op.isReg()) { switch (Op.getReg()) { // This is the default predicate state, so we don't need to print it. case AMDGPU::PRED_SEL_OFF: break; default: printRegOperand(Op.getReg(), O, MRI); break; } } else if (Op.isImm()) { const MCInstrDesc &Desc = MII.get(MI->getOpcode()); int RCID = Desc.OpInfo[OpNo].RegClass; if (RCID != -1) { const MCRegisterClass &ImmRC = MRI.getRegClass(RCID); if (ImmRC.getSize() == 4) printImmediate32(Op.getImm(), O); else if (ImmRC.getSize() == 8) printImmediate64(Op.getImm(), O); else llvm_unreachable("Invalid register class size"); } else if (Desc.OpInfo[OpNo].OperandType == MCOI::OPERAND_IMMEDIATE) { printImmediate32(Op.getImm(), O); } else { // We hit this for the immediate instruction bits that don't yet have a // custom printer. // TODO: Eventually this should be unnecessary. O << formatDec(Op.getImm()); } } else if (Op.isFPImm()) { // We special case 0.0 because otherwise it will be printed as an integer. if (Op.getFPImm() == 0.0) O << "0.0"; else { const MCInstrDesc &Desc = MII.get(MI->getOpcode()); const MCRegisterClass &ImmRC = MRI.getRegClass(Desc.OpInfo[OpNo].RegClass); if (ImmRC.getSize() == 4) printImmediate32(FloatToBits(Op.getFPImm()), O); else if (ImmRC.getSize() == 8) printImmediate64(DoubleToBits(Op.getFPImm()), O); else llvm_unreachable("Invalid register class size"); } } else if (Op.isExpr()) { const MCExpr *Exp = Op.getExpr(); Exp->print(O, &MAI); } else { llvm_unreachable("unknown operand type in printOperand"); } } void AMDGPUInstPrinter::printOperandAndMods(const MCInst *MI, unsigned OpNo, raw_ostream &O) { unsigned InputModifiers = MI->getOperand(OpNo).getImm(); if (InputModifiers & SISrcMods::NEG) O << '-'; if (InputModifiers & SISrcMods::ABS) O << '|'; printOperand(MI, OpNo + 1, O); if (InputModifiers & SISrcMods::ABS) O << '|'; } void AMDGPUInstPrinter::printInterpSlot(const MCInst *MI, unsigned OpNum, raw_ostream &O) { unsigned Imm = MI->getOperand(OpNum).getImm(); if (Imm == 2) { O << "P0"; } else if (Imm == 1) { O << "P20"; } else if (Imm == 0) { O << "P10"; } else { llvm_unreachable("Invalid interpolation parameter slot"); } } void AMDGPUInstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printOperand(MI, OpNo, O); O << ", "; printOperand(MI, OpNo + 1, O); } void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo, raw_ostream &O, StringRef Asm, StringRef Default) { const MCOperand &Op = MI->getOperand(OpNo); assert(Op.isImm()); if (Op.getImm() == 1) { O << Asm; } else { O << Default; } } void AMDGPUInstPrinter::printAbs(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "|"); } void AMDGPUInstPrinter::printClamp(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "_SAT"); } void AMDGPUInstPrinter::printClampSI(const MCInst *MI, unsigned OpNo, raw_ostream &O) { if (MI->getOperand(OpNo).getImm()) O << " clamp"; } void AMDGPUInstPrinter::printOModSI(const MCInst *MI, unsigned OpNo, raw_ostream &O) { int Imm = MI->getOperand(OpNo).getImm(); if (Imm == SIOutMods::MUL2) O << " mul:2"; else if (Imm == SIOutMods::MUL4) O << " mul:4"; else if (Imm == SIOutMods::DIV2) O << " div:2"; } void AMDGPUInstPrinter::printLiteral(const MCInst *MI, unsigned OpNo, raw_ostream &O) { int32_t Imm = MI->getOperand(OpNo).getImm(); O << Imm << '(' << BitsToFloat(Imm) << ')'; } void AMDGPUInstPrinter::printLast(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "*", " "); } void AMDGPUInstPrinter::printNeg(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "-"); } void AMDGPUInstPrinter::printOMOD(const MCInst *MI, unsigned OpNo, raw_ostream &O) { switch (MI->getOperand(OpNo).getImm()) { default: break; case 1: O << " * 2.0"; break; case 2: O << " * 4.0"; break; case 3: O << " / 2.0"; break; } } void AMDGPUInstPrinter::printRel(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "+"); } void AMDGPUInstPrinter::printUpdateExecMask(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "ExecMask,"); } void AMDGPUInstPrinter::printUpdatePred(const MCInst *MI, unsigned OpNo, raw_ostream &O) { printIfSet(MI, OpNo, O, "Pred,"); } void AMDGPUInstPrinter::printWrite(const MCInst *MI, unsigned OpNo, raw_ostream &O) { const MCOperand &Op = MI->getOperand(OpNo); if (Op.getImm() == 0) { O << " (MASKED)"; } } void AMDGPUInstPrinter::printSel(const MCInst *MI, unsigned OpNo, raw_ostream &O) { const char * chans = "XYZW"; int sel = MI->getOperand(OpNo).getImm(); int chan = sel & 3; sel >>= 2; if (sel >= 512) { sel -= 512; int cb = sel >> 12; sel &= 4095; O << cb << '[' << sel << ']'; } else if (sel >= 448) { sel -= 448; O << sel; } else if (sel >= 0){ O << sel; } if (sel >= 0) O << '.' << chans[chan]; } void AMDGPUInstPrinter::printBankSwizzle(const MCInst *MI, unsigned OpNo, raw_ostream &O) { int BankSwizzle = MI->getOperand(OpNo).getImm(); switch (BankSwizzle) { case 1: O << "BS:VEC_021/SCL_122"; break; case 2: O << "BS:VEC_120/SCL_212"; break; case 3: O << "BS:VEC_102/SCL_221"; break; case 4: O << "BS:VEC_201"; break; case 5: O << "BS:VEC_210"; break; default: break; } return; } void AMDGPUInstPrinter::printRSel(const MCInst *MI, unsigned OpNo, raw_ostream &O) { unsigned Sel = MI->getOperand(OpNo).getImm(); switch (Sel) { case 0: O << 'X'; break; case 1: O << 'Y'; break; case 2: O << 'Z'; break; case 3: O << 'W'; break; case 4: O << '0'; break; case 5: O << '1'; break; case 7: O << '_'; break; default: break; } } void AMDGPUInstPrinter::printCT(const MCInst *MI, unsigned OpNo, raw_ostream &O) { unsigned CT = MI->getOperand(OpNo).getImm(); switch (CT) { case 0: O << 'U'; break; case 1: O << 'N'; break; default: break; } } void AMDGPUInstPrinter::printKCache(const MCInst *MI, unsigned OpNo, raw_ostream &O) { int KCacheMode = MI->getOperand(OpNo).getImm(); if (KCacheMode > 0) { int KCacheBank = MI->getOperand(OpNo - 2).getImm(); O << "CB" << KCacheBank << ':'; int KCacheAddr = MI->getOperand(OpNo + 2).getImm(); int LineSize = (KCacheMode == 1) ? 16 : 32; O << KCacheAddr * 16 << '-' << KCacheAddr * 16 + LineSize; } } void AMDGPUInstPrinter::printSendMsg(const MCInst *MI, unsigned OpNo, raw_ostream &O) { unsigned SImm16 = MI->getOperand(OpNo).getImm(); unsigned Msg = SImm16 & 0xF; if (Msg == 2 || Msg == 3) { unsigned Op = (SImm16 >> 4) & 0xF; if (Msg == 3) O << "Gs_done("; else O << "Gs("; if (Op == 0) { O << "nop"; } else { unsigned Stream = (SImm16 >> 8) & 0x3; if (Op == 1) O << "cut"; else if (Op == 2) O << "emit"; else if (Op == 3) O << "emit-cut"; O << " stream " << Stream; } O << "), [m0] "; } else if (Msg == 1) O << "interrupt "; else if (Msg == 15) O << "system "; else O << "unknown(" << Msg << ") "; } void AMDGPUInstPrinter::printWaitFlag(const MCInst *MI, unsigned OpNo, raw_ostream &O) { // Note: Mask values are taken from SIInsertWaits.cpp and not from ISA docs // SIInsertWaits.cpp bits usage does not match ISA docs description but it // works so it might be a misprint in docs. unsigned SImm16 = MI->getOperand(OpNo).getImm(); unsigned Vmcnt = SImm16 & 0xF; unsigned Expcnt = (SImm16 >> 4) & 0xF; unsigned Lgkmcnt = (SImm16 >> 8) & 0xF; bool NeedSpace = false; if (Vmcnt != 0xF) { O << "vmcnt(" << Vmcnt << ')'; NeedSpace = true; } if (Expcnt != 0x7) { if (NeedSpace) O << ' '; O << "expcnt(" << Expcnt << ')'; NeedSpace = true; } if (Lgkmcnt != 0x7) { if (NeedSpace) O << ' '; O << "lgkmcnt(" << Lgkmcnt << ')'; } } #include "AMDGPUGenAsmWriter.inc"