1 //===-- Thumb2ITBlockPass.cpp - Insert Thumb-2 IT blocks ------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "ARM.h"
11 #include "ARMMachineFunctionInfo.h"
12 #include "ARMSubtarget.h"
13 #include "MCTargetDesc/ARMBaseInfo.h"
14 #include "Thumb2InstrInfo.h"
15 #include "llvm/ADT/SmallSet.h"
16 #include "llvm/ADT/SmallVector.h"
17 #include "llvm/ADT/Statistic.h"
18 #include "llvm/ADT/StringRef.h"
19 #include "llvm/CodeGen/MachineBasicBlock.h"
20 #include "llvm/CodeGen/MachineFunction.h"
21 #include "llvm/CodeGen/MachineFunctionPass.h"
22 #include "llvm/CodeGen/MachineInstr.h"
23 #include "llvm/CodeGen/MachineInstrBuilder.h"
24 #include "llvm/CodeGen/MachineInstrBundle.h"
25 #include "llvm/CodeGen/MachineOperand.h"
26 #include "llvm/IR/DebugLoc.h"
27 #include "llvm/MC/MCInstrDesc.h"
28 #include "llvm/MC/MCRegisterInfo.h"
29 #include <cassert>
30 #include <new>
31 
32 using namespace llvm;
33 
34 #define DEBUG_TYPE "thumb2-it"
35 
36 STATISTIC(NumITs,        "Number of IT blocks inserted");
37 STATISTIC(NumMovedInsts, "Number of predicated instructions moved");
38 
39 namespace {
40 
41   class Thumb2ITBlockPass : public MachineFunctionPass {
42   public:
43     static char ID;
44 
45     bool restrictIT;
46     const Thumb2InstrInfo *TII;
47     const TargetRegisterInfo *TRI;
48     ARMFunctionInfo *AFI;
49 
Thumb2ITBlockPass()50     Thumb2ITBlockPass() : MachineFunctionPass(ID) {}
51 
52     bool runOnMachineFunction(MachineFunction &Fn) override;
53 
getRequiredProperties() const54     MachineFunctionProperties getRequiredProperties() const override {
55       return MachineFunctionProperties().set(
56           MachineFunctionProperties::Property::NoVRegs);
57     }
58 
getPassName() const59     StringRef getPassName() const override {
60       return "Thumb IT blocks insertion pass";
61     }
62 
63   private:
64     bool MoveCopyOutOfITBlock(MachineInstr *MI,
65                               ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
66                               SmallSet<unsigned, 4> &Defs,
67                               SmallSet<unsigned, 4> &Uses);
68     bool InsertITInstructions(MachineBasicBlock &MBB);
69   };
70 
71   char Thumb2ITBlockPass::ID = 0;
72 
73 } // end anonymous namespace
74 
75 /// TrackDefUses - Tracking what registers are being defined and used by
76 /// instructions in the IT block. This also tracks "dependencies", i.e. uses
77 /// in the IT block that are defined before the IT instruction.
TrackDefUses(MachineInstr * MI,SmallSet<unsigned,4> & Defs,SmallSet<unsigned,4> & Uses,const TargetRegisterInfo * TRI)78 static void TrackDefUses(MachineInstr *MI,
79                          SmallSet<unsigned, 4> &Defs,
80                          SmallSet<unsigned, 4> &Uses,
81                          const TargetRegisterInfo *TRI) {
82   SmallVector<unsigned, 4> LocalDefs;
83   SmallVector<unsigned, 4> LocalUses;
84 
85   for (unsigned i = 0, e = MI->getNumOperands(); i != e; ++i) {
86     MachineOperand &MO = MI->getOperand(i);
87     if (!MO.isReg())
88       continue;
89     unsigned Reg = MO.getReg();
90     if (!Reg || Reg == ARM::ITSTATE || Reg == ARM::SP)
91       continue;
92     if (MO.isUse())
93       LocalUses.push_back(Reg);
94     else
95       LocalDefs.push_back(Reg);
96   }
97 
98   for (unsigned i = 0, e = LocalUses.size(); i != e; ++i) {
99     unsigned Reg = LocalUses[i];
100     for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
101          Subreg.isValid(); ++Subreg)
102       Uses.insert(*Subreg);
103   }
104 
105   for (unsigned i = 0, e = LocalDefs.size(); i != e; ++i) {
106     unsigned Reg = LocalDefs[i];
107     for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
108          Subreg.isValid(); ++Subreg)
109       Defs.insert(*Subreg);
110     if (Reg == ARM::CPSR)
111       continue;
112   }
113 }
114 
115 /// Clear kill flags for any uses in the given set.  This will likely
116 /// conservatively remove more kill flags than are necessary, but removing them
117 /// is safer than incorrect kill flags remaining on instructions.
ClearKillFlags(MachineInstr * MI,SmallSet<unsigned,4> & Uses)118 static void ClearKillFlags(MachineInstr *MI, SmallSet<unsigned, 4> &Uses) {
119   for (MachineOperand &MO : MI->operands()) {
120     if (!MO.isReg() || MO.isDef() || !MO.isKill())
121       continue;
122     if (!Uses.count(MO.getReg()))
123       continue;
124     MO.setIsKill(false);
125   }
126 }
127 
isCopy(MachineInstr * MI)128 static bool isCopy(MachineInstr *MI) {
129   switch (MI->getOpcode()) {
130   default:
131     return false;
132   case ARM::MOVr:
133   case ARM::MOVr_TC:
134   case ARM::tMOVr:
135   case ARM::t2MOVr:
136     return true;
137   }
138 }
139 
140 bool
MoveCopyOutOfITBlock(MachineInstr * MI,ARMCC::CondCodes CC,ARMCC::CondCodes OCC,SmallSet<unsigned,4> & Defs,SmallSet<unsigned,4> & Uses)141 Thumb2ITBlockPass::MoveCopyOutOfITBlock(MachineInstr *MI,
142                                       ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
143                                         SmallSet<unsigned, 4> &Defs,
144                                         SmallSet<unsigned, 4> &Uses) {
145   if (!isCopy(MI))
146     return false;
147   // llvm models select's as two-address instructions. That means a copy
148   // is inserted before a t2MOVccr, etc. If the copy is scheduled in
149   // between selects we would end up creating multiple IT blocks.
150   assert(MI->getOperand(0).getSubReg() == 0 &&
151          MI->getOperand(1).getSubReg() == 0 &&
152          "Sub-register indices still around?");
153 
154   unsigned DstReg = MI->getOperand(0).getReg();
155   unsigned SrcReg = MI->getOperand(1).getReg();
156 
157   // First check if it's safe to move it.
158   if (Uses.count(DstReg) || Defs.count(SrcReg))
159     return false;
160 
161   // If the CPSR is defined by this copy, then we don't want to move it. E.g.,
162   // if we have:
163   //
164   //   movs  r1, r1
165   //   rsb   r1, 0
166   //   movs  r2, r2
167   //   rsb   r2, 0
168   //
169   // we don't want this to be converted to:
170   //
171   //   movs  r1, r1
172   //   movs  r2, r2
173   //   itt   mi
174   //   rsb   r1, 0
175   //   rsb   r2, 0
176   //
177   const MCInstrDesc &MCID = MI->getDesc();
178   if (MI->hasOptionalDef() &&
179       MI->getOperand(MCID.getNumOperands() - 1).getReg() == ARM::CPSR)
180     return false;
181 
182   // Then peek at the next instruction to see if it's predicated on CC or OCC.
183   // If not, then there is nothing to be gained by moving the copy.
184   MachineBasicBlock::iterator I = MI; ++I;
185   MachineBasicBlock::iterator E = MI->getParent()->end();
186   while (I != E && I->isDebugInstr())
187     ++I;
188   if (I != E) {
189     unsigned NPredReg = 0;
190     ARMCC::CondCodes NCC = getITInstrPredicate(*I, NPredReg);
191     if (NCC == CC || NCC == OCC)
192       return true;
193   }
194   return false;
195 }
196 
InsertITInstructions(MachineBasicBlock & MBB)197 bool Thumb2ITBlockPass::InsertITInstructions(MachineBasicBlock &MBB) {
198   bool Modified = false;
199 
200   SmallSet<unsigned, 4> Defs;
201   SmallSet<unsigned, 4> Uses;
202   MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end();
203   while (MBBI != E) {
204     MachineInstr *MI = &*MBBI;
205     DebugLoc dl = MI->getDebugLoc();
206     unsigned PredReg = 0;
207     ARMCC::CondCodes CC = getITInstrPredicate(*MI, PredReg);
208     if (CC == ARMCC::AL) {
209       ++MBBI;
210       continue;
211     }
212 
213     Defs.clear();
214     Uses.clear();
215     TrackDefUses(MI, Defs, Uses, TRI);
216 
217     // Insert an IT instruction.
218     MachineInstrBuilder MIB = BuildMI(MBB, MBBI, dl, TII->get(ARM::t2IT))
219       .addImm(CC);
220 
221     // Add implicit use of ITSTATE to IT block instructions.
222     MI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
223                                              true/*isImp*/, false/*isKill*/));
224 
225     MachineInstr *LastITMI = MI;
226     MachineBasicBlock::iterator InsertPos = MIB.getInstr();
227     ++MBBI;
228 
229     // Form IT block.
230     ARMCC::CondCodes OCC = ARMCC::getOppositeCondition(CC);
231     unsigned Mask = 0, Pos = 3;
232 
233     // v8 IT blocks are limited to one conditional op unless -arm-no-restrict-it
234     // is set: skip the loop
235     if (!restrictIT) {
236       // Branches, including tricky ones like LDM_RET, need to end an IT
237       // block so check the instruction we just put in the block.
238       for (; MBBI != E && Pos &&
239              (!MI->isBranch() && !MI->isReturn()) ; ++MBBI) {
240         if (MBBI->isDebugInstr())
241           continue;
242 
243         MachineInstr *NMI = &*MBBI;
244         MI = NMI;
245 
246         unsigned NPredReg = 0;
247         ARMCC::CondCodes NCC = getITInstrPredicate(*NMI, NPredReg);
248         if (NCC == CC || NCC == OCC) {
249           Mask |= (NCC & 1) << Pos;
250           // Add implicit use of ITSTATE.
251           NMI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
252                                                  true/*isImp*/, false/*isKill*/));
253           LastITMI = NMI;
254         } else {
255           if (NCC == ARMCC::AL &&
256               MoveCopyOutOfITBlock(NMI, CC, OCC, Defs, Uses)) {
257             --MBBI;
258             MBB.remove(NMI);
259             MBB.insert(InsertPos, NMI);
260             ClearKillFlags(MI, Uses);
261             ++NumMovedInsts;
262             continue;
263           }
264           break;
265         }
266         TrackDefUses(NMI, Defs, Uses, TRI);
267         --Pos;
268       }
269     }
270 
271     // Finalize IT mask.
272     Mask |= (1 << Pos);
273     // Tag along (firstcond[0] << 4) with the mask.
274     Mask |= (CC & 1) << 4;
275     MIB.addImm(Mask);
276 
277     // Last instruction in IT block kills ITSTATE.
278     LastITMI->findRegisterUseOperand(ARM::ITSTATE)->setIsKill();
279 
280     // Finalize the bundle.
281     finalizeBundle(MBB, InsertPos.getInstrIterator(),
282                    ++LastITMI->getIterator());
283 
284     Modified = true;
285     ++NumITs;
286   }
287 
288   return Modified;
289 }
290 
runOnMachineFunction(MachineFunction & Fn)291 bool Thumb2ITBlockPass::runOnMachineFunction(MachineFunction &Fn) {
292   const ARMSubtarget &STI =
293       static_cast<const ARMSubtarget &>(Fn.getSubtarget());
294   if (!STI.isThumb2())
295     return false;
296   AFI = Fn.getInfo<ARMFunctionInfo>();
297   TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo());
298   TRI = STI.getRegisterInfo();
299   restrictIT = STI.restrictIT();
300 
301   if (!AFI->isThumbFunction())
302     return false;
303 
304   bool Modified = false;
305   for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E; ) {
306     MachineBasicBlock &MBB = *MFI;
307     ++MFI;
308     Modified |= InsertITInstructions(MBB);
309   }
310 
311   if (Modified)
312     AFI->setHasITBlocks(true);
313 
314   return Modified;
315 }
316 
317 /// createThumb2ITBlockPass - Returns an instance of the Thumb2 IT blocks
318 /// insertion pass.
createThumb2ITBlockPass()319 FunctionPass *llvm::createThumb2ITBlockPass() {
320   return new Thumb2ITBlockPass();
321 }
322