1 //===-- HexagonPeephole.cpp - Hexagon Peephole Optimiztions ---------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 // This peephole pass optimizes in the following cases.
9 // 1. Optimizes redundant sign extends for the following case
10 // Transform the following pattern
11 // %170 = SXTW %166
12 // ...
13 // %176 = COPY %170:isub_lo
14 //
15 // Into
16 // %176 = COPY %166
17 //
18 // 2. Optimizes redundant negation of predicates.
19 // %15 = CMPGTrr %6, %2
20 // ...
21 // %16 = NOT_p killed %15
22 // ...
23 // JMP_c killed %16, <%bb.1>, implicit dead %pc
24 //
25 // Into
26 // %15 = CMPGTrr %6, %2;
27 // ...
28 // JMP_cNot killed %15, <%bb.1>, implicit dead %pc;
29 //
30 // Note: The peephole pass makes the instrucstions like
31 // %170 = SXTW %166 or %16 = NOT_p killed %15
32 // redundant and relies on some form of dead removal instructions, like
33 // DCE or DIE to actually eliminate them.
34
35 //===----------------------------------------------------------------------===//
36
37 #include "Hexagon.h"
38 #include "HexagonTargetMachine.h"
39 #include "llvm/ADT/DenseMap.h"
40 #include "llvm/ADT/Statistic.h"
41 #include "llvm/CodeGen/MachineFunction.h"
42 #include "llvm/CodeGen/MachineFunctionPass.h"
43 #include "llvm/CodeGen/MachineInstrBuilder.h"
44 #include "llvm/CodeGen/MachineRegisterInfo.h"
45 #include "llvm/CodeGen/Passes.h"
46 #include "llvm/CodeGen/TargetInstrInfo.h"
47 #include "llvm/CodeGen/TargetRegisterInfo.h"
48 #include "llvm/IR/Constants.h"
49 #include "llvm/PassSupport.h"
50 #include "llvm/Support/CommandLine.h"
51 #include "llvm/Support/Debug.h"
52 #include "llvm/Support/raw_ostream.h"
53 #include "llvm/Target/TargetMachine.h"
54 #include <algorithm>
55
56 using namespace llvm;
57
58 #define DEBUG_TYPE "hexagon-peephole"
59
60 static cl::opt<bool> DisableHexagonPeephole("disable-hexagon-peephole",
61 cl::Hidden, cl::ZeroOrMore, cl::init(false),
62 cl::desc("Disable Peephole Optimization"));
63
64 static cl::opt<bool> DisablePNotP("disable-hexagon-pnotp",
65 cl::Hidden, cl::ZeroOrMore, cl::init(false),
66 cl::desc("Disable Optimization of PNotP"));
67
68 static cl::opt<bool> DisableOptSZExt("disable-hexagon-optszext",
69 cl::Hidden, cl::ZeroOrMore, cl::init(true),
70 cl::desc("Disable Optimization of Sign/Zero Extends"));
71
72 static cl::opt<bool> DisableOptExtTo64("disable-hexagon-opt-ext-to-64",
73 cl::Hidden, cl::ZeroOrMore, cl::init(true),
74 cl::desc("Disable Optimization of extensions to i64."));
75
76 namespace llvm {
77 FunctionPass *createHexagonPeephole();
78 void initializeHexagonPeepholePass(PassRegistry&);
79 }
80
81 namespace {
82 struct HexagonPeephole : public MachineFunctionPass {
83 const HexagonInstrInfo *QII;
84 const HexagonRegisterInfo *QRI;
85 const MachineRegisterInfo *MRI;
86
87 public:
88 static char ID;
HexagonPeephole__anon046e8f950111::HexagonPeephole89 HexagonPeephole() : MachineFunctionPass(ID) {
90 initializeHexagonPeepholePass(*PassRegistry::getPassRegistry());
91 }
92
93 bool runOnMachineFunction(MachineFunction &MF) override;
94
getPassName__anon046e8f950111::HexagonPeephole95 StringRef getPassName() const override {
96 return "Hexagon optimize redundant zero and size extends";
97 }
98
getAnalysisUsage__anon046e8f950111::HexagonPeephole99 void getAnalysisUsage(AnalysisUsage &AU) const override {
100 MachineFunctionPass::getAnalysisUsage(AU);
101 }
102 };
103 }
104
105 char HexagonPeephole::ID = 0;
106
107 INITIALIZE_PASS(HexagonPeephole, "hexagon-peephole", "Hexagon Peephole",
108 false, false)
109
runOnMachineFunction(MachineFunction & MF)110 bool HexagonPeephole::runOnMachineFunction(MachineFunction &MF) {
111 if (skipFunction(MF.getFunction()))
112 return false;
113
114 QII = static_cast<const HexagonInstrInfo *>(MF.getSubtarget().getInstrInfo());
115 QRI = MF.getSubtarget<HexagonSubtarget>().getRegisterInfo();
116 MRI = &MF.getRegInfo();
117
118 DenseMap<unsigned, unsigned> PeepholeMap;
119 DenseMap<unsigned, std::pair<unsigned, unsigned> > PeepholeDoubleRegsMap;
120
121 if (DisableHexagonPeephole) return false;
122
123 // Loop over all of the basic blocks.
124 for (MachineFunction::iterator MBBb = MF.begin(), MBBe = MF.end();
125 MBBb != MBBe; ++MBBb) {
126 MachineBasicBlock *MBB = &*MBBb;
127 PeepholeMap.clear();
128 PeepholeDoubleRegsMap.clear();
129
130 // Traverse the basic block.
131 for (auto I = MBB->begin(), E = MBB->end(), NextI = I; I != E; I = NextI) {
132 NextI = std::next(I);
133 MachineInstr &MI = *I;
134 // Look for sign extends:
135 // %170 = SXTW %166
136 if (!DisableOptSZExt && MI.getOpcode() == Hexagon::A2_sxtw) {
137 assert(MI.getNumOperands() == 2);
138 MachineOperand &Dst = MI.getOperand(0);
139 MachineOperand &Src = MI.getOperand(1);
140 unsigned DstReg = Dst.getReg();
141 unsigned SrcReg = Src.getReg();
142 // Just handle virtual registers.
143 if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
144 TargetRegisterInfo::isVirtualRegister(SrcReg)) {
145 // Map the following:
146 // %170 = SXTW %166
147 // PeepholeMap[170] = %166
148 PeepholeMap[DstReg] = SrcReg;
149 }
150 }
151
152 // Look for %170 = COMBINE_ir_V4 (0, %169)
153 // %170:DoublRegs, %169:IntRegs
154 if (!DisableOptExtTo64 && MI.getOpcode() == Hexagon::A4_combineir) {
155 assert(MI.getNumOperands() == 3);
156 MachineOperand &Dst = MI.getOperand(0);
157 MachineOperand &Src1 = MI.getOperand(1);
158 MachineOperand &Src2 = MI.getOperand(2);
159 if (Src1.getImm() != 0)
160 continue;
161 unsigned DstReg = Dst.getReg();
162 unsigned SrcReg = Src2.getReg();
163 PeepholeMap[DstReg] = SrcReg;
164 }
165
166 // Look for this sequence below
167 // %DoubleReg1 = LSRd_ri %DoubleReg0, 32
168 // %IntReg = COPY %DoubleReg1:isub_lo.
169 // and convert into
170 // %IntReg = COPY %DoubleReg0:isub_hi.
171 if (MI.getOpcode() == Hexagon::S2_lsr_i_p) {
172 assert(MI.getNumOperands() == 3);
173 MachineOperand &Dst = MI.getOperand(0);
174 MachineOperand &Src1 = MI.getOperand(1);
175 MachineOperand &Src2 = MI.getOperand(2);
176 if (Src2.getImm() != 32)
177 continue;
178 unsigned DstReg = Dst.getReg();
179 unsigned SrcReg = Src1.getReg();
180 PeepholeDoubleRegsMap[DstReg] =
181 std::make_pair(*&SrcReg, Hexagon::isub_hi);
182 }
183
184 // Look for P=NOT(P).
185 if (!DisablePNotP && MI.getOpcode() == Hexagon::C2_not) {
186 assert(MI.getNumOperands() == 2);
187 MachineOperand &Dst = MI.getOperand(0);
188 MachineOperand &Src = MI.getOperand(1);
189 unsigned DstReg = Dst.getReg();
190 unsigned SrcReg = Src.getReg();
191 // Just handle virtual registers.
192 if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
193 TargetRegisterInfo::isVirtualRegister(SrcReg)) {
194 // Map the following:
195 // %170 = NOT_xx %166
196 // PeepholeMap[170] = %166
197 PeepholeMap[DstReg] = SrcReg;
198 }
199 }
200
201 // Look for copy:
202 // %176 = COPY %170:isub_lo
203 if (!DisableOptSZExt && MI.isCopy()) {
204 assert(MI.getNumOperands() == 2);
205 MachineOperand &Dst = MI.getOperand(0);
206 MachineOperand &Src = MI.getOperand(1);
207
208 // Make sure we are copying the lower 32 bits.
209 if (Src.getSubReg() != Hexagon::isub_lo)
210 continue;
211
212 unsigned DstReg = Dst.getReg();
213 unsigned SrcReg = Src.getReg();
214 if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
215 TargetRegisterInfo::isVirtualRegister(SrcReg)) {
216 // Try to find in the map.
217 if (unsigned PeepholeSrc = PeepholeMap.lookup(SrcReg)) {
218 // Change the 1st operand.
219 MI.RemoveOperand(1);
220 MI.addOperand(MachineOperand::CreateReg(PeepholeSrc, false));
221 } else {
222 DenseMap<unsigned, std::pair<unsigned, unsigned> >::iterator DI =
223 PeepholeDoubleRegsMap.find(SrcReg);
224 if (DI != PeepholeDoubleRegsMap.end()) {
225 std::pair<unsigned,unsigned> PeepholeSrc = DI->second;
226 MI.RemoveOperand(1);
227 MI.addOperand(MachineOperand::CreateReg(
228 PeepholeSrc.first, false /*isDef*/, false /*isImp*/,
229 false /*isKill*/, false /*isDead*/, false /*isUndef*/,
230 false /*isEarlyClobber*/, PeepholeSrc.second));
231 }
232 }
233 }
234 }
235
236 // Look for Predicated instructions.
237 if (!DisablePNotP) {
238 bool Done = false;
239 if (QII->isPredicated(MI)) {
240 MachineOperand &Op0 = MI.getOperand(0);
241 unsigned Reg0 = Op0.getReg();
242 const TargetRegisterClass *RC0 = MRI->getRegClass(Reg0);
243 if (RC0->getID() == Hexagon::PredRegsRegClassID) {
244 // Handle instructions that have a prediate register in op0
245 // (most cases of predicable instructions).
246 if (TargetRegisterInfo::isVirtualRegister(Reg0)) {
247 // Try to find in the map.
248 if (unsigned PeepholeSrc = PeepholeMap.lookup(Reg0)) {
249 // Change the 1st operand and, flip the opcode.
250 MI.getOperand(0).setReg(PeepholeSrc);
251 MRI->clearKillFlags(PeepholeSrc);
252 int NewOp = QII->getInvertedPredicatedOpcode(MI.getOpcode());
253 MI.setDesc(QII->get(NewOp));
254 Done = true;
255 }
256 }
257 }
258 }
259
260 if (!Done) {
261 // Handle special instructions.
262 unsigned Op = MI.getOpcode();
263 unsigned NewOp = 0;
264 unsigned PR = 1, S1 = 2, S2 = 3; // Operand indices.
265
266 switch (Op) {
267 case Hexagon::C2_mux:
268 case Hexagon::C2_muxii:
269 NewOp = Op;
270 break;
271 case Hexagon::C2_muxri:
272 NewOp = Hexagon::C2_muxir;
273 break;
274 case Hexagon::C2_muxir:
275 NewOp = Hexagon::C2_muxri;
276 break;
277 }
278 if (NewOp) {
279 unsigned PSrc = MI.getOperand(PR).getReg();
280 if (unsigned POrig = PeepholeMap.lookup(PSrc)) {
281 BuildMI(*MBB, MI.getIterator(), MI.getDebugLoc(),
282 QII->get(NewOp), MI.getOperand(0).getReg())
283 .addReg(POrig)
284 .add(MI.getOperand(S2))
285 .add(MI.getOperand(S1));
286 MRI->clearKillFlags(POrig);
287 MI.eraseFromParent();
288 }
289 } // if (NewOp)
290 } // if (!Done)
291
292 } // if (!DisablePNotP)
293
294 } // Instruction
295 } // Basic Block
296 return true;
297 }
298
createHexagonPeephole()299 FunctionPass *llvm::createHexagonPeephole() {
300 return new HexagonPeephole();
301 }
302