//===-- Mips16ISelLowering.cpp - Mips16 DAG Lowering Implementation ------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Subclass of MipsTargetLowering specialized for mips16.
11 //
12 //===----------------------------------------------------------------------===//
13 #include "Mips16ISelLowering.h"
14 #include "MCTargetDesc/MipsBaseInfo.h"
15 #include "Mips16HardFloatInfo.h"
16 #include "MipsMachineFunction.h"
17 #include "MipsRegisterInfo.h"
18 #include "MipsTargetMachine.h"
19 #include "llvm/ADT/StringRef.h"
20 #include "llvm/CodeGen/MachineInstrBuilder.h"
21 #include "llvm/Support/CommandLine.h"
22 #include "llvm/Target/TargetInstrInfo.h"
23 #include <string>
24
25 using namespace llvm;
26
27 #define DEBUG_TYPE "mips-lower"
28
29 static cl::opt<bool> DontExpandCondPseudos16(
30 "mips16-dont-expand-cond-pseudo",
31 cl::init(false),
32 cl::desc("Don't expand conditional move related "
33 "pseudos for Mips 16"),
34 cl::Hidden);
35
36 namespace {
37 struct Mips16Libcall {
38 RTLIB::Libcall Libcall;
39 const char *Name;
40
operator <__anon1351efc40111::Mips16Libcall41 bool operator<(const Mips16Libcall &RHS) const {
42 return std::strcmp(Name, RHS.Name) < 0;
43 }
44 };
45
/// One row of the intrinsic helper table: the name of a called routine and
/// the name of the call stub to use for it.  Ordering and equality look at
/// Name only; Helper never takes part in a comparison.
struct Mips16IntrinsicHelperType {
  const char *Name;
  const char *Helper;

  /// True when this row's name sorts strictly before RHS's name.
  bool operator<(const Mips16IntrinsicHelperType &RHS) const {
    return compareNames(RHS) < 0;
  }

  /// True when both rows carry the same name.
  bool operator==(const Mips16IntrinsicHelperType &RHS) const {
    return compareNames(RHS) == 0;
  }

private:
  /// std::strcmp-style three-way comparison of the two names.
  int compareNames(const Mips16IntrinsicHelperType &RHS) const {
    return std::strcmp(Name, RHS.Name);
  }
};
57 }
58
59 // Libcalls for which no helper is generated. Sorted by name for binary search.
60 static const Mips16Libcall HardFloatLibCalls[] = {
61 { RTLIB::ADD_F64, "__mips16_adddf3" },
62 { RTLIB::ADD_F32, "__mips16_addsf3" },
63 { RTLIB::DIV_F64, "__mips16_divdf3" },
64 { RTLIB::DIV_F32, "__mips16_divsf3" },
65 { RTLIB::OEQ_F64, "__mips16_eqdf2" },
66 { RTLIB::OEQ_F32, "__mips16_eqsf2" },
67 { RTLIB::FPEXT_F32_F64, "__mips16_extendsfdf2" },
68 { RTLIB::FPTOSINT_F64_I32, "__mips16_fix_truncdfsi" },
69 { RTLIB::FPTOSINT_F32_I32, "__mips16_fix_truncsfsi" },
70 { RTLIB::SINTTOFP_I32_F64, "__mips16_floatsidf" },
71 { RTLIB::SINTTOFP_I32_F32, "__mips16_floatsisf" },
72 { RTLIB::UINTTOFP_I32_F64, "__mips16_floatunsidf" },
73 { RTLIB::UINTTOFP_I32_F32, "__mips16_floatunsisf" },
74 { RTLIB::OGE_F64, "__mips16_gedf2" },
75 { RTLIB::OGE_F32, "__mips16_gesf2" },
76 { RTLIB::OGT_F64, "__mips16_gtdf2" },
77 { RTLIB::OGT_F32, "__mips16_gtsf2" },
78 { RTLIB::OLE_F64, "__mips16_ledf2" },
79 { RTLIB::OLE_F32, "__mips16_lesf2" },
80 { RTLIB::OLT_F64, "__mips16_ltdf2" },
81 { RTLIB::OLT_F32, "__mips16_ltsf2" },
82 { RTLIB::MUL_F64, "__mips16_muldf3" },
83 { RTLIB::MUL_F32, "__mips16_mulsf3" },
84 { RTLIB::UNE_F64, "__mips16_nedf2" },
85 { RTLIB::UNE_F32, "__mips16_nesf2" },
86 { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_dc" }, // No associated libcall.
87 { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_df" }, // No associated libcall.
88 { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_sc" }, // No associated libcall.
89 { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_sf" }, // No associated libcall.
90 { RTLIB::SUB_F64, "__mips16_subdf3" },
91 { RTLIB::SUB_F32, "__mips16_subsf3" },
92 { RTLIB::FPROUND_F64_F32, "__mips16_truncdfsf2" },
93 { RTLIB::UO_F64, "__mips16_unorddf2" },
94 { RTLIB::UO_F32, "__mips16_unordsf2" }
95 };
96
97 static const Mips16IntrinsicHelperType Mips16IntrinsicHelper[] = {
98 {"__fixunsdfsi", "__mips16_call_stub_2" },
99 {"ceil", "__mips16_call_stub_df_2"},
100 {"ceilf", "__mips16_call_stub_sf_1"},
101 {"copysign", "__mips16_call_stub_df_10"},
102 {"copysignf", "__mips16_call_stub_sf_5"},
103 {"cos", "__mips16_call_stub_df_2"},
104 {"cosf", "__mips16_call_stub_sf_1"},
105 {"exp2", "__mips16_call_stub_df_2"},
106 {"exp2f", "__mips16_call_stub_sf_1"},
107 {"floor", "__mips16_call_stub_df_2"},
108 {"floorf", "__mips16_call_stub_sf_1"},
109 {"log2", "__mips16_call_stub_df_2"},
110 {"log2f", "__mips16_call_stub_sf_1"},
111 {"nearbyint", "__mips16_call_stub_df_2"},
112 {"nearbyintf", "__mips16_call_stub_sf_1"},
113 {"rint", "__mips16_call_stub_df_2"},
114 {"rintf", "__mips16_call_stub_sf_1"},
115 {"sin", "__mips16_call_stub_df_2"},
116 {"sinf", "__mips16_call_stub_sf_1"},
117 {"sqrt", "__mips16_call_stub_df_2"},
118 {"sqrtf", "__mips16_call_stub_sf_1"},
119 {"trunc", "__mips16_call_stub_df_2"},
120 {"truncf", "__mips16_call_stub_sf_1"},
121 };
122
Mips16TargetLowering(const MipsTargetMachine & TM,const MipsSubtarget & STI)123 Mips16TargetLowering::Mips16TargetLowering(const MipsTargetMachine &TM,
124 const MipsSubtarget &STI)
125 : MipsTargetLowering(TM, STI) {
126
127 // Set up the register classes
128 addRegisterClass(MVT::i32, &Mips::CPU16RegsRegClass);
129
130 if (!Subtarget.useSoftFloat())
131 setMips16HardFloatLibCalls();
132
133 setOperationAction(ISD::ATOMIC_FENCE, MVT::Other, Expand);
134 setOperationAction(ISD::ATOMIC_CMP_SWAP, MVT::i32, Expand);
135 setOperationAction(ISD::ATOMIC_SWAP, MVT::i32, Expand);
136 setOperationAction(ISD::ATOMIC_LOAD_ADD, MVT::i32, Expand);
137 setOperationAction(ISD::ATOMIC_LOAD_SUB, MVT::i32, Expand);
138 setOperationAction(ISD::ATOMIC_LOAD_AND, MVT::i32, Expand);
139 setOperationAction(ISD::ATOMIC_LOAD_OR, MVT::i32, Expand);
140 setOperationAction(ISD::ATOMIC_LOAD_XOR, MVT::i32, Expand);
141 setOperationAction(ISD::ATOMIC_LOAD_NAND, MVT::i32, Expand);
142 setOperationAction(ISD::ATOMIC_LOAD_MIN, MVT::i32, Expand);
143 setOperationAction(ISD::ATOMIC_LOAD_MAX, MVT::i32, Expand);
144 setOperationAction(ISD::ATOMIC_LOAD_UMIN, MVT::i32, Expand);
145 setOperationAction(ISD::ATOMIC_LOAD_UMAX, MVT::i32, Expand);
146
147 setOperationAction(ISD::ROTR, MVT::i32, Expand);
148 setOperationAction(ISD::ROTR, MVT::i64, Expand);
149 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
150 setOperationAction(ISD::BSWAP, MVT::i64, Expand);
151
152 computeRegisterProperties(STI.getRegisterInfo());
153 }
154
155 const MipsTargetLowering *
createMips16TargetLowering(const MipsTargetMachine & TM,const MipsSubtarget & STI)156 llvm::createMips16TargetLowering(const MipsTargetMachine &TM,
157 const MipsSubtarget &STI) {
158 return new Mips16TargetLowering(TM, STI);
159 }
160
161 bool
allowsMisalignedMemoryAccesses(EVT VT,unsigned,unsigned,bool * Fast) const162 Mips16TargetLowering::allowsMisalignedMemoryAccesses(EVT VT,
163 unsigned,
164 unsigned,
165 bool *Fast) const {
166 return false;
167 }
168
169 MachineBasicBlock *
EmitInstrWithCustomInserter(MachineInstr * MI,MachineBasicBlock * BB) const170 Mips16TargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
171 MachineBasicBlock *BB) const {
172 switch (MI->getOpcode()) {
173 default:
174 return MipsTargetLowering::EmitInstrWithCustomInserter(MI, BB);
175 case Mips::SelBeqZ:
176 return emitSel16(Mips::BeqzRxImm16, MI, BB);
177 case Mips::SelBneZ:
178 return emitSel16(Mips::BnezRxImm16, MI, BB);
179 case Mips::SelTBteqZCmpi:
180 return emitSeliT16(Mips::Bteqz16, Mips::CmpiRxImmX16, MI, BB);
181 case Mips::SelTBteqZSlti:
182 return emitSeliT16(Mips::Bteqz16, Mips::SltiRxImmX16, MI, BB);
183 case Mips::SelTBteqZSltiu:
184 return emitSeliT16(Mips::Bteqz16, Mips::SltiuRxImmX16, MI, BB);
185 case Mips::SelTBtneZCmpi:
186 return emitSeliT16(Mips::Btnez16, Mips::CmpiRxImmX16, MI, BB);
187 case Mips::SelTBtneZSlti:
188 return emitSeliT16(Mips::Btnez16, Mips::SltiRxImmX16, MI, BB);
189 case Mips::SelTBtneZSltiu:
190 return emitSeliT16(Mips::Btnez16, Mips::SltiuRxImmX16, MI, BB);
191 case Mips::SelTBteqZCmp:
192 return emitSelT16(Mips::Bteqz16, Mips::CmpRxRy16, MI, BB);
193 case Mips::SelTBteqZSlt:
194 return emitSelT16(Mips::Bteqz16, Mips::SltRxRy16, MI, BB);
195 case Mips::SelTBteqZSltu:
196 return emitSelT16(Mips::Bteqz16, Mips::SltuRxRy16, MI, BB);
197 case Mips::SelTBtneZCmp:
198 return emitSelT16(Mips::Btnez16, Mips::CmpRxRy16, MI, BB);
199 case Mips::SelTBtneZSlt:
200 return emitSelT16(Mips::Btnez16, Mips::SltRxRy16, MI, BB);
201 case Mips::SelTBtneZSltu:
202 return emitSelT16(Mips::Btnez16, Mips::SltuRxRy16, MI, BB);
203 case Mips::BteqzT8CmpX16:
204 return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::CmpRxRy16, MI, BB);
205 case Mips::BteqzT8SltX16:
206 return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::SltRxRy16, MI, BB);
207 case Mips::BteqzT8SltuX16:
208 // TBD: figure out a way to get this or remove the instruction
209 // altogether.
210 return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::SltuRxRy16, MI, BB);
211 case Mips::BtnezT8CmpX16:
212 return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::CmpRxRy16, MI, BB);
213 case Mips::BtnezT8SltX16:
214 return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::SltRxRy16, MI, BB);
215 case Mips::BtnezT8SltuX16:
216 // TBD: figure out a way to get this or remove the instruction
217 // altogether.
218 return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::SltuRxRy16, MI, BB);
219 case Mips::BteqzT8CmpiX16: return emitFEXT_T8I8I16_ins(
220 Mips::Bteqz16, Mips::CmpiRxImm16, Mips::CmpiRxImmX16, false, MI, BB);
221 case Mips::BteqzT8SltiX16: return emitFEXT_T8I8I16_ins(
222 Mips::Bteqz16, Mips::SltiRxImm16, Mips::SltiRxImmX16, true, MI, BB);
223 case Mips::BteqzT8SltiuX16: return emitFEXT_T8I8I16_ins(
224 Mips::Bteqz16, Mips::SltiuRxImm16, Mips::SltiuRxImmX16, false, MI, BB);
225 case Mips::BtnezT8CmpiX16: return emitFEXT_T8I8I16_ins(
226 Mips::Btnez16, Mips::CmpiRxImm16, Mips::CmpiRxImmX16, false, MI, BB);
227 case Mips::BtnezT8SltiX16: return emitFEXT_T8I8I16_ins(
228 Mips::Btnez16, Mips::SltiRxImm16, Mips::SltiRxImmX16, true, MI, BB);
229 case Mips::BtnezT8SltiuX16: return emitFEXT_T8I8I16_ins(
230 Mips::Btnez16, Mips::SltiuRxImm16, Mips::SltiuRxImmX16, false, MI, BB);
231 break;
232 case Mips::SltCCRxRy16:
233 return emitFEXT_CCRX16_ins(Mips::SltRxRy16, MI, BB);
234 break;
235 case Mips::SltiCCRxImmX16:
236 return emitFEXT_CCRXI16_ins
237 (Mips::SltiRxImm16, Mips::SltiRxImmX16, MI, BB);
238 case Mips::SltiuCCRxImmX16:
239 return emitFEXT_CCRXI16_ins
240 (Mips::SltiuRxImm16, Mips::SltiuRxImmX16, MI, BB);
241 case Mips::SltuCCRxRy16:
242 return emitFEXT_CCRX16_ins
243 (Mips::SltuRxRy16, MI, BB);
244 }
245 }
246
isEligibleForTailCallOptimization(const CCState & CCInfo,unsigned NextStackOffset,const MipsFunctionInfo & FI) const247 bool Mips16TargetLowering::isEligibleForTailCallOptimization(
248 const CCState &CCInfo, unsigned NextStackOffset,
249 const MipsFunctionInfo &FI) const {
250 // No tail call optimization for mips16.
251 return false;
252 }
253
setMips16HardFloatLibCalls()254 void Mips16TargetLowering::setMips16HardFloatLibCalls() {
255 for (unsigned I = 0; I != array_lengthof(HardFloatLibCalls); ++I) {
256 assert((I == 0 || HardFloatLibCalls[I - 1] < HardFloatLibCalls[I]) &&
257 "Array not sorted!");
258 if (HardFloatLibCalls[I].Libcall != RTLIB::UNKNOWN_LIBCALL)
259 setLibcallName(HardFloatLibCalls[I].Libcall, HardFloatLibCalls[I].Name);
260 }
261
262 setLibcallName(RTLIB::O_F64, "__mips16_unorddf2");
263 setLibcallName(RTLIB::O_F32, "__mips16_unordsf2");
264 }
265
266 //
267 // The Mips16 hard float is a crazy quilt inherited from gcc. I have a much
268 // cleaner way to do all of this but it will have to wait until the traditional
269 // gcc mechanism is completed.
270 //
// For PIC, in order for Mips16 code to call Mips32 code which, according to
// the ABI, has either arguments or returned values placed in floating point
// registers, we use a set of helper functions. (This includes functions which
// return type complex, which on Mips is returned in a pair of floating point
// registers.)
275 //
276 // This is an encoding that we inherited from gcc.
277 // In Mips traditional O32, N32 ABI, floating point numbers are passed in
278 // floating point argument registers 1,2 only when the first and optionally
279 // the second arguments are float (sf) or double (df).
280 // For Mips16 we are only concerned with the situations where floating point
281 // arguments are being passed in floating point registers by the ABI, because
282 // Mips16 mode code cannot execute floating point instructions to load those
283 // values and hence helper functions are needed.
// The possibilities are (), (sf), (sf, sf), (sf, df), (df), (df, sf), (df, df)
// the helper function suffixes for these are:
//                        0,   1,    5,        9,       2,     6,       10
// this suffix can then be calculated as follows:
// for a given argument Arg:
//     Arg1x, Arg2x = 1 :  Arg is sf
//                    2 :  Arg is df
//                    0 :  Arg is neither sf nor df
// So this stub is the string for number Arg1x + Arg2x*4.
293 // However not all numbers between 0 and 10 are possible, we check anyway and
294 // assert if the impossible exists.
295 //
296
getMips16HelperFunctionStubNumber(ArgListTy & Args) const297 unsigned int Mips16TargetLowering::getMips16HelperFunctionStubNumber
298 (ArgListTy &Args) const {
299 unsigned int resultNum = 0;
300 if (Args.size() >= 1) {
301 Type *t = Args[0].Ty;
302 if (t->isFloatTy()) {
303 resultNum = 1;
304 }
305 else if (t->isDoubleTy()) {
306 resultNum = 2;
307 }
308 }
309 if (resultNum) {
310 if (Args.size() >=2) {
311 Type *t = Args[1].Ty;
312 if (t->isFloatTy()) {
313 resultNum += 4;
314 }
315 else if (t->isDoubleTy()) {
316 resultNum += 8;
317 }
318 }
319 }
320 return resultNum;
321 }
322
323 //
// Prefixes are attached to stub numbers depending on the return type.
// return type: float           sf_
//              double          df_
//              single complex  sc_
//              double complex  dc_
//              others          NO PREFIX
330 //
331 //
// The full name of a helper function is __mips16_call_stub_ +
// return type dependent prefix + stub number
334 //
// FIXME: This is something that probably should be in a different source file
// and perhaps done differently but my main purpose is to not waste runtime
// on something that we can enumerate in the source. Another possibility is
// to have a python script to generate these mapping tables. This will do
// for now. There are a whole series of helper function mapping arrays, one
// for each return type class as outlined above. Each array has 11 possible
// entries. Entries that are 0 (null) are ones which should never be selected.
342 //
343 // All the arrays are similar except for ones which return neither
344 // sf, df, sc, dc, in which we only care about ones which have sf or df as a
345 // first parameter.
346 //
// Helper-name lookup tables, indexed by stub number (0..MAX_STUB_NUMBER).
//
// Every table entry is either the full helper name
//   "__mips16_call_stub_" + <return type prefix> + <stub number>
// or a null pointer for a stub number that has no helper (3, 4, 7 and 8 in
// every table, plus 0 in the table for non floating point returns).
//
// The scratch macros below are only meaningful while the tables are being
// built:
//   P_  the common "__mips16_call_stub_" prefix
//   P   P_ plus the return type prefix of the table being defined
//   T1  the entries for stub numbers 1..10
//   T   the entry for stub number 0 followed by T1
// All of them are undefined again at the end so that such short names do not
// leak into the rest of the translation unit.  MAX_STUB_NUMBER stays defined.
#define P_ "__mips16_call_stub_"
#define MAX_STUB_NUMBER 10
#define T1                                                                     \
  P "1", P "2", nullptr, nullptr, P "5", P "6", nullptr, nullptr, P "9", P "10"
#define T P "0", T1

// Return type is neither float, double nor a complex pair: no prefix, and
// no helper for stub number 0.
#define P P_
static const char *const vMips16Helper[MAX_STUB_NUMBER + 1] = {nullptr, T1};
#undef P

// Return type float.
#define P P_ "sf_"
static const char *const sfMips16Helper[MAX_STUB_NUMBER + 1] = {T};
#undef P

// Return type double.
#define P P_ "df_"
static const char *const dfMips16Helper[MAX_STUB_NUMBER + 1] = {T};
#undef P

// Return type single precision complex.
#define P P_ "sc_"
static const char *const scMips16Helper[MAX_STUB_NUMBER + 1] = {T};
#undef P

// Return type double precision complex.
#define P P_ "dc_"
static const char *const dcMips16Helper[MAX_STUB_NUMBER + 1] = {T};
#undef P

#undef T
#undef T1
#undef P_
372
373
374 const char* Mips16TargetLowering::
getMips16HelperFunction(Type * RetTy,ArgListTy & Args,bool & needHelper) const375 getMips16HelperFunction
376 (Type* RetTy, ArgListTy &Args, bool &needHelper) const {
377 const unsigned int stubNum = getMips16HelperFunctionStubNumber(Args);
378 #ifndef NDEBUG
379 const unsigned int maxStubNum = 10;
380 assert(stubNum <= maxStubNum);
381 const bool validStubNum[maxStubNum+1] =
382 {true, true, true, false, false, true, true, false, false, true, true};
383 assert(validStubNum[stubNum]);
384 #endif
385 const char *result;
386 if (RetTy->isFloatTy()) {
387 result = sfMips16Helper[stubNum];
388 }
389 else if (RetTy ->isDoubleTy()) {
390 result = dfMips16Helper[stubNum];
391 }
392 else if (RetTy->isStructTy()) {
393 // check if it's complex
394 if (RetTy->getNumContainedTypes() == 2) {
395 if ((RetTy->getContainedType(0)->isFloatTy()) &&
396 (RetTy->getContainedType(1)->isFloatTy())) {
397 result = scMips16Helper[stubNum];
398 }
399 else if ((RetTy->getContainedType(0)->isDoubleTy()) &&
400 (RetTy->getContainedType(1)->isDoubleTy())) {
401 result = dcMips16Helper[stubNum];
402 }
403 else {
404 llvm_unreachable("Uncovered condition");
405 }
406 }
407 else {
408 llvm_unreachable("Uncovered condition");
409 }
410 }
411 else {
412 if (stubNum == 0) {
413 needHelper = false;
414 return "";
415 }
416 result = vMips16Helper[stubNum];
417 }
418 needHelper = true;
419 return result;
420 }
421
422 void Mips16TargetLowering::
getOpndList(SmallVectorImpl<SDValue> & Ops,std::deque<std::pair<unsigned,SDValue>> & RegsToPass,bool IsPICCall,bool GlobalOrExternal,bool InternalLinkage,bool IsCallReloc,CallLoweringInfo & CLI,SDValue Callee,SDValue Chain) const423 getOpndList(SmallVectorImpl<SDValue> &Ops,
424 std::deque< std::pair<unsigned, SDValue> > &RegsToPass,
425 bool IsPICCall, bool GlobalOrExternal, bool InternalLinkage,
426 bool IsCallReloc, CallLoweringInfo &CLI, SDValue Callee,
427 SDValue Chain) const {
428 SelectionDAG &DAG = CLI.DAG;
429 MachineFunction &MF = DAG.getMachineFunction();
430 MipsFunctionInfo *FuncInfo = MF.getInfo<MipsFunctionInfo>();
431 const char* Mips16HelperFunction = nullptr;
432 bool NeedMips16Helper = false;
433
434 if (Subtarget.inMips16HardFloat()) {
435 //
436 // currently we don't have symbols tagged with the mips16 or mips32
437 // qualifier so we will assume that we don't know what kind it is.
438 // and generate the helper
439 //
440 bool LookupHelper = true;
441 if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(CLI.Callee)) {
442 Mips16Libcall Find = { RTLIB::UNKNOWN_LIBCALL, S->getSymbol() };
443
444 if (std::binary_search(std::begin(HardFloatLibCalls),
445 std::end(HardFloatLibCalls), Find))
446 LookupHelper = false;
447 else {
448 const char *Symbol = S->getSymbol();
449 Mips16IntrinsicHelperType IntrinsicFind = { Symbol, "" };
450 const Mips16HardFloatInfo::FuncSignature *Signature =
451 Mips16HardFloatInfo::findFuncSignature(Symbol);
452 if (!IsPICCall && (Signature && (FuncInfo->StubsNeeded.find(Symbol) ==
453 FuncInfo->StubsNeeded.end()))) {
454 FuncInfo->StubsNeeded[Symbol] = Signature;
455 //
456 // S2 is normally saved if the stub is for a function which
457 // returns a float or double value and is not otherwise. This is
458 // because more work is required after the function the stub
459 // is calling completes, and so the stub cannot directly return
460 // and the stub has no stack space to store the return address so
461 // S2 is used for that purpose.
462 // In order to take advantage of not saving S2, we need to also
463 // optimize the call in the stub and this requires some further
464 // functionality in MipsAsmPrinter which we don't have yet.
465 // So for now we always save S2. The optimization will be done
466 // in a follow-on patch.
467 //
468 if (1 || (Signature->RetSig != Mips16HardFloatInfo::NoFPRet))
469 FuncInfo->setSaveS2();
470 }
471 // one more look at list of intrinsics
472 const Mips16IntrinsicHelperType *Helper =
473 std::lower_bound(std::begin(Mips16IntrinsicHelper),
474 std::end(Mips16IntrinsicHelper), IntrinsicFind);
475 if (Helper != std::end(Mips16IntrinsicHelper) &&
476 *Helper == IntrinsicFind) {
477 Mips16HelperFunction = Helper->Helper;
478 NeedMips16Helper = true;
479 LookupHelper = false;
480 }
481
482 }
483 } else if (GlobalAddressSDNode *G =
484 dyn_cast<GlobalAddressSDNode>(CLI.Callee)) {
485 Mips16Libcall Find = { RTLIB::UNKNOWN_LIBCALL,
486 G->getGlobal()->getName().data() };
487
488 if (std::binary_search(std::begin(HardFloatLibCalls),
489 std::end(HardFloatLibCalls), Find))
490 LookupHelper = false;
491 }
492 if (LookupHelper)
493 Mips16HelperFunction =
494 getMips16HelperFunction(CLI.RetTy, CLI.getArgs(), NeedMips16Helper);
495 }
496
497 SDValue JumpTarget = Callee;
498
499 // T9 should contain the address of the callee function if
500 // -relocation-model=pic or it is an indirect call.
501 if (IsPICCall || !GlobalOrExternal) {
502 unsigned V0Reg = Mips::V0;
503 if (NeedMips16Helper) {
504 RegsToPass.push_front(std::make_pair(V0Reg, Callee));
505 JumpTarget = DAG.getExternalSymbol(Mips16HelperFunction,
506 getPointerTy(DAG.getDataLayout()));
507 ExternalSymbolSDNode *S = cast<ExternalSymbolSDNode>(JumpTarget);
508 JumpTarget = getAddrGlobal(S, CLI.DL, JumpTarget.getValueType(), DAG,
509 MipsII::MO_GOT, Chain,
510 FuncInfo->callPtrInfo(S->getSymbol()));
511 } else
512 RegsToPass.push_front(std::make_pair((unsigned)Mips::T9, Callee));
513 }
514
515 Ops.push_back(JumpTarget);
516
517 MipsTargetLowering::getOpndList(Ops, RegsToPass, IsPICCall, GlobalOrExternal,
518 InternalLinkage, IsCallReloc, CLI, Callee,
519 Chain);
520 }
521
522 MachineBasicBlock *Mips16TargetLowering::
emitSel16(unsigned Opc,MachineInstr * MI,MachineBasicBlock * BB) const523 emitSel16(unsigned Opc, MachineInstr *MI, MachineBasicBlock *BB) const {
524 if (DontExpandCondPseudos16)
525 return BB;
526 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
527 DebugLoc DL = MI->getDebugLoc();
528 // To "insert" a SELECT_CC instruction, we actually have to insert the
529 // diamond control-flow pattern. The incoming instruction knows the
530 // destination vreg to set, the condition code register to branch on, the
531 // true/false values to select between, and a branch opcode to use.
532 const BasicBlock *LLVM_BB = BB->getBasicBlock();
533 MachineFunction::iterator It = ++BB->getIterator();
534
535 // thisMBB:
536 // ...
537 // TrueVal = ...
538 // setcc r1, r2, r3
539 // bNE r1, r0, copy1MBB
540 // fallthrough --> copy0MBB
541 MachineBasicBlock *thisMBB = BB;
542 MachineFunction *F = BB->getParent();
543 MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
544 MachineBasicBlock *sinkMBB = F->CreateMachineBasicBlock(LLVM_BB);
545 F->insert(It, copy0MBB);
546 F->insert(It, sinkMBB);
547
548 // Transfer the remainder of BB and its successor edges to sinkMBB.
549 sinkMBB->splice(sinkMBB->begin(), BB,
550 std::next(MachineBasicBlock::iterator(MI)), BB->end());
551 sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
552
553 // Next, add the true and fallthrough blocks as its successors.
554 BB->addSuccessor(copy0MBB);
555 BB->addSuccessor(sinkMBB);
556
557 BuildMI(BB, DL, TII->get(Opc)).addReg(MI->getOperand(3).getReg())
558 .addMBB(sinkMBB);
559
560 // copy0MBB:
561 // %FalseValue = ...
562 // # fallthrough to sinkMBB
563 BB = copy0MBB;
564
565 // Update machine-CFG edges
566 BB->addSuccessor(sinkMBB);
567
568 // sinkMBB:
569 // %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
570 // ...
571 BB = sinkMBB;
572
573 BuildMI(*BB, BB->begin(), DL,
574 TII->get(Mips::PHI), MI->getOperand(0).getReg())
575 .addReg(MI->getOperand(1).getReg()).addMBB(thisMBB)
576 .addReg(MI->getOperand(2).getReg()).addMBB(copy0MBB);
577
578 MI->eraseFromParent(); // The pseudo instruction is gone now.
579 return BB;
580 }
581
582 MachineBasicBlock *
emitSelT16(unsigned Opc1,unsigned Opc2,MachineInstr * MI,MachineBasicBlock * BB) const583 Mips16TargetLowering::emitSelT16(unsigned Opc1, unsigned Opc2, MachineInstr *MI,
584 MachineBasicBlock *BB) const {
585 if (DontExpandCondPseudos16)
586 return BB;
587 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
588 DebugLoc DL = MI->getDebugLoc();
589 // To "insert" a SELECT_CC instruction, we actually have to insert the
590 // diamond control-flow pattern. The incoming instruction knows the
591 // destination vreg to set, the condition code register to branch on, the
592 // true/false values to select between, and a branch opcode to use.
593 const BasicBlock *LLVM_BB = BB->getBasicBlock();
594 MachineFunction::iterator It = ++BB->getIterator();
595
596 // thisMBB:
597 // ...
598 // TrueVal = ...
599 // setcc r1, r2, r3
600 // bNE r1, r0, copy1MBB
601 // fallthrough --> copy0MBB
602 MachineBasicBlock *thisMBB = BB;
603 MachineFunction *F = BB->getParent();
604 MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
605 MachineBasicBlock *sinkMBB = F->CreateMachineBasicBlock(LLVM_BB);
606 F->insert(It, copy0MBB);
607 F->insert(It, sinkMBB);
608
609 // Transfer the remainder of BB and its successor edges to sinkMBB.
610 sinkMBB->splice(sinkMBB->begin(), BB,
611 std::next(MachineBasicBlock::iterator(MI)), BB->end());
612 sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
613
614 // Next, add the true and fallthrough blocks as its successors.
615 BB->addSuccessor(copy0MBB);
616 BB->addSuccessor(sinkMBB);
617
618 BuildMI(BB, DL, TII->get(Opc2)).addReg(MI->getOperand(3).getReg())
619 .addReg(MI->getOperand(4).getReg());
620 BuildMI(BB, DL, TII->get(Opc1)).addMBB(sinkMBB);
621
622 // copy0MBB:
623 // %FalseValue = ...
624 // # fallthrough to sinkMBB
625 BB = copy0MBB;
626
627 // Update machine-CFG edges
628 BB->addSuccessor(sinkMBB);
629
630 // sinkMBB:
631 // %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
632 // ...
633 BB = sinkMBB;
634
635 BuildMI(*BB, BB->begin(), DL,
636 TII->get(Mips::PHI), MI->getOperand(0).getReg())
637 .addReg(MI->getOperand(1).getReg()).addMBB(thisMBB)
638 .addReg(MI->getOperand(2).getReg()).addMBB(copy0MBB);
639
640 MI->eraseFromParent(); // The pseudo instruction is gone now.
641 return BB;
642
643 }
644
645 MachineBasicBlock *
emitSeliT16(unsigned Opc1,unsigned Opc2,MachineInstr * MI,MachineBasicBlock * BB) const646 Mips16TargetLowering::emitSeliT16(unsigned Opc1, unsigned Opc2,
647 MachineInstr *MI,
648 MachineBasicBlock *BB) const {
649 if (DontExpandCondPseudos16)
650 return BB;
651 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
652 DebugLoc DL = MI->getDebugLoc();
653 // To "insert" a SELECT_CC instruction, we actually have to insert the
654 // diamond control-flow pattern. The incoming instruction knows the
655 // destination vreg to set, the condition code register to branch on, the
656 // true/false values to select between, and a branch opcode to use.
657 const BasicBlock *LLVM_BB = BB->getBasicBlock();
658 MachineFunction::iterator It = ++BB->getIterator();
659
660 // thisMBB:
661 // ...
662 // TrueVal = ...
663 // setcc r1, r2, r3
664 // bNE r1, r0, copy1MBB
665 // fallthrough --> copy0MBB
666 MachineBasicBlock *thisMBB = BB;
667 MachineFunction *F = BB->getParent();
668 MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
669 MachineBasicBlock *sinkMBB = F->CreateMachineBasicBlock(LLVM_BB);
670 F->insert(It, copy0MBB);
671 F->insert(It, sinkMBB);
672
673 // Transfer the remainder of BB and its successor edges to sinkMBB.
674 sinkMBB->splice(sinkMBB->begin(), BB,
675 std::next(MachineBasicBlock::iterator(MI)), BB->end());
676 sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
677
678 // Next, add the true and fallthrough blocks as its successors.
679 BB->addSuccessor(copy0MBB);
680 BB->addSuccessor(sinkMBB);
681
682 BuildMI(BB, DL, TII->get(Opc2)).addReg(MI->getOperand(3).getReg())
683 .addImm(MI->getOperand(4).getImm());
684 BuildMI(BB, DL, TII->get(Opc1)).addMBB(sinkMBB);
685
686 // copy0MBB:
687 // %FalseValue = ...
688 // # fallthrough to sinkMBB
689 BB = copy0MBB;
690
691 // Update machine-CFG edges
692 BB->addSuccessor(sinkMBB);
693
694 // sinkMBB:
695 // %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
696 // ...
697 BB = sinkMBB;
698
699 BuildMI(*BB, BB->begin(), DL,
700 TII->get(Mips::PHI), MI->getOperand(0).getReg())
701 .addReg(MI->getOperand(1).getReg()).addMBB(thisMBB)
702 .addReg(MI->getOperand(2).getReg()).addMBB(copy0MBB);
703
704 MI->eraseFromParent(); // The pseudo instruction is gone now.
705 return BB;
706
707 }
708
709 MachineBasicBlock *
emitFEXT_T8I816_ins(unsigned BtOpc,unsigned CmpOpc,MachineInstr * MI,MachineBasicBlock * BB) const710 Mips16TargetLowering::emitFEXT_T8I816_ins(unsigned BtOpc, unsigned CmpOpc,
711 MachineInstr *MI,
712 MachineBasicBlock *BB) const {
713 if (DontExpandCondPseudos16)
714 return BB;
715 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
716 unsigned regX = MI->getOperand(0).getReg();
717 unsigned regY = MI->getOperand(1).getReg();
718 MachineBasicBlock *target = MI->getOperand(2).getMBB();
719 BuildMI(*BB, MI, MI->getDebugLoc(), TII->get(CmpOpc)).addReg(regX)
720 .addReg(regY);
721 BuildMI(*BB, MI, MI->getDebugLoc(), TII->get(BtOpc)).addMBB(target);
722 MI->eraseFromParent(); // The pseudo instruction is gone now.
723 return BB;
724 }
725
emitFEXT_T8I8I16_ins(unsigned BtOpc,unsigned CmpiOpc,unsigned CmpiXOpc,bool ImmSigned,MachineInstr * MI,MachineBasicBlock * BB) const726 MachineBasicBlock *Mips16TargetLowering::emitFEXT_T8I8I16_ins(
727 unsigned BtOpc, unsigned CmpiOpc, unsigned CmpiXOpc, bool ImmSigned,
728 MachineInstr *MI, MachineBasicBlock *BB) const {
729 if (DontExpandCondPseudos16)
730 return BB;
731 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
732 unsigned regX = MI->getOperand(0).getReg();
733 int64_t imm = MI->getOperand(1).getImm();
734 MachineBasicBlock *target = MI->getOperand(2).getMBB();
735 unsigned CmpOpc;
736 if (isUInt<8>(imm))
737 CmpOpc = CmpiOpc;
738 else if ((!ImmSigned && isUInt<16>(imm)) ||
739 (ImmSigned && isInt<16>(imm)))
740 CmpOpc = CmpiXOpc;
741 else
742 llvm_unreachable("immediate field not usable");
743 BuildMI(*BB, MI, MI->getDebugLoc(), TII->get(CmpOpc)).addReg(regX)
744 .addImm(imm);
745 BuildMI(*BB, MI, MI->getDebugLoc(), TII->get(BtOpc)).addMBB(target);
746 MI->eraseFromParent(); // The pseudo instruction is gone now.
747 return BB;
748 }
749
Mips16WhichOp8uOr16simm(unsigned shortOp,unsigned longOp,int64_t Imm)750 static unsigned Mips16WhichOp8uOr16simm
751 (unsigned shortOp, unsigned longOp, int64_t Imm) {
752 if (isUInt<8>(Imm))
753 return shortOp;
754 else if (isInt<16>(Imm))
755 return longOp;
756 else
757 llvm_unreachable("immediate field not usable");
758 }
759
760 MachineBasicBlock *
emitFEXT_CCRX16_ins(unsigned SltOpc,MachineInstr * MI,MachineBasicBlock * BB) const761 Mips16TargetLowering::emitFEXT_CCRX16_ins(unsigned SltOpc, MachineInstr *MI,
762 MachineBasicBlock *BB) const {
763 if (DontExpandCondPseudos16)
764 return BB;
765 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
766 unsigned CC = MI->getOperand(0).getReg();
767 unsigned regX = MI->getOperand(1).getReg();
768 unsigned regY = MI->getOperand(2).getReg();
769 BuildMI(*BB, MI, MI->getDebugLoc(), TII->get(SltOpc)).addReg(regX).addReg(
770 regY);
771 BuildMI(*BB, MI, MI->getDebugLoc(),
772 TII->get(Mips::MoveR3216), CC).addReg(Mips::T8);
773 MI->eraseFromParent(); // The pseudo instruction is gone now.
774 return BB;
775 }
776
777 MachineBasicBlock *
emitFEXT_CCRXI16_ins(unsigned SltiOpc,unsigned SltiXOpc,MachineInstr * MI,MachineBasicBlock * BB) const778 Mips16TargetLowering::emitFEXT_CCRXI16_ins(unsigned SltiOpc, unsigned SltiXOpc,
779 MachineInstr *MI,
780 MachineBasicBlock *BB) const {
781 if (DontExpandCondPseudos16)
782 return BB;
783 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
784 unsigned CC = MI->getOperand(0).getReg();
785 unsigned regX = MI->getOperand(1).getReg();
786 int64_t Imm = MI->getOperand(2).getImm();
787 unsigned SltOpc = Mips16WhichOp8uOr16simm(SltiOpc, SltiXOpc, Imm);
788 BuildMI(*BB, MI, MI->getDebugLoc(),
789 TII->get(SltOpc)).addReg(regX).addImm(Imm);
790 BuildMI(*BB, MI, MI->getDebugLoc(),
791 TII->get(Mips::MoveR3216), CC).addReg(Mips::T8);
792 MI->eraseFromParent(); // The pseudo instruction is gone now.
793 return BB;
794
795 }
796