1 //===-- BPFISelLowering.cpp - BPF DAG Lowering Implementation  ------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines the interfaces that BPF uses to lower LLVM code into a
11 // selection DAG.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "BPFISelLowering.h"
16 #include "BPF.h"
17 #include "BPFSubtarget.h"
18 #include "BPFTargetMachine.h"
19 #include "llvm/CodeGen/CallingConvLower.h"
20 #include "llvm/CodeGen/MachineFrameInfo.h"
21 #include "llvm/CodeGen/MachineFunction.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/MachineRegisterInfo.h"
24 #include "llvm/CodeGen/SelectionDAGISel.h"
25 #include "llvm/CodeGen/TargetLoweringObjectFileImpl.h"
26 #include "llvm/CodeGen/ValueTypes.h"
27 #include "llvm/IR/DiagnosticInfo.h"
28 #include "llvm/IR/DiagnosticPrinter.h"
29 #include "llvm/Support/Debug.h"
30 #include "llvm/Support/ErrorHandling.h"
31 #include "llvm/Support/raw_ostream.h"
32 using namespace llvm;
33 
34 #define DEBUG_TYPE "bpf-lower"
35 
fail(const SDLoc & DL,SelectionDAG & DAG,const char * Msg)36 static void fail(const SDLoc &DL, SelectionDAG &DAG, const char *Msg) {
37   MachineFunction &MF = DAG.getMachineFunction();
38   DAG.getContext()->diagnose(
39       DiagnosticInfoUnsupported(*MF.getFunction(), Msg, DL.getDebugLoc()));
40 }
41 
fail(const SDLoc & DL,SelectionDAG & DAG,const char * Msg,SDValue Val)42 static void fail(const SDLoc &DL, SelectionDAG &DAG, const char *Msg,
43                  SDValue Val) {
44   MachineFunction &MF = DAG.getMachineFunction();
45   std::string Str;
46   raw_string_ostream OS(Str);
47   OS << Msg;
48   Val->print(OS);
49   OS.flush();
50   DAG.getContext()->diagnose(
51       DiagnosticInfoUnsupported(*MF.getFunction(), Str, DL.getDebugLoc()));
52 }
53 
BPFTargetLowering(const TargetMachine & TM,const BPFSubtarget & STI)54 BPFTargetLowering::BPFTargetLowering(const TargetMachine &TM,
55                                      const BPFSubtarget &STI)
56     : TargetLowering(TM) {
57 
58   // Set up the register classes.
59   addRegisterClass(MVT::i64, &BPF::GPRRegClass);
60 
61   // Compute derived properties from the register classes
62   computeRegisterProperties(STI.getRegisterInfo());
63 
64   setStackPointerRegisterToSaveRestore(BPF::R11);
65 
66   setOperationAction(ISD::BR_CC, MVT::i64, Custom);
67   setOperationAction(ISD::BR_JT, MVT::Other, Expand);
68   setOperationAction(ISD::BRIND, MVT::Other, Expand);
69   setOperationAction(ISD::BRCOND, MVT::Other, Expand);
70   setOperationAction(ISD::SETCC, MVT::i64, Expand);
71   setOperationAction(ISD::SELECT, MVT::i64, Expand);
72   setOperationAction(ISD::SELECT_CC, MVT::i64, Custom);
73 
74   setOperationAction(ISD::GlobalAddress, MVT::i64, Custom);
75 
76   setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64, Custom);
77   setOperationAction(ISD::STACKSAVE, MVT::Other, Expand);
78   setOperationAction(ISD::STACKRESTORE, MVT::Other, Expand);
79 
80   setOperationAction(ISD::SDIVREM, MVT::i64, Expand);
81   setOperationAction(ISD::UDIVREM, MVT::i64, Expand);
82   setOperationAction(ISD::SREM, MVT::i64, Expand);
83   setOperationAction(ISD::UREM, MVT::i64, Expand);
84 
85   setOperationAction(ISD::MULHU, MVT::i64, Expand);
86   setOperationAction(ISD::MULHS, MVT::i64, Expand);
87   setOperationAction(ISD::UMUL_LOHI, MVT::i64, Expand);
88   setOperationAction(ISD::SMUL_LOHI, MVT::i64, Expand);
89 
90   setOperationAction(ISD::ADDC, MVT::i64, Expand);
91   setOperationAction(ISD::ADDE, MVT::i64, Expand);
92   setOperationAction(ISD::SUBC, MVT::i64, Expand);
93   setOperationAction(ISD::SUBE, MVT::i64, Expand);
94 
95   setOperationAction(ISD::ROTR, MVT::i64, Expand);
96   setOperationAction(ISD::ROTL, MVT::i64, Expand);
97   setOperationAction(ISD::SHL_PARTS, MVT::i64, Expand);
98   setOperationAction(ISD::SRL_PARTS, MVT::i64, Expand);
99   setOperationAction(ISD::SRA_PARTS, MVT::i64, Expand);
100 
101   setOperationAction(ISD::CTTZ, MVT::i64, Custom);
102   setOperationAction(ISD::CTLZ, MVT::i64, Custom);
103   setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i64, Custom);
104   setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i64, Custom);
105   setOperationAction(ISD::CTPOP, MVT::i64, Expand);
106 
107   setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
108   setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i8, Expand);
109   setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i16, Expand);
110   setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i32, Expand);
111 
112   // Extended load operations for i1 types must be promoted
113   for (MVT VT : MVT::integer_valuetypes()) {
114     setLoadExtAction(ISD::EXTLOAD, VT, MVT::i1, Promote);
115     setLoadExtAction(ISD::ZEXTLOAD, VT, MVT::i1, Promote);
116     setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i1, Promote);
117 
118     setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i8, Expand);
119     setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i16, Expand);
120     setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i32, Expand);
121   }
122 
123   setBooleanContents(ZeroOrOneBooleanContent);
124 
125   // Function alignments (log2)
126   setMinFunctionAlignment(3);
127   setPrefFunctionAlignment(3);
128 
129   // inline memcpy() for kernel to see explicit copy
130   MaxStoresPerMemset = MaxStoresPerMemsetOptSize = 128;
131   MaxStoresPerMemcpy = MaxStoresPerMemcpyOptSize = 128;
132   MaxStoresPerMemmove = MaxStoresPerMemmoveOptSize = 128;
133 }
134 
LowerOperation(SDValue Op,SelectionDAG & DAG) const135 SDValue BPFTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const {
136   switch (Op.getOpcode()) {
137   case ISD::BR_CC:
138     return LowerBR_CC(Op, DAG);
139   case ISD::GlobalAddress:
140     return LowerGlobalAddress(Op, DAG);
141   case ISD::SELECT_CC:
142     return LowerSELECT_CC(Op, DAG);
143   default:
144     llvm_unreachable("unimplemented operand");
145   }
146 }
147 
148 // Calling Convention Implementation
149 #include "BPFGenCallingConv.inc"
150 
LowerFormalArguments(SDValue Chain,CallingConv::ID CallConv,bool IsVarArg,const SmallVectorImpl<ISD::InputArg> & Ins,const SDLoc & DL,SelectionDAG & DAG,SmallVectorImpl<SDValue> & InVals) const151 SDValue BPFTargetLowering::LowerFormalArguments(
152     SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,
153     const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
154     SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
155   switch (CallConv) {
156   default:
157     llvm_unreachable("Unsupported calling convention");
158   case CallingConv::C:
159   case CallingConv::Fast:
160     break;
161   }
162 
163   MachineFunction &MF = DAG.getMachineFunction();
164   MachineRegisterInfo &RegInfo = MF.getRegInfo();
165 
166   // Assign locations to all of the incoming arguments.
167   SmallVector<CCValAssign, 16> ArgLocs;
168   CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
169   CCInfo.AnalyzeFormalArguments(Ins, CC_BPF64);
170 
171   for (auto &VA : ArgLocs) {
172     if (VA.isRegLoc()) {
173       // Arguments passed in registers
174       EVT RegVT = VA.getLocVT();
175       switch (RegVT.getSimpleVT().SimpleTy) {
176       default: {
177         errs() << "LowerFormalArguments Unhandled argument type: "
178                << RegVT.getEVTString() << '\n';
179         llvm_unreachable(0);
180       }
181       case MVT::i64:
182         unsigned VReg = RegInfo.createVirtualRegister(&BPF::GPRRegClass);
183         RegInfo.addLiveIn(VA.getLocReg(), VReg);
184         SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, VReg, RegVT);
185 
186         // If this is an 8/16/32-bit value, it is really passed promoted to 64
187         // bits. Insert an assert[sz]ext to capture this, then truncate to the
188         // right size.
189         if (VA.getLocInfo() == CCValAssign::SExt)
190           ArgValue = DAG.getNode(ISD::AssertSext, DL, RegVT, ArgValue,
191                                  DAG.getValueType(VA.getValVT()));
192         else if (VA.getLocInfo() == CCValAssign::ZExt)
193           ArgValue = DAG.getNode(ISD::AssertZext, DL, RegVT, ArgValue,
194                                  DAG.getValueType(VA.getValVT()));
195 
196         if (VA.getLocInfo() != CCValAssign::Full)
197           ArgValue = DAG.getNode(ISD::TRUNCATE, DL, VA.getValVT(), ArgValue);
198 
199         InVals.push_back(ArgValue);
200       }
201     } else {
202       fail(DL, DAG, "defined with too many args");
203       InVals.push_back(DAG.getConstant(0, DL, VA.getLocVT()));
204     }
205   }
206 
207   if (IsVarArg || MF.getFunction()->hasStructRetAttr()) {
208     fail(DL, DAG, "functions with VarArgs or StructRet are not supported");
209   }
210 
211   return Chain;
212 }
213 
214 const unsigned BPFTargetLowering::MaxArgs = 5;
215 
LowerCall(TargetLowering::CallLoweringInfo & CLI,SmallVectorImpl<SDValue> & InVals) const216 SDValue BPFTargetLowering::LowerCall(TargetLowering::CallLoweringInfo &CLI,
217                                      SmallVectorImpl<SDValue> &InVals) const {
218   SelectionDAG &DAG = CLI.DAG;
219   auto &Outs = CLI.Outs;
220   auto &OutVals = CLI.OutVals;
221   auto &Ins = CLI.Ins;
222   SDValue Chain = CLI.Chain;
223   SDValue Callee = CLI.Callee;
224   bool &IsTailCall = CLI.IsTailCall;
225   CallingConv::ID CallConv = CLI.CallConv;
226   bool IsVarArg = CLI.IsVarArg;
227   MachineFunction &MF = DAG.getMachineFunction();
228 
229   // BPF target does not support tail call optimization.
230   IsTailCall = false;
231 
232   switch (CallConv) {
233   default:
234     report_fatal_error("Unsupported calling convention");
235   case CallingConv::Fast:
236   case CallingConv::C:
237     break;
238   }
239 
240   // Analyze operands of the call, assigning locations to each operand.
241   SmallVector<CCValAssign, 16> ArgLocs;
242   CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
243 
244   CCInfo.AnalyzeCallOperands(Outs, CC_BPF64);
245 
246   unsigned NumBytes = CCInfo.getNextStackOffset();
247 
248   if (Outs.size() > MaxArgs)
249     fail(CLI.DL, DAG, "too many args to ", Callee);
250 
251   for (auto &Arg : Outs) {
252     ISD::ArgFlagsTy Flags = Arg.Flags;
253     if (!Flags.isByVal())
254       continue;
255 
256     fail(CLI.DL, DAG, "pass by value not supported ", Callee);
257   }
258 
259   auto PtrVT = getPointerTy(MF.getDataLayout());
260   Chain = DAG.getCALLSEQ_START(
261       Chain, DAG.getConstant(NumBytes, CLI.DL, PtrVT, true), CLI.DL);
262 
263   SmallVector<std::pair<unsigned, SDValue>, MaxArgs> RegsToPass;
264 
265   // Walk arg assignments
266   for (unsigned i = 0,
267                 e = std::min(static_cast<unsigned>(ArgLocs.size()), MaxArgs);
268        i != e; ++i) {
269     CCValAssign &VA = ArgLocs[i];
270     SDValue Arg = OutVals[i];
271 
272     // Promote the value if needed.
273     switch (VA.getLocInfo()) {
274     default:
275       llvm_unreachable("Unknown loc info");
276     case CCValAssign::Full:
277       break;
278     case CCValAssign::SExt:
279       Arg = DAG.getNode(ISD::SIGN_EXTEND, CLI.DL, VA.getLocVT(), Arg);
280       break;
281     case CCValAssign::ZExt:
282       Arg = DAG.getNode(ISD::ZERO_EXTEND, CLI.DL, VA.getLocVT(), Arg);
283       break;
284     case CCValAssign::AExt:
285       Arg = DAG.getNode(ISD::ANY_EXTEND, CLI.DL, VA.getLocVT(), Arg);
286       break;
287     }
288 
289     // Push arguments into RegsToPass vector
290     if (VA.isRegLoc())
291       RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
292     else
293       llvm_unreachable("call arg pass bug");
294   }
295 
296   SDValue InFlag;
297 
298   // Build a sequence of copy-to-reg nodes chained together with token chain and
299   // flag operands which copy the outgoing args into registers.  The InFlag in
300   // necessary since all emitted instructions must be stuck together.
301   for (auto &Reg : RegsToPass) {
302     Chain = DAG.getCopyToReg(Chain, CLI.DL, Reg.first, Reg.second, InFlag);
303     InFlag = Chain.getValue(1);
304   }
305 
306   // If the callee is a GlobalAddress node (quite common, every direct call is)
307   // turn it into a TargetGlobalAddress node so that legalize doesn't hack it.
308   // Likewise ExternalSymbol -> TargetExternalSymbol.
309   if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
310     Callee = DAG.getTargetGlobalAddress(G->getGlobal(), CLI.DL, PtrVT,
311                                         G->getOffset(), 0);
312   else if (ExternalSymbolSDNode *E = dyn_cast<ExternalSymbolSDNode>(Callee))
313     Callee = DAG.getTargetExternalSymbol(E->getSymbol(), PtrVT, 0);
314 
315   // Returns a chain & a flag for retval copy to use.
316   SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);
317   SmallVector<SDValue, 8> Ops;
318   Ops.push_back(Chain);
319   Ops.push_back(Callee);
320 
321   // Add argument registers to the end of the list so that they are
322   // known live into the call.
323   for (auto &Reg : RegsToPass)
324     Ops.push_back(DAG.getRegister(Reg.first, Reg.second.getValueType()));
325 
326   if (InFlag.getNode())
327     Ops.push_back(InFlag);
328 
329   Chain = DAG.getNode(BPFISD::CALL, CLI.DL, NodeTys, Ops);
330   InFlag = Chain.getValue(1);
331 
332   // Create the CALLSEQ_END node.
333   Chain = DAG.getCALLSEQ_END(
334       Chain, DAG.getConstant(NumBytes, CLI.DL, PtrVT, true),
335       DAG.getConstant(0, CLI.DL, PtrVT, true), InFlag, CLI.DL);
336   InFlag = Chain.getValue(1);
337 
338   // Handle result values, copying them out of physregs into vregs that we
339   // return.
340   return LowerCallResult(Chain, InFlag, CallConv, IsVarArg, Ins, CLI.DL, DAG,
341                          InVals);
342 }
343 
344 SDValue
LowerReturn(SDValue Chain,CallingConv::ID CallConv,bool IsVarArg,const SmallVectorImpl<ISD::OutputArg> & Outs,const SmallVectorImpl<SDValue> & OutVals,const SDLoc & DL,SelectionDAG & DAG) const345 BPFTargetLowering::LowerReturn(SDValue Chain, CallingConv::ID CallConv,
346                                bool IsVarArg,
347                                const SmallVectorImpl<ISD::OutputArg> &Outs,
348                                const SmallVectorImpl<SDValue> &OutVals,
349                                const SDLoc &DL, SelectionDAG &DAG) const {
350   unsigned Opc = BPFISD::RET_FLAG;
351 
352   // CCValAssign - represent the assignment of the return value to a location
353   SmallVector<CCValAssign, 16> RVLocs;
354   MachineFunction &MF = DAG.getMachineFunction();
355 
356   // CCState - Info about the registers and stack slot.
357   CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
358 
359   if (MF.getFunction()->getReturnType()->isAggregateType()) {
360     fail(DL, DAG, "only integer returns supported");
361     return DAG.getNode(Opc, DL, MVT::Other, Chain);
362   }
363 
364   // Analize return values.
365   CCInfo.AnalyzeReturn(Outs, RetCC_BPF64);
366 
367   SDValue Flag;
368   SmallVector<SDValue, 4> RetOps(1, Chain);
369 
370   // Copy the result values into the output registers.
371   for (unsigned i = 0; i != RVLocs.size(); ++i) {
372     CCValAssign &VA = RVLocs[i];
373     assert(VA.isRegLoc() && "Can only return in registers!");
374 
375     Chain = DAG.getCopyToReg(Chain, DL, VA.getLocReg(), OutVals[i], Flag);
376 
377     // Guarantee that all emitted copies are stuck together,
378     // avoiding something bad.
379     Flag = Chain.getValue(1);
380     RetOps.push_back(DAG.getRegister(VA.getLocReg(), VA.getLocVT()));
381   }
382 
383   RetOps[0] = Chain; // Update chain.
384 
385   // Add the flag if we have it.
386   if (Flag.getNode())
387     RetOps.push_back(Flag);
388 
389   return DAG.getNode(Opc, DL, MVT::Other, RetOps);
390 }
391 
LowerCallResult(SDValue Chain,SDValue InFlag,CallingConv::ID CallConv,bool IsVarArg,const SmallVectorImpl<ISD::InputArg> & Ins,const SDLoc & DL,SelectionDAG & DAG,SmallVectorImpl<SDValue> & InVals) const392 SDValue BPFTargetLowering::LowerCallResult(
393     SDValue Chain, SDValue InFlag, CallingConv::ID CallConv, bool IsVarArg,
394     const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
395     SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
396 
397   MachineFunction &MF = DAG.getMachineFunction();
398   // Assign locations to each value returned by this call.
399   SmallVector<CCValAssign, 16> RVLocs;
400   CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
401 
402   if (Ins.size() >= 2) {
403     fail(DL, DAG, "only small returns supported");
404     for (unsigned i = 0, e = Ins.size(); i != e; ++i)
405       InVals.push_back(DAG.getConstant(0, DL, Ins[i].VT));
406     return DAG.getCopyFromReg(Chain, DL, 1, Ins[0].VT, InFlag).getValue(1);
407   }
408 
409   CCInfo.AnalyzeCallResult(Ins, RetCC_BPF64);
410 
411   // Copy all of the result registers out of their specified physreg.
412   for (auto &Val : RVLocs) {
413     Chain = DAG.getCopyFromReg(Chain, DL, Val.getLocReg(),
414                                Val.getValVT(), InFlag).getValue(1);
415     InFlag = Chain.getValue(2);
416     InVals.push_back(Chain.getValue(0));
417   }
418 
419   return Chain;
420 }
421 
NegateCC(SDValue & LHS,SDValue & RHS,ISD::CondCode & CC)422 static void NegateCC(SDValue &LHS, SDValue &RHS, ISD::CondCode &CC) {
423   switch (CC) {
424   default:
425     break;
426   case ISD::SETULT:
427   case ISD::SETULE:
428   case ISD::SETLT:
429   case ISD::SETLE:
430     CC = ISD::getSetCCSwappedOperands(CC);
431     std::swap(LHS, RHS);
432     break;
433   }
434 }
435 
LowerBR_CC(SDValue Op,SelectionDAG & DAG) const436 SDValue BPFTargetLowering::LowerBR_CC(SDValue Op, SelectionDAG &DAG) const {
437   SDValue Chain = Op.getOperand(0);
438   ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(1))->get();
439   SDValue LHS = Op.getOperand(2);
440   SDValue RHS = Op.getOperand(3);
441   SDValue Dest = Op.getOperand(4);
442   SDLoc DL(Op);
443 
444   NegateCC(LHS, RHS, CC);
445 
446   return DAG.getNode(BPFISD::BR_CC, DL, Op.getValueType(), Chain, LHS, RHS,
447                      DAG.getConstant(CC, DL, MVT::i64), Dest);
448 }
449 
LowerSELECT_CC(SDValue Op,SelectionDAG & DAG) const450 SDValue BPFTargetLowering::LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const {
451   SDValue LHS = Op.getOperand(0);
452   SDValue RHS = Op.getOperand(1);
453   SDValue TrueV = Op.getOperand(2);
454   SDValue FalseV = Op.getOperand(3);
455   ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
456   SDLoc DL(Op);
457 
458   NegateCC(LHS, RHS, CC);
459 
460   SDValue TargetCC = DAG.getConstant(CC, DL, MVT::i64);
461 
462   SDVTList VTs = DAG.getVTList(Op.getValueType(), MVT::Glue);
463   SDValue Ops[] = {LHS, RHS, TargetCC, TrueV, FalseV};
464 
465   return DAG.getNode(BPFISD::SELECT_CC, DL, VTs, Ops);
466 }
467 
getTargetNodeName(unsigned Opcode) const468 const char *BPFTargetLowering::getTargetNodeName(unsigned Opcode) const {
469   switch ((BPFISD::NodeType)Opcode) {
470   case BPFISD::FIRST_NUMBER:
471     break;
472   case BPFISD::RET_FLAG:
473     return "BPFISD::RET_FLAG";
474   case BPFISD::CALL:
475     return "BPFISD::CALL";
476   case BPFISD::SELECT_CC:
477     return "BPFISD::SELECT_CC";
478   case BPFISD::BR_CC:
479     return "BPFISD::BR_CC";
480   case BPFISD::Wrapper:
481     return "BPFISD::Wrapper";
482   }
483   return nullptr;
484 }
485 
LowerGlobalAddress(SDValue Op,SelectionDAG & DAG) const486 SDValue BPFTargetLowering::LowerGlobalAddress(SDValue Op,
487                                               SelectionDAG &DAG) const {
488   SDLoc DL(Op);
489   const GlobalValue *GV = cast<GlobalAddressSDNode>(Op)->getGlobal();
490   SDValue GA = DAG.getTargetGlobalAddress(GV, DL, MVT::i64);
491 
492   return DAG.getNode(BPFISD::Wrapper, DL, MVT::i64, GA);
493 }
494 
495 MachineBasicBlock *
EmitInstrWithCustomInserter(MachineInstr & MI,MachineBasicBlock * BB) const496 BPFTargetLowering::EmitInstrWithCustomInserter(MachineInstr &MI,
497                                                MachineBasicBlock *BB) const {
498   const TargetInstrInfo &TII = *BB->getParent()->getSubtarget().getInstrInfo();
499   DebugLoc DL = MI.getDebugLoc();
500 
501   assert(MI.getOpcode() == BPF::Select && "Unexpected instr type to insert");
502 
503   // To "insert" a SELECT instruction, we actually have to insert the diamond
504   // control-flow pattern.  The incoming instruction knows the destination vreg
505   // to set, the condition code register to branch on, the true/false values to
506   // select between, and a branch opcode to use.
507   const BasicBlock *LLVM_BB = BB->getBasicBlock();
508   MachineFunction::iterator I = ++BB->getIterator();
509 
510   // ThisMBB:
511   // ...
512   //  TrueVal = ...
513   //  jmp_XX r1, r2 goto Copy1MBB
514   //  fallthrough --> Copy0MBB
515   MachineBasicBlock *ThisMBB = BB;
516   MachineFunction *F = BB->getParent();
517   MachineBasicBlock *Copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
518   MachineBasicBlock *Copy1MBB = F->CreateMachineBasicBlock(LLVM_BB);
519 
520   F->insert(I, Copy0MBB);
521   F->insert(I, Copy1MBB);
522   // Update machine-CFG edges by transferring all successors of the current
523   // block to the new block which will contain the Phi node for the select.
524   Copy1MBB->splice(Copy1MBB->begin(), BB,
525                    std::next(MachineBasicBlock::iterator(MI)), BB->end());
526   Copy1MBB->transferSuccessorsAndUpdatePHIs(BB);
527   // Next, add the true and fallthrough blocks as its successors.
528   BB->addSuccessor(Copy0MBB);
529   BB->addSuccessor(Copy1MBB);
530 
531   // Insert Branch if Flag
532   unsigned LHS = MI.getOperand(1).getReg();
533   unsigned RHS = MI.getOperand(2).getReg();
534   int CC = MI.getOperand(3).getImm();
535   switch (CC) {
536   case ISD::SETGT:
537     BuildMI(BB, DL, TII.get(BPF::JSGT_rr))
538         .addReg(LHS)
539         .addReg(RHS)
540         .addMBB(Copy1MBB);
541     break;
542   case ISD::SETUGT:
543     BuildMI(BB, DL, TII.get(BPF::JUGT_rr))
544         .addReg(LHS)
545         .addReg(RHS)
546         .addMBB(Copy1MBB);
547     break;
548   case ISD::SETGE:
549     BuildMI(BB, DL, TII.get(BPF::JSGE_rr))
550         .addReg(LHS)
551         .addReg(RHS)
552         .addMBB(Copy1MBB);
553     break;
554   case ISD::SETUGE:
555     BuildMI(BB, DL, TII.get(BPF::JUGE_rr))
556         .addReg(LHS)
557         .addReg(RHS)
558         .addMBB(Copy1MBB);
559     break;
560   case ISD::SETEQ:
561     BuildMI(BB, DL, TII.get(BPF::JEQ_rr))
562         .addReg(LHS)
563         .addReg(RHS)
564         .addMBB(Copy1MBB);
565     break;
566   case ISD::SETNE:
567     BuildMI(BB, DL, TII.get(BPF::JNE_rr))
568         .addReg(LHS)
569         .addReg(RHS)
570         .addMBB(Copy1MBB);
571     break;
572   default:
573     report_fatal_error("unimplemented select CondCode " + Twine(CC));
574   }
575 
576   // Copy0MBB:
577   //  %FalseValue = ...
578   //  # fallthrough to Copy1MBB
579   BB = Copy0MBB;
580 
581   // Update machine-CFG edges
582   BB->addSuccessor(Copy1MBB);
583 
584   // Copy1MBB:
585   //  %Result = phi [ %FalseValue, Copy0MBB ], [ %TrueValue, ThisMBB ]
586   // ...
587   BB = Copy1MBB;
588   BuildMI(*BB, BB->begin(), DL, TII.get(BPF::PHI), MI.getOperand(0).getReg())
589       .addReg(MI.getOperand(5).getReg())
590       .addMBB(Copy0MBB)
591       .addReg(MI.getOperand(4).getReg())
592       .addMBB(ThisMBB);
593 
594   MI.eraseFromParent(); // The pseudo instruction is gone now.
595   return BB;
596 }
597