• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===-- Mips16ISelLowering.h - Mips16 DAG Lowering Interface ----*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Subclass of MipsTargetLowering specialized for mips16.
10 //
11 //===----------------------------------------------------------------------===//
12 #include "Mips16ISelLowering.h"
13 #include "MCTargetDesc/MipsBaseInfo.h"
14 #include "Mips16HardFloatInfo.h"
15 #include "MipsMachineFunction.h"
16 #include "MipsRegisterInfo.h"
17 #include "MipsTargetMachine.h"
18 #include "llvm/CodeGen/MachineInstrBuilder.h"
19 #include "llvm/CodeGen/TargetInstrInfo.h"
20 #include "llvm/Support/CommandLine.h"
21 
22 using namespace llvm;
23 
24 #define DEBUG_TYPE "mips-lower"
25 
26 static cl::opt<bool> DontExpandCondPseudos16(
27   "mips16-dont-expand-cond-pseudo",
28   cl::init(false),
29   cl::desc("Don't expand conditional move related "
30            "pseudos for Mips 16"),
31   cl::Hidden);
32 
33 namespace {
34 struct Mips16Libcall {
35   RTLIB::Libcall Libcall;
36   const char *Name;
37 
operator <__anonfce114ab0111::Mips16Libcall38   bool operator<(const Mips16Libcall &RHS) const {
39     return std::strcmp(Name, RHS.Name) < 0;
40   }
41 };
42 
43 struct Mips16IntrinsicHelperType{
44   const char* Name;
45   const char* Helper;
46 
operator <__anonfce114ab0111::Mips16IntrinsicHelperType47   bool operator<(const Mips16IntrinsicHelperType &RHS) const {
48     return std::strcmp(Name, RHS.Name) < 0;
49   }
operator ==__anonfce114ab0111::Mips16IntrinsicHelperType50   bool operator==(const Mips16IntrinsicHelperType &RHS) const {
51     return std::strcmp(Name, RHS.Name) == 0;
52   }
53 };
54 }
55 
56 // Libcalls for which no helper is generated. Sorted by name for binary search.
57 static const Mips16Libcall HardFloatLibCalls[] = {
58   { RTLIB::ADD_F64, "__mips16_adddf3" },
59   { RTLIB::ADD_F32, "__mips16_addsf3" },
60   { RTLIB::DIV_F64, "__mips16_divdf3" },
61   { RTLIB::DIV_F32, "__mips16_divsf3" },
62   { RTLIB::OEQ_F64, "__mips16_eqdf2" },
63   { RTLIB::OEQ_F32, "__mips16_eqsf2" },
64   { RTLIB::FPEXT_F32_F64, "__mips16_extendsfdf2" },
65   { RTLIB::FPTOSINT_F64_I32, "__mips16_fix_truncdfsi" },
66   { RTLIB::FPTOSINT_F32_I32, "__mips16_fix_truncsfsi" },
67   { RTLIB::SINTTOFP_I32_F64, "__mips16_floatsidf" },
68   { RTLIB::SINTTOFP_I32_F32, "__mips16_floatsisf" },
69   { RTLIB::UINTTOFP_I32_F64, "__mips16_floatunsidf" },
70   { RTLIB::UINTTOFP_I32_F32, "__mips16_floatunsisf" },
71   { RTLIB::OGE_F64, "__mips16_gedf2" },
72   { RTLIB::OGE_F32, "__mips16_gesf2" },
73   { RTLIB::OGT_F64, "__mips16_gtdf2" },
74   { RTLIB::OGT_F32, "__mips16_gtsf2" },
75   { RTLIB::OLE_F64, "__mips16_ledf2" },
76   { RTLIB::OLE_F32, "__mips16_lesf2" },
77   { RTLIB::OLT_F64, "__mips16_ltdf2" },
78   { RTLIB::OLT_F32, "__mips16_ltsf2" },
79   { RTLIB::MUL_F64, "__mips16_muldf3" },
80   { RTLIB::MUL_F32, "__mips16_mulsf3" },
81   { RTLIB::UNE_F64, "__mips16_nedf2" },
82   { RTLIB::UNE_F32, "__mips16_nesf2" },
83   { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_dc" }, // No associated libcall.
84   { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_df" }, // No associated libcall.
85   { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_sc" }, // No associated libcall.
86   { RTLIB::UNKNOWN_LIBCALL, "__mips16_ret_sf" }, // No associated libcall.
87   { RTLIB::SUB_F64, "__mips16_subdf3" },
88   { RTLIB::SUB_F32, "__mips16_subsf3" },
89   { RTLIB::FPROUND_F64_F32, "__mips16_truncdfsf2" },
90   { RTLIB::UO_F64, "__mips16_unorddf2" },
91   { RTLIB::UO_F32, "__mips16_unordsf2" }
92 };
93 
94 static const Mips16IntrinsicHelperType Mips16IntrinsicHelper[] = {
95   {"__fixunsdfsi", "__mips16_call_stub_2" },
96   {"ceil",  "__mips16_call_stub_df_2"},
97   {"ceilf", "__mips16_call_stub_sf_1"},
98   {"copysign",  "__mips16_call_stub_df_10"},
99   {"copysignf", "__mips16_call_stub_sf_5"},
100   {"cos",  "__mips16_call_stub_df_2"},
101   {"cosf", "__mips16_call_stub_sf_1"},
102   {"exp2",  "__mips16_call_stub_df_2"},
103   {"exp2f", "__mips16_call_stub_sf_1"},
104   {"floor",  "__mips16_call_stub_df_2"},
105   {"floorf", "__mips16_call_stub_sf_1"},
106   {"log2",  "__mips16_call_stub_df_2"},
107   {"log2f", "__mips16_call_stub_sf_1"},
108   {"nearbyint",  "__mips16_call_stub_df_2"},
109   {"nearbyintf", "__mips16_call_stub_sf_1"},
110   {"rint",  "__mips16_call_stub_df_2"},
111   {"rintf", "__mips16_call_stub_sf_1"},
112   {"sin",  "__mips16_call_stub_df_2"},
113   {"sinf", "__mips16_call_stub_sf_1"},
114   {"sqrt",  "__mips16_call_stub_df_2"},
115   {"sqrtf", "__mips16_call_stub_sf_1"},
116   {"trunc",  "__mips16_call_stub_df_2"},
117   {"truncf", "__mips16_call_stub_sf_1"},
118 };
119 
Mips16TargetLowering(const MipsTargetMachine & TM,const MipsSubtarget & STI)120 Mips16TargetLowering::Mips16TargetLowering(const MipsTargetMachine &TM,
121                                            const MipsSubtarget &STI)
122     : MipsTargetLowering(TM, STI) {
123 
124   // Set up the register classes
125   addRegisterClass(MVT::i32, &Mips::CPU16RegsRegClass);
126 
127   if (!Subtarget.useSoftFloat())
128     setMips16HardFloatLibCalls();
129 
130   setOperationAction(ISD::ATOMIC_FENCE,       MVT::Other, Expand);
131   setOperationAction(ISD::ATOMIC_CMP_SWAP,    MVT::i32,   Expand);
132   setOperationAction(ISD::ATOMIC_SWAP,        MVT::i32,   Expand);
133   setOperationAction(ISD::ATOMIC_LOAD_ADD,    MVT::i32,   Expand);
134   setOperationAction(ISD::ATOMIC_LOAD_SUB,    MVT::i32,   Expand);
135   setOperationAction(ISD::ATOMIC_LOAD_AND,    MVT::i32,   Expand);
136   setOperationAction(ISD::ATOMIC_LOAD_OR,     MVT::i32,   Expand);
137   setOperationAction(ISD::ATOMIC_LOAD_XOR,    MVT::i32,   Expand);
138   setOperationAction(ISD::ATOMIC_LOAD_NAND,   MVT::i32,   Expand);
139   setOperationAction(ISD::ATOMIC_LOAD_MIN,    MVT::i32,   Expand);
140   setOperationAction(ISD::ATOMIC_LOAD_MAX,    MVT::i32,   Expand);
141   setOperationAction(ISD::ATOMIC_LOAD_UMIN,   MVT::i32,   Expand);
142   setOperationAction(ISD::ATOMIC_LOAD_UMAX,   MVT::i32,   Expand);
143 
144   setOperationAction(ISD::ROTR, MVT::i32,  Expand);
145   setOperationAction(ISD::ROTR, MVT::i64,  Expand);
146   setOperationAction(ISD::BSWAP, MVT::i32, Expand);
147   setOperationAction(ISD::BSWAP, MVT::i64, Expand);
148 
149   computeRegisterProperties(STI.getRegisterInfo());
150 }
151 
152 const MipsTargetLowering *
createMips16TargetLowering(const MipsTargetMachine & TM,const MipsSubtarget & STI)153 llvm::createMips16TargetLowering(const MipsTargetMachine &TM,
154                                  const MipsSubtarget &STI) {
155   return new Mips16TargetLowering(TM, STI);
156 }
157 
allowsMisalignedMemoryAccesses(EVT VT,unsigned,unsigned,MachineMemOperand::Flags,bool * Fast) const158 bool Mips16TargetLowering::allowsMisalignedMemoryAccesses(
159     EVT VT, unsigned, unsigned, MachineMemOperand::Flags, bool *Fast) const {
160   return false;
161 }
162 
163 MachineBasicBlock *
EmitInstrWithCustomInserter(MachineInstr & MI,MachineBasicBlock * BB) const164 Mips16TargetLowering::EmitInstrWithCustomInserter(MachineInstr &MI,
165                                                   MachineBasicBlock *BB) const {
166   switch (MI.getOpcode()) {
167   default:
168     return MipsTargetLowering::EmitInstrWithCustomInserter(MI, BB);
169   case Mips::SelBeqZ:
170     return emitSel16(Mips::BeqzRxImm16, MI, BB);
171   case Mips::SelBneZ:
172     return emitSel16(Mips::BnezRxImm16, MI, BB);
173   case Mips::SelTBteqZCmpi:
174     return emitSeliT16(Mips::Bteqz16, Mips::CmpiRxImmX16, MI, BB);
175   case Mips::SelTBteqZSlti:
176     return emitSeliT16(Mips::Bteqz16, Mips::SltiRxImmX16, MI, BB);
177   case Mips::SelTBteqZSltiu:
178     return emitSeliT16(Mips::Bteqz16, Mips::SltiuRxImmX16, MI, BB);
179   case Mips::SelTBtneZCmpi:
180     return emitSeliT16(Mips::Btnez16, Mips::CmpiRxImmX16, MI, BB);
181   case Mips::SelTBtneZSlti:
182     return emitSeliT16(Mips::Btnez16, Mips::SltiRxImmX16, MI, BB);
183   case Mips::SelTBtneZSltiu:
184     return emitSeliT16(Mips::Btnez16, Mips::SltiuRxImmX16, MI, BB);
185   case Mips::SelTBteqZCmp:
186     return emitSelT16(Mips::Bteqz16, Mips::CmpRxRy16, MI, BB);
187   case Mips::SelTBteqZSlt:
188     return emitSelT16(Mips::Bteqz16, Mips::SltRxRy16, MI, BB);
189   case Mips::SelTBteqZSltu:
190     return emitSelT16(Mips::Bteqz16, Mips::SltuRxRy16, MI, BB);
191   case Mips::SelTBtneZCmp:
192     return emitSelT16(Mips::Btnez16, Mips::CmpRxRy16, MI, BB);
193   case Mips::SelTBtneZSlt:
194     return emitSelT16(Mips::Btnez16, Mips::SltRxRy16, MI, BB);
195   case Mips::SelTBtneZSltu:
196     return emitSelT16(Mips::Btnez16, Mips::SltuRxRy16, MI, BB);
197   case Mips::BteqzT8CmpX16:
198     return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::CmpRxRy16, MI, BB);
199   case Mips::BteqzT8SltX16:
200     return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::SltRxRy16, MI, BB);
201   case Mips::BteqzT8SltuX16:
202     // TBD: figure out a way to get this or remove the instruction
203     // altogether.
204     return emitFEXT_T8I816_ins(Mips::Bteqz16, Mips::SltuRxRy16, MI, BB);
205   case Mips::BtnezT8CmpX16:
206     return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::CmpRxRy16, MI, BB);
207   case Mips::BtnezT8SltX16:
208     return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::SltRxRy16, MI, BB);
209   case Mips::BtnezT8SltuX16:
210     // TBD: figure out a way to get this or remove the instruction
211     // altogether.
212     return emitFEXT_T8I816_ins(Mips::Btnez16, Mips::SltuRxRy16, MI, BB);
213   case Mips::BteqzT8CmpiX16: return emitFEXT_T8I8I16_ins(
214     Mips::Bteqz16, Mips::CmpiRxImm16, Mips::CmpiRxImmX16, false, MI, BB);
215   case Mips::BteqzT8SltiX16: return emitFEXT_T8I8I16_ins(
216     Mips::Bteqz16, Mips::SltiRxImm16, Mips::SltiRxImmX16, true, MI, BB);
217   case Mips::BteqzT8SltiuX16: return emitFEXT_T8I8I16_ins(
218     Mips::Bteqz16, Mips::SltiuRxImm16, Mips::SltiuRxImmX16, false, MI, BB);
219   case Mips::BtnezT8CmpiX16: return emitFEXT_T8I8I16_ins(
220     Mips::Btnez16, Mips::CmpiRxImm16, Mips::CmpiRxImmX16, false, MI, BB);
221   case Mips::BtnezT8SltiX16: return emitFEXT_T8I8I16_ins(
222     Mips::Btnez16, Mips::SltiRxImm16, Mips::SltiRxImmX16, true, MI, BB);
223   case Mips::BtnezT8SltiuX16: return emitFEXT_T8I8I16_ins(
224     Mips::Btnez16, Mips::SltiuRxImm16, Mips::SltiuRxImmX16, false, MI, BB);
225     break;
226   case Mips::SltCCRxRy16:
227     return emitFEXT_CCRX16_ins(Mips::SltRxRy16, MI, BB);
228     break;
229   case Mips::SltiCCRxImmX16:
230     return emitFEXT_CCRXI16_ins
231       (Mips::SltiRxImm16, Mips::SltiRxImmX16, MI, BB);
232   case Mips::SltiuCCRxImmX16:
233     return emitFEXT_CCRXI16_ins
234       (Mips::SltiuRxImm16, Mips::SltiuRxImmX16, MI, BB);
235   case Mips::SltuCCRxRy16:
236     return emitFEXT_CCRX16_ins
237       (Mips::SltuRxRy16, MI, BB);
238   }
239 }
240 
isEligibleForTailCallOptimization(const CCState & CCInfo,unsigned NextStackOffset,const MipsFunctionInfo & FI) const241 bool Mips16TargetLowering::isEligibleForTailCallOptimization(
242     const CCState &CCInfo, unsigned NextStackOffset,
243     const MipsFunctionInfo &FI) const {
244   // No tail call optimization for mips16.
245   return false;
246 }
247 
setMips16HardFloatLibCalls()248 void Mips16TargetLowering::setMips16HardFloatLibCalls() {
249   for (unsigned I = 0; I != array_lengthof(HardFloatLibCalls); ++I) {
250     assert((I == 0 || HardFloatLibCalls[I - 1] < HardFloatLibCalls[I]) &&
251            "Array not sorted!");
252     if (HardFloatLibCalls[I].Libcall != RTLIB::UNKNOWN_LIBCALL)
253       setLibcallName(HardFloatLibCalls[I].Libcall, HardFloatLibCalls[I].Name);
254   }
255 }
256 
257 //
258 // The Mips16 hard float is a crazy quilt inherited from gcc. I have a much
259 // cleaner way to do all of this but it will have to wait until the traditional
260 // gcc mechanism is completed.
261 //
262 // For Pic, in order for Mips16 code to call Mips32 code which according the abi
263 // have either arguments or returned values placed in floating point registers,
264 // we use a set of helper functions. (This includes functions which return type
265 //  complex which on Mips are returned in a pair of floating point registers).
266 //
267 // This is an encoding that we inherited from gcc.
268 // In Mips traditional O32, N32 ABI, floating point numbers are passed in
269 // floating point argument registers 1,2 only when the first and optionally
270 // the second arguments are float (sf) or double (df).
271 // For Mips16 we are only concerned with the situations where floating point
272 // arguments are being passed in floating point registers by the ABI, because
273 // Mips16 mode code cannot execute floating point instructions to load those
274 // values and hence helper functions are needed.
275 // The possibilities are (), (sf), (sf, sf), (sf, df), (df), (df, sf), (df, df)
276 // the helper function suffixs for these are:
277 //                        0,  1,    5,        9,         2,   6,        10
278 // this suffix can then be calculated as follows:
279 // for a given argument Arg:
280 //     Arg1x, Arg2x = 1 :  Arg is sf
281 //                    2 :  Arg is df
282 //                    0:   Arg is neither sf or df
283 // So this stub is the string for number Arg1x + Arg2x*4.
284 // However not all numbers between 0 and 10 are possible, we check anyway and
285 // assert if the impossible exists.
286 //
287 
getMips16HelperFunctionStubNumber(ArgListTy & Args) const288 unsigned int Mips16TargetLowering::getMips16HelperFunctionStubNumber
289   (ArgListTy &Args) const {
290   unsigned int resultNum = 0;
291   if (Args.size() >= 1) {
292     Type *t = Args[0].Ty;
293     if (t->isFloatTy()) {
294       resultNum = 1;
295     }
296     else if (t->isDoubleTy()) {
297       resultNum = 2;
298     }
299   }
300   if (resultNum) {
301     if (Args.size() >=2) {
302       Type *t = Args[1].Ty;
303       if (t->isFloatTy()) {
304         resultNum += 4;
305       }
306       else if (t->isDoubleTy()) {
307         resultNum += 8;
308       }
309     }
310   }
311   return resultNum;
312 }
313 
314 //
315 // Prefixes are attached to stub numbers depending on the return type.
316 // return type: float  sf_
317 //              double df_
318 //              single complex sc_
319 //              double complext dc_
320 //              others  NO PREFIX
321 //
322 //
323 // The full name of a helper function is__mips16_call_stub +
324 //    return type dependent prefix + stub number
325 //
326 // FIXME: This is something that probably should be in a different source file
327 // and perhaps done differently but my main purpose is to not waste runtime
328 // on something that we can enumerate in the source. Another possibility is
329 // to have a python script to generate these mapping tables. This will do
330 // for now. There are a whole series of helper function mapping arrays, one
331 // for each return type class as outlined above. There there are 11 possible
332 // entries. Ones with 0 are ones which should never be selected.
333 //
334 // All the arrays are similar except for ones which return neither
335 // sf, df, sc, dc, in which we only care about ones which have sf or df as a
336 // first parameter.
337 //
338 #define P_ "__mips16_call_stub_"
339 #define MAX_STUB_NUMBER 10
340 #define T1 P "1", P "2", 0, 0, P "5", P "6", 0, 0, P "9", P "10"
341 #define T P "0" , T1
342 #define P P_
343 static char const * vMips16Helper[MAX_STUB_NUMBER+1] =
344   {nullptr, T1 };
345 #undef P
346 #define P P_ "sf_"
347 static char const * sfMips16Helper[MAX_STUB_NUMBER+1] =
348   { T };
349 #undef P
350 #define P P_ "df_"
351 static char const * dfMips16Helper[MAX_STUB_NUMBER+1] =
352   { T };
353 #undef P
354 #define P P_ "sc_"
355 static char const * scMips16Helper[MAX_STUB_NUMBER+1] =
356   { T };
357 #undef P
358 #define P P_ "dc_"
359 static char const * dcMips16Helper[MAX_STUB_NUMBER+1] =
360   { T };
361 #undef P
362 #undef P_
363 
364 
365 const char* Mips16TargetLowering::
getMips16HelperFunction(Type * RetTy,ArgListTy & Args,bool & needHelper) const366   getMips16HelperFunction
367     (Type* RetTy, ArgListTy &Args, bool &needHelper) const {
368   const unsigned int stubNum = getMips16HelperFunctionStubNumber(Args);
369 #ifndef NDEBUG
370   const unsigned int maxStubNum = 10;
371   assert(stubNum <= maxStubNum);
372   const bool validStubNum[maxStubNum+1] =
373     {true, true, true, false, false, true, true, false, false, true, true};
374   assert(validStubNum[stubNum]);
375 #endif
376   const char *result;
377   if (RetTy->isFloatTy()) {
378     result = sfMips16Helper[stubNum];
379   }
380   else if (RetTy ->isDoubleTy()) {
381     result = dfMips16Helper[stubNum];
382   } else if (StructType *SRetTy = dyn_cast<StructType>(RetTy)) {
383     // check if it's complex
384     if (SRetTy->getNumElements() == 2) {
385       if ((SRetTy->getElementType(0)->isFloatTy()) &&
386           (SRetTy->getElementType(1)->isFloatTy())) {
387         result = scMips16Helper[stubNum];
388       } else if ((SRetTy->getElementType(0)->isDoubleTy()) &&
389                  (SRetTy->getElementType(1)->isDoubleTy())) {
390         result = dcMips16Helper[stubNum];
391       } else {
392         llvm_unreachable("Uncovered condition");
393       }
394     } else {
395       llvm_unreachable("Uncovered condition");
396     }
397   } else {
398     if (stubNum == 0) {
399       needHelper = false;
400       return "";
401     }
402     result = vMips16Helper[stubNum];
403   }
404   needHelper = true;
405   return result;
406 }
407 
408 void Mips16TargetLowering::
getOpndList(SmallVectorImpl<SDValue> & Ops,std::deque<std::pair<unsigned,SDValue>> & RegsToPass,bool IsPICCall,bool GlobalOrExternal,bool InternalLinkage,bool IsCallReloc,CallLoweringInfo & CLI,SDValue Callee,SDValue Chain) const409 getOpndList(SmallVectorImpl<SDValue> &Ops,
410             std::deque< std::pair<unsigned, SDValue> > &RegsToPass,
411             bool IsPICCall, bool GlobalOrExternal, bool InternalLinkage,
412             bool IsCallReloc, CallLoweringInfo &CLI, SDValue Callee,
413             SDValue Chain) const {
414   SelectionDAG &DAG = CLI.DAG;
415   MachineFunction &MF = DAG.getMachineFunction();
416   MipsFunctionInfo *FuncInfo = MF.getInfo<MipsFunctionInfo>();
417   const char* Mips16HelperFunction = nullptr;
418   bool NeedMips16Helper = false;
419 
420   if (Subtarget.inMips16HardFloat()) {
421     //
422     // currently we don't have symbols tagged with the mips16 or mips32
423     // qualifier so we will assume that we don't know what kind it is.
424     // and generate the helper
425     //
426     bool LookupHelper = true;
427     if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(CLI.Callee)) {
428       Mips16Libcall Find = { RTLIB::UNKNOWN_LIBCALL, S->getSymbol() };
429 
430       if (std::binary_search(std::begin(HardFloatLibCalls),
431                              std::end(HardFloatLibCalls), Find))
432         LookupHelper = false;
433       else {
434         const char *Symbol = S->getSymbol();
435         Mips16IntrinsicHelperType IntrinsicFind = { Symbol, "" };
436         const Mips16HardFloatInfo::FuncSignature *Signature =
437             Mips16HardFloatInfo::findFuncSignature(Symbol);
438         if (!IsPICCall && (Signature && (FuncInfo->StubsNeeded.find(Symbol) ==
439                                          FuncInfo->StubsNeeded.end()))) {
440           FuncInfo->StubsNeeded[Symbol] = Signature;
441           //
442           // S2 is normally saved if the stub is for a function which
443           // returns a float or double value and is not otherwise. This is
444           // because more work is required after the function the stub
445           // is calling completes, and so the stub cannot directly return
446           // and the stub has no stack space to store the return address so
447           // S2 is used for that purpose.
448           // In order to take advantage of not saving S2, we need to also
449           // optimize the call in the stub and this requires some further
450           // functionality in MipsAsmPrinter which we don't have yet.
451           // So for now we always save S2. The optimization will be done
452           // in a follow-on patch.
453           //
454           if (1 || (Signature->RetSig != Mips16HardFloatInfo::NoFPRet))
455             FuncInfo->setSaveS2();
456         }
457         // one more look at list of intrinsics
458         const Mips16IntrinsicHelperType *Helper =
459             llvm::lower_bound(Mips16IntrinsicHelper, IntrinsicFind);
460         if (Helper != std::end(Mips16IntrinsicHelper) &&
461             *Helper == IntrinsicFind) {
462           Mips16HelperFunction = Helper->Helper;
463           NeedMips16Helper = true;
464           LookupHelper = false;
465         }
466 
467       }
468     } else if (GlobalAddressSDNode *G =
469                    dyn_cast<GlobalAddressSDNode>(CLI.Callee)) {
470       Mips16Libcall Find = { RTLIB::UNKNOWN_LIBCALL,
471                              G->getGlobal()->getName().data() };
472 
473       if (std::binary_search(std::begin(HardFloatLibCalls),
474                              std::end(HardFloatLibCalls), Find))
475         LookupHelper = false;
476     }
477     if (LookupHelper)
478       Mips16HelperFunction =
479         getMips16HelperFunction(CLI.RetTy, CLI.getArgs(), NeedMips16Helper);
480   }
481 
482   SDValue JumpTarget = Callee;
483 
484   // T9 should contain the address of the callee function if
485   // -relocation-model=pic or it is an indirect call.
486   if (IsPICCall || !GlobalOrExternal) {
487     unsigned V0Reg = Mips::V0;
488     if (NeedMips16Helper) {
489       RegsToPass.push_front(std::make_pair(V0Reg, Callee));
490       JumpTarget = DAG.getExternalSymbol(Mips16HelperFunction,
491                                          getPointerTy(DAG.getDataLayout()));
492       ExternalSymbolSDNode *S = cast<ExternalSymbolSDNode>(JumpTarget);
493       JumpTarget = getAddrGlobal(S, CLI.DL, JumpTarget.getValueType(), DAG,
494                                  MipsII::MO_GOT, Chain,
495                                  FuncInfo->callPtrInfo(S->getSymbol()));
496     } else
497       RegsToPass.push_front(std::make_pair((unsigned)Mips::T9, Callee));
498   }
499 
500   Ops.push_back(JumpTarget);
501 
502   MipsTargetLowering::getOpndList(Ops, RegsToPass, IsPICCall, GlobalOrExternal,
503                                   InternalLinkage, IsCallReloc, CLI, Callee,
504                                   Chain);
505 }
506 
507 MachineBasicBlock *
emitSel16(unsigned Opc,MachineInstr & MI,MachineBasicBlock * BB) const508 Mips16TargetLowering::emitSel16(unsigned Opc, MachineInstr &MI,
509                                 MachineBasicBlock *BB) const {
510   if (DontExpandCondPseudos16)
511     return BB;
512   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
513   DebugLoc DL = MI.getDebugLoc();
514   // To "insert" a SELECT_CC instruction, we actually have to insert the
515   // diamond control-flow pattern.  The incoming instruction knows the
516   // destination vreg to set, the condition code register to branch on, the
517   // true/false values to select between, and a branch opcode to use.
518   const BasicBlock *LLVM_BB = BB->getBasicBlock();
519   MachineFunction::iterator It = ++BB->getIterator();
520 
521   //  thisMBB:
522   //  ...
523   //   TrueVal = ...
524   //   setcc r1, r2, r3
525   //   bNE   r1, r0, copy1MBB
526   //   fallthrough --> copy0MBB
527   MachineBasicBlock *thisMBB  = BB;
528   MachineFunction *F = BB->getParent();
529   MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
530   MachineBasicBlock *sinkMBB  = F->CreateMachineBasicBlock(LLVM_BB);
531   F->insert(It, copy0MBB);
532   F->insert(It, sinkMBB);
533 
534   // Transfer the remainder of BB and its successor edges to sinkMBB.
535   sinkMBB->splice(sinkMBB->begin(), BB,
536                   std::next(MachineBasicBlock::iterator(MI)), BB->end());
537   sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
538 
539   // Next, add the true and fallthrough blocks as its successors.
540   BB->addSuccessor(copy0MBB);
541   BB->addSuccessor(sinkMBB);
542 
543   BuildMI(BB, DL, TII->get(Opc))
544       .addReg(MI.getOperand(3).getReg())
545       .addMBB(sinkMBB);
546 
547   //  copy0MBB:
548   //   %FalseValue = ...
549   //   # fallthrough to sinkMBB
550   BB = copy0MBB;
551 
552   // Update machine-CFG edges
553   BB->addSuccessor(sinkMBB);
554 
555   //  sinkMBB:
556   //   %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
557   //  ...
558   BB = sinkMBB;
559 
560   BuildMI(*BB, BB->begin(), DL, TII->get(Mips::PHI), MI.getOperand(0).getReg())
561       .addReg(MI.getOperand(1).getReg())
562       .addMBB(thisMBB)
563       .addReg(MI.getOperand(2).getReg())
564       .addMBB(copy0MBB);
565 
566   MI.eraseFromParent(); // The pseudo instruction is gone now.
567   return BB;
568 }
569 
570 MachineBasicBlock *
emitSelT16(unsigned Opc1,unsigned Opc2,MachineInstr & MI,MachineBasicBlock * BB) const571 Mips16TargetLowering::emitSelT16(unsigned Opc1, unsigned Opc2, MachineInstr &MI,
572                                  MachineBasicBlock *BB) const {
573   if (DontExpandCondPseudos16)
574     return BB;
575   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
576   DebugLoc DL = MI.getDebugLoc();
577   // To "insert" a SELECT_CC instruction, we actually have to insert the
578   // diamond control-flow pattern.  The incoming instruction knows the
579   // destination vreg to set, the condition code register to branch on, the
580   // true/false values to select between, and a branch opcode to use.
581   const BasicBlock *LLVM_BB = BB->getBasicBlock();
582   MachineFunction::iterator It = ++BB->getIterator();
583 
584   //  thisMBB:
585   //  ...
586   //   TrueVal = ...
587   //   setcc r1, r2, r3
588   //   bNE   r1, r0, copy1MBB
589   //   fallthrough --> copy0MBB
590   MachineBasicBlock *thisMBB  = BB;
591   MachineFunction *F = BB->getParent();
592   MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
593   MachineBasicBlock *sinkMBB  = F->CreateMachineBasicBlock(LLVM_BB);
594   F->insert(It, copy0MBB);
595   F->insert(It, sinkMBB);
596 
597   // Transfer the remainder of BB and its successor edges to sinkMBB.
598   sinkMBB->splice(sinkMBB->begin(), BB,
599                   std::next(MachineBasicBlock::iterator(MI)), BB->end());
600   sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
601 
602   // Next, add the true and fallthrough blocks as its successors.
603   BB->addSuccessor(copy0MBB);
604   BB->addSuccessor(sinkMBB);
605 
606   BuildMI(BB, DL, TII->get(Opc2))
607       .addReg(MI.getOperand(3).getReg())
608       .addReg(MI.getOperand(4).getReg());
609   BuildMI(BB, DL, TII->get(Opc1)).addMBB(sinkMBB);
610 
611   //  copy0MBB:
612   //   %FalseValue = ...
613   //   # fallthrough to sinkMBB
614   BB = copy0MBB;
615 
616   // Update machine-CFG edges
617   BB->addSuccessor(sinkMBB);
618 
619   //  sinkMBB:
620   //   %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
621   //  ...
622   BB = sinkMBB;
623 
624   BuildMI(*BB, BB->begin(), DL, TII->get(Mips::PHI), MI.getOperand(0).getReg())
625       .addReg(MI.getOperand(1).getReg())
626       .addMBB(thisMBB)
627       .addReg(MI.getOperand(2).getReg())
628       .addMBB(copy0MBB);
629 
630   MI.eraseFromParent(); // The pseudo instruction is gone now.
631   return BB;
632 
633 }
634 
635 MachineBasicBlock *
emitSeliT16(unsigned Opc1,unsigned Opc2,MachineInstr & MI,MachineBasicBlock * BB) const636 Mips16TargetLowering::emitSeliT16(unsigned Opc1, unsigned Opc2,
637                                   MachineInstr &MI,
638                                   MachineBasicBlock *BB) const {
639   if (DontExpandCondPseudos16)
640     return BB;
641   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
642   DebugLoc DL = MI.getDebugLoc();
643   // To "insert" a SELECT_CC instruction, we actually have to insert the
644   // diamond control-flow pattern.  The incoming instruction knows the
645   // destination vreg to set, the condition code register to branch on, the
646   // true/false values to select between, and a branch opcode to use.
647   const BasicBlock *LLVM_BB = BB->getBasicBlock();
648   MachineFunction::iterator It = ++BB->getIterator();
649 
650   //  thisMBB:
651   //  ...
652   //   TrueVal = ...
653   //   setcc r1, r2, r3
654   //   bNE   r1, r0, copy1MBB
655   //   fallthrough --> copy0MBB
656   MachineBasicBlock *thisMBB  = BB;
657   MachineFunction *F = BB->getParent();
658   MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
659   MachineBasicBlock *sinkMBB  = F->CreateMachineBasicBlock(LLVM_BB);
660   F->insert(It, copy0MBB);
661   F->insert(It, sinkMBB);
662 
663   // Transfer the remainder of BB and its successor edges to sinkMBB.
664   sinkMBB->splice(sinkMBB->begin(), BB,
665                   std::next(MachineBasicBlock::iterator(MI)), BB->end());
666   sinkMBB->transferSuccessorsAndUpdatePHIs(BB);
667 
668   // Next, add the true and fallthrough blocks as its successors.
669   BB->addSuccessor(copy0MBB);
670   BB->addSuccessor(sinkMBB);
671 
672   BuildMI(BB, DL, TII->get(Opc2))
673       .addReg(MI.getOperand(3).getReg())
674       .addImm(MI.getOperand(4).getImm());
675   BuildMI(BB, DL, TII->get(Opc1)).addMBB(sinkMBB);
676 
677   //  copy0MBB:
678   //   %FalseValue = ...
679   //   # fallthrough to sinkMBB
680   BB = copy0MBB;
681 
682   // Update machine-CFG edges
683   BB->addSuccessor(sinkMBB);
684 
685   //  sinkMBB:
686   //   %Result = phi [ %TrueValue, thisMBB ], [ %FalseValue, copy0MBB ]
687   //  ...
688   BB = sinkMBB;
689 
690   BuildMI(*BB, BB->begin(), DL, TII->get(Mips::PHI), MI.getOperand(0).getReg())
691       .addReg(MI.getOperand(1).getReg())
692       .addMBB(thisMBB)
693       .addReg(MI.getOperand(2).getReg())
694       .addMBB(copy0MBB);
695 
696   MI.eraseFromParent(); // The pseudo instruction is gone now.
697   return BB;
698 
699 }
700 
701 MachineBasicBlock *
emitFEXT_T8I816_ins(unsigned BtOpc,unsigned CmpOpc,MachineInstr & MI,MachineBasicBlock * BB) const702 Mips16TargetLowering::emitFEXT_T8I816_ins(unsigned BtOpc, unsigned CmpOpc,
703                                           MachineInstr &MI,
704                                           MachineBasicBlock *BB) const {
705   if (DontExpandCondPseudos16)
706     return BB;
707   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
708   Register regX = MI.getOperand(0).getReg();
709   Register regY = MI.getOperand(1).getReg();
710   MachineBasicBlock *target = MI.getOperand(2).getMBB();
711   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(CmpOpc))
712       .addReg(regX)
713       .addReg(regY);
714   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(BtOpc)).addMBB(target);
715   MI.eraseFromParent(); // The pseudo instruction is gone now.
716   return BB;
717 }
718 
emitFEXT_T8I8I16_ins(unsigned BtOpc,unsigned CmpiOpc,unsigned CmpiXOpc,bool ImmSigned,MachineInstr & MI,MachineBasicBlock * BB) const719 MachineBasicBlock *Mips16TargetLowering::emitFEXT_T8I8I16_ins(
720     unsigned BtOpc, unsigned CmpiOpc, unsigned CmpiXOpc, bool ImmSigned,
721     MachineInstr &MI, MachineBasicBlock *BB) const {
722   if (DontExpandCondPseudos16)
723     return BB;
724   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
725   Register regX = MI.getOperand(0).getReg();
726   int64_t imm = MI.getOperand(1).getImm();
727   MachineBasicBlock *target = MI.getOperand(2).getMBB();
728   unsigned CmpOpc;
729   if (isUInt<8>(imm))
730     CmpOpc = CmpiOpc;
731   else if ((!ImmSigned && isUInt<16>(imm)) ||
732            (ImmSigned && isInt<16>(imm)))
733     CmpOpc = CmpiXOpc;
734   else
735     llvm_unreachable("immediate field not usable");
736   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(CmpOpc)).addReg(regX).addImm(imm);
737   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(BtOpc)).addMBB(target);
738   MI.eraseFromParent(); // The pseudo instruction is gone now.
739   return BB;
740 }
741 
Mips16WhichOp8uOr16simm(unsigned shortOp,unsigned longOp,int64_t Imm)742 static unsigned Mips16WhichOp8uOr16simm
743   (unsigned shortOp, unsigned longOp, int64_t Imm) {
744   if (isUInt<8>(Imm))
745     return shortOp;
746   else if (isInt<16>(Imm))
747     return longOp;
748   else
749     llvm_unreachable("immediate field not usable");
750 }
751 
752 MachineBasicBlock *
emitFEXT_CCRX16_ins(unsigned SltOpc,MachineInstr & MI,MachineBasicBlock * BB) const753 Mips16TargetLowering::emitFEXT_CCRX16_ins(unsigned SltOpc, MachineInstr &MI,
754                                           MachineBasicBlock *BB) const {
755   if (DontExpandCondPseudos16)
756     return BB;
757   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
758   Register CC = MI.getOperand(0).getReg();
759   Register regX = MI.getOperand(1).getReg();
760   Register regY = MI.getOperand(2).getReg();
761   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(SltOpc))
762       .addReg(regX)
763       .addReg(regY);
764   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(Mips::MoveR3216), CC)
765       .addReg(Mips::T8);
766   MI.eraseFromParent(); // The pseudo instruction is gone now.
767   return BB;
768 }
769 
770 MachineBasicBlock *
emitFEXT_CCRXI16_ins(unsigned SltiOpc,unsigned SltiXOpc,MachineInstr & MI,MachineBasicBlock * BB) const771 Mips16TargetLowering::emitFEXT_CCRXI16_ins(unsigned SltiOpc, unsigned SltiXOpc,
772                                            MachineInstr &MI,
773                                            MachineBasicBlock *BB) const {
774   if (DontExpandCondPseudos16)
775     return BB;
776   const TargetInstrInfo *TII = Subtarget.getInstrInfo();
777   Register CC = MI.getOperand(0).getReg();
778   Register regX = MI.getOperand(1).getReg();
779   int64_t Imm = MI.getOperand(2).getImm();
780   unsigned SltOpc = Mips16WhichOp8uOr16simm(SltiOpc, SltiXOpc, Imm);
781   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(SltOpc)).addReg(regX).addImm(Imm);
782   BuildMI(*BB, MI, MI.getDebugLoc(), TII->get(Mips::MoveR3216), CC)
783       .addReg(Mips::T8);
784   MI.eraseFromParent(); // The pseudo instruction is gone now.
785   return BB;
786 
787 }
788