• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===------- HexagonCopyToCombine.cpp - Hexagon Copy-To-Combine Pass ------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 // This pass replaces transfer instructions by combine instructions.
10 // We walk along a basic block and look for two combinable instructions and try
11 // to move them together. If we can move them next to each other we do so and
12 // replace them with a combine instruction.
13 //===----------------------------------------------------------------------===//
14 #include "llvm/PassSupport.h"
15 #include "Hexagon.h"
16 #include "HexagonInstrInfo.h"
17 #include "HexagonMachineFunctionInfo.h"
18 #include "HexagonRegisterInfo.h"
19 #include "HexagonSubtarget.h"
20 #include "HexagonTargetMachine.h"
21 #include "llvm/ADT/DenseMap.h"
22 #include "llvm/ADT/DenseSet.h"
23 #include "llvm/CodeGen/MachineBasicBlock.h"
24 #include "llvm/CodeGen/MachineFunction.h"
25 #include "llvm/CodeGen/MachineFunctionPass.h"
26 #include "llvm/CodeGen/MachineInstr.h"
27 #include "llvm/CodeGen/MachineInstrBuilder.h"
28 #include "llvm/CodeGen/Passes.h"
29 #include "llvm/Support/CodeGen.h"
30 #include "llvm/Support/CommandLine.h"
31 #include "llvm/Support/Debug.h"
32 #include "llvm/Support/raw_ostream.h"
33 #include "llvm/Target/TargetRegisterInfo.h"
34 
35 using namespace llvm;
36 
37 #define DEBUG_TYPE "hexagon-copy-combine"
38 
39 static
40 cl::opt<bool> IsCombinesDisabled("disable-merge-into-combines",
41                                  cl::Hidden, cl::ZeroOrMore,
42                                  cl::init(false),
43                                  cl::desc("Disable merging into combines"));
44 static
45 cl::opt<bool> IsConst64Disabled("disable-const64",
46                                  cl::Hidden, cl::ZeroOrMore,
47                                  cl::init(false),
48                                  cl::desc("Disable generation of const64"));
49 static
50 cl::opt<unsigned>
51 MaxNumOfInstsBetweenNewValueStoreAndTFR("max-num-inst-between-tfr-and-nv-store",
52                    cl::Hidden, cl::init(4),
53                    cl::desc("Maximum distance between a tfr feeding a store we "
54                             "consider the store still to be newifiable"));
55 
56 namespace llvm {
57   FunctionPass *createHexagonCopyToCombine();
58   void initializeHexagonCopyToCombinePass(PassRegistry&);
59 }
60 
61 
62 namespace {
63 
64 class HexagonCopyToCombine : public MachineFunctionPass  {
65   const HexagonInstrInfo *TII;
66   const TargetRegisterInfo *TRI;
67   bool ShouldCombineAggressively;
68 
69   DenseSet<MachineInstr *> PotentiallyNewifiableTFR;
70   SmallVector<MachineInstr *, 8> DbgMItoMove;
71 
72 public:
73   static char ID;
74 
HexagonCopyToCombine()75   HexagonCopyToCombine() : MachineFunctionPass(ID) {
76     initializeHexagonCopyToCombinePass(*PassRegistry::getPassRegistry());
77   }
78 
getAnalysisUsage(AnalysisUsage & AU) const79   void getAnalysisUsage(AnalysisUsage &AU) const override {
80     MachineFunctionPass::getAnalysisUsage(AU);
81   }
82 
getPassName() const83   const char *getPassName() const override {
84     return "Hexagon Copy-To-Combine Pass";
85   }
86 
87   bool runOnMachineFunction(MachineFunction &Fn) override;
88 
getRequiredProperties() const89   MachineFunctionProperties getRequiredProperties() const override {
90     return MachineFunctionProperties().set(
91         MachineFunctionProperties::Property::AllVRegsAllocated);
92   }
93 
94 private:
95   MachineInstr *findPairable(MachineInstr &I1, bool &DoInsertAtI1,
96                              bool AllowC64);
97 
98   void findPotentialNewifiableTFRs(MachineBasicBlock &);
99 
100   void combine(MachineInstr &I1, MachineInstr &I2,
101                MachineBasicBlock::iterator &MI, bool DoInsertAtI1,
102                bool OptForSize);
103 
104   bool isSafeToMoveTogether(MachineInstr &I1, MachineInstr &I2,
105                             unsigned I1DestReg, unsigned I2DestReg,
106                             bool &DoInsertAtI1);
107 
108   void emitCombineRR(MachineBasicBlock::iterator &Before, unsigned DestReg,
109                      MachineOperand &HiOperand, MachineOperand &LoOperand);
110 
111   void emitCombineRI(MachineBasicBlock::iterator &Before, unsigned DestReg,
112                      MachineOperand &HiOperand, MachineOperand &LoOperand);
113 
114   void emitCombineIR(MachineBasicBlock::iterator &Before, unsigned DestReg,
115                      MachineOperand &HiOperand, MachineOperand &LoOperand);
116 
117   void emitCombineII(MachineBasicBlock::iterator &Before, unsigned DestReg,
118                      MachineOperand &HiOperand, MachineOperand &LoOperand);
119 
120   void emitConst64(MachineBasicBlock::iterator &Before, unsigned DestReg,
121                    MachineOperand &HiOperand, MachineOperand &LoOperand);
122 };
123 
124 } // End anonymous namespace.
125 
126 char HexagonCopyToCombine::ID = 0;
127 
128 INITIALIZE_PASS(HexagonCopyToCombine, "hexagon-copy-combine",
129                 "Hexagon Copy-To-Combine Pass", false, false)
130 
isCombinableInstType(MachineInstr & MI,const HexagonInstrInfo * TII,bool ShouldCombineAggressively)131 static bool isCombinableInstType(MachineInstr &MI, const HexagonInstrInfo *TII,
132                                  bool ShouldCombineAggressively) {
133   switch (MI.getOpcode()) {
134   case Hexagon::A2_tfr: {
135     // A COPY instruction can be combined if its arguments are IntRegs (32bit).
136     const MachineOperand &Op0 = MI.getOperand(0);
137     const MachineOperand &Op1 = MI.getOperand(1);
138     assert(Op0.isReg() && Op1.isReg());
139 
140     unsigned DestReg = Op0.getReg();
141     unsigned SrcReg = Op1.getReg();
142     return Hexagon::IntRegsRegClass.contains(DestReg) &&
143            Hexagon::IntRegsRegClass.contains(SrcReg);
144   }
145 
146   case Hexagon::A2_tfrsi: {
147     // A transfer-immediate can be combined if its argument is a signed 8bit
148     // value.
149     const MachineOperand &Op0 = MI.getOperand(0);
150     const MachineOperand &Op1 = MI.getOperand(1);
151     assert(Op0.isReg());
152 
153     unsigned DestReg = Op0.getReg();
154     // Ensure that TargetFlags are MO_NO_FLAG for a global. This is a
155     // workaround for an ABI bug that prevents GOT relocations on combine
156     // instructions
157     if (!Op1.isImm() && Op1.getTargetFlags() != HexagonII::MO_NO_FLAG)
158       return false;
159 
160     // Only combine constant extended A2_tfrsi if we are in aggressive mode.
161     bool NotExt = Op1.isImm() && isInt<8>(Op1.getImm());
162     return Hexagon::IntRegsRegClass.contains(DestReg) &&
163            (ShouldCombineAggressively || NotExt);
164   }
165 
166   default:
167     break;
168   }
169 
170   return false;
171 }
172 
isGreaterThanNBitTFRI(const MachineInstr & I)173 template <unsigned N> static bool isGreaterThanNBitTFRI(const MachineInstr &I) {
174   if (I.getOpcode() == Hexagon::TFRI64_V4 ||
175       I.getOpcode() == Hexagon::A2_tfrsi) {
176     const MachineOperand &Op = I.getOperand(1);
177     return !Op.isImm() || !isInt<N>(Op.getImm());
178   }
179   return false;
180 }
181 
182 /// areCombinableOperations - Returns true if the two instruction can be merge
183 /// into a combine (ignoring register constraints).
areCombinableOperations(const TargetRegisterInfo * TRI,MachineInstr & HighRegInst,MachineInstr & LowRegInst,bool AllowC64)184 static bool areCombinableOperations(const TargetRegisterInfo *TRI,
185                                     MachineInstr &HighRegInst,
186                                     MachineInstr &LowRegInst, bool AllowC64) {
187   unsigned HiOpc = HighRegInst.getOpcode();
188   unsigned LoOpc = LowRegInst.getOpcode();
189   (void)HiOpc; // Fix compiler warning
190   (void)LoOpc; // Fix compiler warning
191   assert((HiOpc == Hexagon::A2_tfr || HiOpc == Hexagon::A2_tfrsi) &&
192          (LoOpc == Hexagon::A2_tfr || LoOpc == Hexagon::A2_tfrsi) &&
193          "Assume individual instructions are of a combinable type");
194 
195   if (!AllowC64) {
196     // There is no combine of two constant extended values.
197     if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
198         isGreaterThanNBitTFRI<6>(LowRegInst))
199       return false;
200   }
201 
202   // There is a combine of two constant extended values into CONST64,
203   // provided both constants are true immediates.
204   if (isGreaterThanNBitTFRI<16>(HighRegInst) &&
205       isGreaterThanNBitTFRI<16>(LowRegInst))
206     return (HighRegInst.getOperand(1).isImm() &&
207             LowRegInst.getOperand(1).isImm());
208 
209   // There is no combine of two constant extended values, unless handled above
210   // Make both 8-bit size checks to allow both combine (#,##) and combine(##,#)
211   if (isGreaterThanNBitTFRI<8>(HighRegInst) &&
212       isGreaterThanNBitTFRI<8>(LowRegInst))
213     return false;
214 
215   return true;
216 }
217 
isEvenReg(unsigned Reg)218 static bool isEvenReg(unsigned Reg) {
219   assert(TargetRegisterInfo::isPhysicalRegister(Reg) &&
220          Hexagon::IntRegsRegClass.contains(Reg));
221   return (Reg - Hexagon::R0) % 2 == 0;
222 }
223 
removeKillInfo(MachineInstr & MI,unsigned RegNotKilled)224 static void removeKillInfo(MachineInstr &MI, unsigned RegNotKilled) {
225   for (unsigned I = 0, E = MI.getNumOperands(); I != E; ++I) {
226     MachineOperand &Op = MI.getOperand(I);
227     if (!Op.isReg() || Op.getReg() != RegNotKilled || !Op.isKill())
228       continue;
229     Op.setIsKill(false);
230   }
231 }
232 
233 /// Returns true if it is unsafe to move a copy instruction from \p UseReg to
234 /// \p DestReg over the instruction \p MI.
isUnsafeToMoveAcross(MachineInstr & MI,unsigned UseReg,unsigned DestReg,const TargetRegisterInfo * TRI)235 static bool isUnsafeToMoveAcross(MachineInstr &MI, unsigned UseReg,
236                                  unsigned DestReg,
237                                  const TargetRegisterInfo *TRI) {
238   return (UseReg && (MI.modifiesRegister(UseReg, TRI))) ||
239          MI.modifiesRegister(DestReg, TRI) || MI.readsRegister(DestReg, TRI) ||
240          MI.hasUnmodeledSideEffects() || MI.isInlineAsm() || MI.isDebugValue();
241 }
242 
UseReg(const MachineOperand & MO)243 static unsigned UseReg(const MachineOperand& MO) {
244   return MO.isReg() ? MO.getReg() : 0;
245 }
246 
247 /// isSafeToMoveTogether - Returns true if it is safe to move I1 next to I2 such
248 /// that the two instructions can be paired in a combine.
isSafeToMoveTogether(MachineInstr & I1,MachineInstr & I2,unsigned I1DestReg,unsigned I2DestReg,bool & DoInsertAtI1)249 bool HexagonCopyToCombine::isSafeToMoveTogether(MachineInstr &I1,
250                                                 MachineInstr &I2,
251                                                 unsigned I1DestReg,
252                                                 unsigned I2DestReg,
253                                                 bool &DoInsertAtI1) {
254   unsigned I2UseReg = UseReg(I2.getOperand(1));
255 
256   // It is not safe to move I1 and I2 into one combine if I2 has a true
257   // dependence on I1.
258   if (I2UseReg && I1.modifiesRegister(I2UseReg, TRI))
259     return false;
260 
261   bool isSafe = true;
262 
263   // First try to move I2 towards I1.
264   {
265     // A reverse_iterator instantiated like below starts before I2, and I1
266     // respectively.
267     // Look at instructions I in between I2 and (excluding) I1.
268     MachineBasicBlock::reverse_iterator I(I2),
269       End = --(MachineBasicBlock::reverse_iterator(I1));
270     // At 03 we got better results (dhrystone!) by being more conservative.
271     if (!ShouldCombineAggressively)
272       End = MachineBasicBlock::reverse_iterator(I1);
273     // If I2 kills its operand and we move I2 over an instruction that also
274     // uses I2's use reg we need to modify that (first) instruction to now kill
275     // this reg.
276     unsigned KilledOperand = 0;
277     if (I2.killsRegister(I2UseReg))
278       KilledOperand = I2UseReg;
279     MachineInstr *KillingInstr = nullptr;
280 
281     for (; I != End; ++I) {
282       // If the intervening instruction I:
283       //   * modifies I2's use reg
284       //   * modifies I2's def reg
285       //   * reads I2's def reg
286       //   * or has unmodelled side effects
287       // we can't move I2 across it.
288       if (I->isDebugValue())
289         continue;
290 
291       if (isUnsafeToMoveAcross(*I, I2UseReg, I2DestReg, TRI)) {
292         isSafe = false;
293         break;
294       }
295 
296       // Update first use of the killed operand.
297       if (!KillingInstr && KilledOperand &&
298           I->readsRegister(KilledOperand, TRI))
299         KillingInstr = &*I;
300     }
301     if (isSafe) {
302       // Update the intermediate instruction to with the kill flag.
303       if (KillingInstr) {
304         bool Added = KillingInstr->addRegisterKilled(KilledOperand, TRI, true);
305         (void)Added; // suppress compiler warning
306         assert(Added && "Must successfully update kill flag");
307         removeKillInfo(I2, KilledOperand);
308       }
309       DoInsertAtI1 = true;
310       return true;
311     }
312   }
313 
314   // Try to move I1 towards I2.
315   {
316     // Look at instructions I in between I1 and (excluding) I2.
317     MachineBasicBlock::iterator I(I1), End(I2);
318     // At O3 we got better results (dhrystone) by being more conservative here.
319     if (!ShouldCombineAggressively)
320       End = std::next(MachineBasicBlock::iterator(I2));
321     unsigned I1UseReg = UseReg(I1.getOperand(1));
322     // Track killed operands. If we move across an instruction that kills our
323     // operand, we need to update the kill information on the moved I1. It kills
324     // the operand now.
325     MachineInstr *KillingInstr = nullptr;
326     unsigned KilledOperand = 0;
327 
328     while(++I != End) {
329       MachineInstr &MI = *I;
330       // If the intervening instruction MI:
331       //   * modifies I1's use reg
332       //   * modifies I1's def reg
333       //   * reads I1's def reg
334       //   * or has unmodelled side effects
335       //   We introduce this special case because llvm has no api to remove a
336       //   kill flag for a register (a removeRegisterKilled() analogous to
337       //   addRegisterKilled) that handles aliased register correctly.
338       //   * or has a killed aliased register use of I1's use reg
339       //           %D4<def> = A2_tfrpi 16
340       //           %R6<def> = A2_tfr %R9
341       //           %R8<def> = KILL %R8, %D4<imp-use,kill>
342       //      If we want to move R6 = across the KILL instruction we would have
343       //      to remove the %D4<imp-use,kill> operand. For now, we are
344       //      conservative and disallow the move.
345       // we can't move I1 across it.
346       if (MI.isDebugValue()) {
347         if (MI.readsRegister(I1DestReg, TRI)) // Move this instruction after I2.
348           DbgMItoMove.push_back(&MI);
349         continue;
350       }
351 
352       if (isUnsafeToMoveAcross(MI, I1UseReg, I1DestReg, TRI) ||
353           // Check for an aliased register kill. Bail out if we see one.
354           (!MI.killsRegister(I1UseReg) && MI.killsRegister(I1UseReg, TRI)))
355         return false;
356 
357       // Check for an exact kill (registers match).
358       if (I1UseReg && MI.killsRegister(I1UseReg)) {
359         assert(!KillingInstr && "Should only see one killing instruction");
360         KilledOperand = I1UseReg;
361         KillingInstr = &MI;
362       }
363     }
364     if (KillingInstr) {
365       removeKillInfo(*KillingInstr, KilledOperand);
366       // Update I1 to set the kill flag. This flag will later be picked up by
367       // the new COMBINE instruction.
368       bool Added = I1.addRegisterKilled(KilledOperand, TRI);
369       (void)Added; // suppress compiler warning
370       assert(Added && "Must successfully update kill flag");
371     }
372     DoInsertAtI1 = false;
373   }
374 
375   return true;
376 }
377 
378 /// findPotentialNewifiableTFRs - Finds tranfers that feed stores that could be
379 /// newified. (A use of a 64 bit register define can not be newified)
380 void
findPotentialNewifiableTFRs(MachineBasicBlock & BB)381 HexagonCopyToCombine::findPotentialNewifiableTFRs(MachineBasicBlock &BB) {
382   DenseMap<unsigned, MachineInstr *> LastDef;
383   for (MachineInstr &MI : BB) {
384     if (MI.isDebugValue())
385       continue;
386 
387     // Mark TFRs that feed a potential new value store as such.
388     if (TII->mayBeNewStore(&MI)) {
389       // Look for uses of TFR instructions.
390       for (unsigned OpdIdx = 0, OpdE = MI.getNumOperands(); OpdIdx != OpdE;
391            ++OpdIdx) {
392         MachineOperand &Op = MI.getOperand(OpdIdx);
393 
394         // Skip over anything except register uses.
395         if (!Op.isReg() || !Op.isUse() || !Op.getReg())
396           continue;
397 
398         // Look for the defining instruction.
399         unsigned Reg = Op.getReg();
400         MachineInstr *DefInst = LastDef[Reg];
401         if (!DefInst)
402           continue;
403         if (!isCombinableInstType(*DefInst, TII, ShouldCombineAggressively))
404           continue;
405 
406         // Only close newifiable stores should influence the decision.
407         // Ignore the debug instructions in between.
408         MachineBasicBlock::iterator It(DefInst);
409         unsigned NumInstsToDef = 0;
410         while (&*It != &MI) {
411           if (!It->isDebugValue())
412             ++NumInstsToDef;
413           ++It;
414         }
415 
416         if (NumInstsToDef > MaxNumOfInstsBetweenNewValueStoreAndTFR)
417           continue;
418 
419         PotentiallyNewifiableTFR.insert(DefInst);
420       }
421       // Skip to next instruction.
422       continue;
423     }
424 
425     // Put instructions that last defined integer or double registers into the
426     // map.
427     for (unsigned I = 0, E = MI.getNumOperands(); I != E; ++I) {
428       MachineOperand &Op = MI.getOperand(I);
429       if (!Op.isReg() || !Op.isDef() || !Op.getReg())
430         continue;
431       unsigned Reg = Op.getReg();
432       if (Hexagon::DoubleRegsRegClass.contains(Reg)) {
433         for (MCSubRegIterator SubRegs(Reg, TRI); SubRegs.isValid(); ++SubRegs) {
434           LastDef[*SubRegs] = &MI;
435         }
436       } else if (Hexagon::IntRegsRegClass.contains(Reg))
437         LastDef[Reg] = &MI;
438     }
439   }
440 }
441 
runOnMachineFunction(MachineFunction & MF)442 bool HexagonCopyToCombine::runOnMachineFunction(MachineFunction &MF) {
443 
444   if (IsCombinesDisabled) return false;
445 
446   bool HasChanged = false;
447 
448   // Get target info.
449   TRI = MF.getSubtarget().getRegisterInfo();
450   TII = MF.getSubtarget<HexagonSubtarget>().getInstrInfo();
451 
452   const Function *F = MF.getFunction();
453   bool OptForSize = F->hasFnAttribute(Attribute::OptimizeForSize);
454 
455   // Combine aggressively (for code size)
456   ShouldCombineAggressively =
457     MF.getTarget().getOptLevel() <= CodeGenOpt::Default;
458 
459   // Traverse basic blocks.
460   for (MachineFunction::iterator BI = MF.begin(), BE = MF.end(); BI != BE;
461        ++BI) {
462     PotentiallyNewifiableTFR.clear();
463     findPotentialNewifiableTFRs(*BI);
464 
465     // Traverse instructions in basic block.
466     for(MachineBasicBlock::iterator MI = BI->begin(), End = BI->end();
467         MI != End;) {
468       MachineInstr &I1 = *MI++;
469 
470       if (I1.isDebugValue())
471         continue;
472 
473       // Don't combine a TFR whose user could be newified (instructions that
474       // define double registers can not be newified - Programmer's Ref Manual
475       // 5.4.2 New-value stores).
476       if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&I1))
477         continue;
478 
479       // Ignore instructions that are not combinable.
480       if (!isCombinableInstType(I1, TII, ShouldCombineAggressively))
481         continue;
482 
483       // Find a second instruction that can be merged into a combine
484       // instruction. In addition, also find all the debug instructions that
485       // need to be moved along with it.
486       bool DoInsertAtI1 = false;
487       DbgMItoMove.clear();
488       MachineInstr *I2 = findPairable(I1, DoInsertAtI1, OptForSize);
489       if (I2) {
490         HasChanged = true;
491         combine(I1, *I2, MI, DoInsertAtI1, OptForSize);
492       }
493     }
494   }
495 
496   return HasChanged;
497 }
498 
499 /// findPairable - Returns an instruction that can be merged with \p I1 into a
500 /// COMBINE instruction or 0 if no such instruction can be found. Returns true
501 /// in \p DoInsertAtI1 if the combine must be inserted at instruction \p I1
502 /// false if the combine must be inserted at the returned instruction.
findPairable(MachineInstr & I1,bool & DoInsertAtI1,bool AllowC64)503 MachineInstr *HexagonCopyToCombine::findPairable(MachineInstr &I1,
504                                                  bool &DoInsertAtI1,
505                                                  bool AllowC64) {
506   MachineBasicBlock::iterator I2 = std::next(MachineBasicBlock::iterator(I1));
507 
508   while (I2->isDebugValue())
509     ++I2;
510 
511   unsigned I1DestReg = I1.getOperand(0).getReg();
512 
513   for (MachineBasicBlock::iterator End = I1.getParent()->end(); I2 != End;
514        ++I2) {
515     // Bail out early if we see a second definition of I1DestReg.
516     if (I2->modifiesRegister(I1DestReg, TRI))
517       break;
518 
519     // Ignore non-combinable instructions.
520     if (!isCombinableInstType(*I2, TII, ShouldCombineAggressively))
521       continue;
522 
523     // Don't combine a TFR whose user could be newified.
524     if (ShouldCombineAggressively && PotentiallyNewifiableTFR.count(&*I2))
525       continue;
526 
527     unsigned I2DestReg = I2->getOperand(0).getReg();
528 
529     // Check that registers are adjacent and that the first destination register
530     // is even.
531     bool IsI1LowReg = (I2DestReg - I1DestReg) == 1;
532     bool IsI2LowReg = (I1DestReg - I2DestReg) == 1;
533     unsigned FirstRegIndex = IsI1LowReg ? I1DestReg : I2DestReg;
534     if ((!IsI1LowReg && !IsI2LowReg) || !isEvenReg(FirstRegIndex))
535       continue;
536 
537     // Check that the two instructions are combinable. V4 allows more
538     // instructions to be merged into a combine.
539     // The order matters because in a A2_tfrsi we might can encode a int8 as
540     // the hi reg operand but only a uint6 as the low reg operand.
541     if ((IsI2LowReg && !areCombinableOperations(TRI, I1, *I2, AllowC64)) ||
542         (IsI1LowReg && !areCombinableOperations(TRI, *I2, I1, AllowC64)))
543       break;
544 
545     if (isSafeToMoveTogether(I1, *I2, I1DestReg, I2DestReg, DoInsertAtI1))
546       return &*I2;
547 
548     // Not safe. Stop searching.
549     break;
550   }
551   return nullptr;
552 }
553 
combine(MachineInstr & I1,MachineInstr & I2,MachineBasicBlock::iterator & MI,bool DoInsertAtI1,bool OptForSize)554 void HexagonCopyToCombine::combine(MachineInstr &I1, MachineInstr &I2,
555                                    MachineBasicBlock::iterator &MI,
556                                    bool DoInsertAtI1, bool OptForSize) {
557   // We are going to delete I2. If MI points to I2 advance it to the next
558   // instruction.
559   if (MI == I2.getIterator())
560     ++MI;
561 
562   // Figure out whether I1 or I2 goes into the lowreg part.
563   unsigned I1DestReg = I1.getOperand(0).getReg();
564   unsigned I2DestReg = I2.getOperand(0).getReg();
565   bool IsI1Loreg = (I2DestReg - I1DestReg) == 1;
566   unsigned LoRegDef = IsI1Loreg ? I1DestReg : I2DestReg;
567 
568   // Get the double word register.
569   unsigned DoubleRegDest =
570     TRI->getMatchingSuperReg(LoRegDef, Hexagon::subreg_loreg,
571                              &Hexagon::DoubleRegsRegClass);
572   assert(DoubleRegDest != 0 && "Expect a valid register");
573 
574 
575   // Setup source operands.
576   MachineOperand &LoOperand = IsI1Loreg ? I1.getOperand(1) : I2.getOperand(1);
577   MachineOperand &HiOperand = IsI1Loreg ? I2.getOperand(1) : I1.getOperand(1);
578 
579   // Figure out which source is a register and which a constant.
580   bool IsHiReg = HiOperand.isReg();
581   bool IsLoReg = LoOperand.isReg();
582 
583   // There is a combine of two constant extended values into CONST64.
584   bool IsC64 = OptForSize && LoOperand.isImm() && HiOperand.isImm() &&
585                isGreaterThanNBitTFRI<16>(I1) && isGreaterThanNBitTFRI<16>(I2);
586 
587   MachineBasicBlock::iterator InsertPt(DoInsertAtI1 ? I1 : I2);
588   // Emit combine.
589   if (IsHiReg && IsLoReg)
590     emitCombineRR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
591   else if (IsHiReg)
592     emitCombineRI(InsertPt, DoubleRegDest, HiOperand, LoOperand);
593   else if (IsLoReg)
594     emitCombineIR(InsertPt, DoubleRegDest, HiOperand, LoOperand);
595   else if (IsC64 && !IsConst64Disabled)
596     emitConst64(InsertPt, DoubleRegDest, HiOperand, LoOperand);
597   else
598     emitCombineII(InsertPt, DoubleRegDest, HiOperand, LoOperand);
599 
600   // Move debug instructions along with I1 if it's being
601   // moved towards I2.
602   if (!DoInsertAtI1 && DbgMItoMove.size() != 0) {
603     // Insert debug instructions at the new location before I2.
604     MachineBasicBlock *BB = InsertPt->getParent();
605     for (auto NewMI : DbgMItoMove) {
606       // If iterator MI is pointing to DEBUG_VAL, make sure
607       // MI now points to next relevant instruction.
608       if (NewMI == (MachineInstr*)MI)
609         ++MI;
610       BB->splice(InsertPt, BB, NewMI);
611     }
612   }
613 
614   I1.eraseFromParent();
615   I2.eraseFromParent();
616 }
617 
emitConst64(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)618 void HexagonCopyToCombine::emitConst64(MachineBasicBlock::iterator &InsertPt,
619                                        unsigned DoubleDestReg,
620                                        MachineOperand &HiOperand,
621                                        MachineOperand &LoOperand) {
622   DEBUG(dbgs() << "Found a CONST64\n");
623 
624   DebugLoc DL = InsertPt->getDebugLoc();
625   MachineBasicBlock *BB = InsertPt->getParent();
626   assert(LoOperand.isImm() && HiOperand.isImm() &&
627          "Both operands must be immediate");
628 
629   int64_t V = HiOperand.getImm();
630   V = (V << 32) | (0x0ffffffffLL & LoOperand.getImm());
631   BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::CONST64_Int_Real),
632     DoubleDestReg)
633     .addImm(V);
634 }
635 
emitCombineII(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)636 void HexagonCopyToCombine::emitCombineII(MachineBasicBlock::iterator &InsertPt,
637                                          unsigned DoubleDestReg,
638                                          MachineOperand &HiOperand,
639                                          MachineOperand &LoOperand) {
640   DebugLoc DL = InsertPt->getDebugLoc();
641   MachineBasicBlock *BB = InsertPt->getParent();
642 
643   // Handle globals.
644   if (HiOperand.isGlobal()) {
645     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
646       .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
647                         HiOperand.getTargetFlags())
648       .addImm(LoOperand.getImm());
649     return;
650   }
651   if (LoOperand.isGlobal()) {
652     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
653       .addImm(HiOperand.getImm())
654       .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
655                         LoOperand.getTargetFlags());
656     return;
657   }
658 
659   // Handle block addresses.
660   if (HiOperand.isBlockAddress()) {
661     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
662       .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
663                        HiOperand.getTargetFlags())
664       .addImm(LoOperand.getImm());
665     return;
666   }
667   if (LoOperand.isBlockAddress()) {
668     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
669       .addImm(HiOperand.getImm())
670       .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
671                        LoOperand.getTargetFlags());
672     return;
673   }
674 
675   // Handle jump tables.
676   if (HiOperand.isJTI()) {
677     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
678       .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
679       .addImm(LoOperand.getImm());
680     return;
681   }
682   if (LoOperand.isJTI()) {
683     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
684       .addImm(HiOperand.getImm())
685       .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
686     return;
687   }
688 
689   // Handle constant pools.
690   if (HiOperand.isCPI()) {
691     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
692       .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
693                             HiOperand.getTargetFlags())
694       .addImm(LoOperand.getImm());
695     return;
696   }
697   if (LoOperand.isCPI()) {
698     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
699       .addImm(HiOperand.getImm())
700       .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
701                             LoOperand.getTargetFlags());
702     return;
703   }
704 
705   // First preference should be given to Hexagon::A2_combineii instruction
706   // as it can include U6 (in Hexagon::A4_combineii) as well.
707   // In this instruction, HiOperand is const extended, if required.
708   if (isInt<8>(LoOperand.getImm())) {
709     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
710       .addImm(HiOperand.getImm())
711       .addImm(LoOperand.getImm());
712       return;
713   }
714 
715   // In this instruction, LoOperand is const extended, if required.
716   if (isInt<8>(HiOperand.getImm())) {
717     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineii), DoubleDestReg)
718       .addImm(HiOperand.getImm())
719       .addImm(LoOperand.getImm());
720     return;
721   }
722 
723   // Insert new combine instruction.
724   //  DoubleRegDest = combine #HiImm, #LoImm
725   BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combineii), DoubleDestReg)
726     .addImm(HiOperand.getImm())
727     .addImm(LoOperand.getImm());
728 }
729 
emitCombineIR(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)730 void HexagonCopyToCombine::emitCombineIR(MachineBasicBlock::iterator &InsertPt,
731                                          unsigned DoubleDestReg,
732                                          MachineOperand &HiOperand,
733                                          MachineOperand &LoOperand) {
734   unsigned LoReg = LoOperand.getReg();
735   unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
736 
737   DebugLoc DL = InsertPt->getDebugLoc();
738   MachineBasicBlock *BB = InsertPt->getParent();
739 
740   // Handle globals.
741   if (HiOperand.isGlobal()) {
742     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
743       .addGlobalAddress(HiOperand.getGlobal(), HiOperand.getOffset(),
744                         HiOperand.getTargetFlags())
745       .addReg(LoReg, LoRegKillFlag);
746     return;
747   }
748   // Handle block addresses.
749   if (HiOperand.isBlockAddress()) {
750     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
751       .addBlockAddress(HiOperand.getBlockAddress(), HiOperand.getOffset(),
752                        HiOperand.getTargetFlags())
753       .addReg(LoReg, LoRegKillFlag);
754     return;
755   }
756   // Handle jump tables.
757   if (HiOperand.isJTI()) {
758     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
759       .addJumpTableIndex(HiOperand.getIndex(), HiOperand.getTargetFlags())
760       .addReg(LoReg, LoRegKillFlag);
761     return;
762   }
763   // Handle constant pools.
764   if (HiOperand.isCPI()) {
765     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
766       .addConstantPoolIndex(HiOperand.getIndex(), HiOperand.getOffset(),
767                             HiOperand.getTargetFlags())
768       .addReg(LoReg, LoRegKillFlag);
769     return;
770   }
771   // Insert new combine instruction.
772   //  DoubleRegDest = combine #HiImm, LoReg
773   BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineir), DoubleDestReg)
774     .addImm(HiOperand.getImm())
775     .addReg(LoReg, LoRegKillFlag);
776 }
777 
emitCombineRI(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)778 void HexagonCopyToCombine::emitCombineRI(MachineBasicBlock::iterator &InsertPt,
779                                          unsigned DoubleDestReg,
780                                          MachineOperand &HiOperand,
781                                          MachineOperand &LoOperand) {
782   unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
783   unsigned HiReg = HiOperand.getReg();
784 
785   DebugLoc DL = InsertPt->getDebugLoc();
786   MachineBasicBlock *BB = InsertPt->getParent();
787 
788   // Handle global.
789   if (LoOperand.isGlobal()) {
790     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
791       .addReg(HiReg, HiRegKillFlag)
792       .addGlobalAddress(LoOperand.getGlobal(), LoOperand.getOffset(),
793                         LoOperand.getTargetFlags());
794     return;
795   }
796   // Handle block addresses.
797   if (LoOperand.isBlockAddress()) {
798     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
799       .addReg(HiReg, HiRegKillFlag)
800       .addBlockAddress(LoOperand.getBlockAddress(), LoOperand.getOffset(),
801                        LoOperand.getTargetFlags());
802     return;
803   }
804   // Handle jump tables.
805   if (LoOperand.isJTI()) {
806     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
807       .addReg(HiOperand.getReg(), HiRegKillFlag)
808       .addJumpTableIndex(LoOperand.getIndex(), LoOperand.getTargetFlags());
809     return;
810   }
811   // Handle constant pools.
812   if (LoOperand.isCPI()) {
813     BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
814       .addReg(HiOperand.getReg(), HiRegKillFlag)
815       .addConstantPoolIndex(LoOperand.getIndex(), LoOperand.getOffset(),
816                             LoOperand.getTargetFlags());
817     return;
818   }
819 
820   // Insert new combine instruction.
821   //  DoubleRegDest = combine HiReg, #LoImm
822   BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A4_combineri), DoubleDestReg)
823     .addReg(HiReg, HiRegKillFlag)
824     .addImm(LoOperand.getImm());
825 }
826 
emitCombineRR(MachineBasicBlock::iterator & InsertPt,unsigned DoubleDestReg,MachineOperand & HiOperand,MachineOperand & LoOperand)827 void HexagonCopyToCombine::emitCombineRR(MachineBasicBlock::iterator &InsertPt,
828                                          unsigned DoubleDestReg,
829                                          MachineOperand &HiOperand,
830                                          MachineOperand &LoOperand) {
831   unsigned LoRegKillFlag = getKillRegState(LoOperand.isKill());
832   unsigned HiRegKillFlag = getKillRegState(HiOperand.isKill());
833   unsigned LoReg = LoOperand.getReg();
834   unsigned HiReg = HiOperand.getReg();
835 
836   DebugLoc DL = InsertPt->getDebugLoc();
837   MachineBasicBlock *BB = InsertPt->getParent();
838 
839   // Insert new combine instruction.
840   //  DoubleRegDest = combine HiReg, LoReg
841   BuildMI(*BB, InsertPt, DL, TII->get(Hexagon::A2_combinew), DoubleDestReg)
842     .addReg(HiReg, HiRegKillFlag)
843     .addReg(LoReg, LoRegKillFlag);
844 }
845 
createHexagonCopyToCombine()846 FunctionPass *llvm::createHexagonCopyToCombine() {
847   return new HexagonCopyToCombine();
848 }
849