1 //===-- Thumb2ITBlockPass.cpp - Insert Thumb-2 IT blocks ------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9
10 #include "ARM.h"
11 #include "ARMMachineFunctionInfo.h"
12 #include "Thumb2InstrInfo.h"
13 #include "llvm/ADT/SmallSet.h"
14 #include "llvm/ADT/Statistic.h"
15 #include "llvm/CodeGen/MachineFunctionPass.h"
16 #include "llvm/CodeGen/MachineInstr.h"
17 #include "llvm/CodeGen/MachineInstrBuilder.h"
18 #include "llvm/CodeGen/MachineInstrBundle.h"
19 using namespace llvm;
20
21 #define DEBUG_TYPE "thumb2-it"
22
23 STATISTIC(NumITs, "Number of IT blocks inserted");
24 STATISTIC(NumMovedInsts, "Number of predicated instructions moved");
25
26 namespace {
27 class Thumb2ITBlockPass : public MachineFunctionPass {
28 public:
29 static char ID;
Thumb2ITBlockPass()30 Thumb2ITBlockPass() : MachineFunctionPass(ID) {}
31
32 bool restrictIT;
33 const Thumb2InstrInfo *TII;
34 const TargetRegisterInfo *TRI;
35 ARMFunctionInfo *AFI;
36
37 bool runOnMachineFunction(MachineFunction &Fn) override;
38
getRequiredProperties() const39 MachineFunctionProperties getRequiredProperties() const override {
40 return MachineFunctionProperties().set(
41 MachineFunctionProperties::Property::AllVRegsAllocated);
42 }
43
getPassName() const44 const char *getPassName() const override {
45 return "Thumb IT blocks insertion pass";
46 }
47
48 private:
49 bool MoveCopyOutOfITBlock(MachineInstr *MI,
50 ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
51 SmallSet<unsigned, 4> &Defs,
52 SmallSet<unsigned, 4> &Uses);
53 bool InsertITInstructions(MachineBasicBlock &MBB);
54 };
55 char Thumb2ITBlockPass::ID = 0;
56 }
57
58 /// TrackDefUses - Tracking what registers are being defined and used by
59 /// instructions in the IT block. This also tracks "dependencies", i.e. uses
60 /// in the IT block that are defined before the IT instruction.
TrackDefUses(MachineInstr * MI,SmallSet<unsigned,4> & Defs,SmallSet<unsigned,4> & Uses,const TargetRegisterInfo * TRI)61 static void TrackDefUses(MachineInstr *MI,
62 SmallSet<unsigned, 4> &Defs,
63 SmallSet<unsigned, 4> &Uses,
64 const TargetRegisterInfo *TRI) {
65 SmallVector<unsigned, 4> LocalDefs;
66 SmallVector<unsigned, 4> LocalUses;
67
68 for (unsigned i = 0, e = MI->getNumOperands(); i != e; ++i) {
69 MachineOperand &MO = MI->getOperand(i);
70 if (!MO.isReg())
71 continue;
72 unsigned Reg = MO.getReg();
73 if (!Reg || Reg == ARM::ITSTATE || Reg == ARM::SP)
74 continue;
75 if (MO.isUse())
76 LocalUses.push_back(Reg);
77 else
78 LocalDefs.push_back(Reg);
79 }
80
81 for (unsigned i = 0, e = LocalUses.size(); i != e; ++i) {
82 unsigned Reg = LocalUses[i];
83 for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
84 Subreg.isValid(); ++Subreg)
85 Uses.insert(*Subreg);
86 }
87
88 for (unsigned i = 0, e = LocalDefs.size(); i != e; ++i) {
89 unsigned Reg = LocalDefs[i];
90 for (MCSubRegIterator Subreg(Reg, TRI, /*IncludeSelf=*/true);
91 Subreg.isValid(); ++Subreg)
92 Defs.insert(*Subreg);
93 if (Reg == ARM::CPSR)
94 continue;
95 }
96 }
97
98 /// Clear kill flags for any uses in the given set. This will likely
99 /// conservatively remove more kill flags than are necessary, but removing them
100 /// is safer than incorrect kill flags remaining on instructions.
ClearKillFlags(MachineInstr * MI,SmallSet<unsigned,4> & Uses)101 static void ClearKillFlags(MachineInstr *MI, SmallSet<unsigned, 4> &Uses) {
102 for (MachineOperand &MO : MI->operands()) {
103 if (!MO.isReg() || MO.isDef() || !MO.isKill())
104 continue;
105 if (!Uses.count(MO.getReg()))
106 continue;
107 MO.setIsKill(false);
108 }
109 }
110
isCopy(MachineInstr * MI)111 static bool isCopy(MachineInstr *MI) {
112 switch (MI->getOpcode()) {
113 default:
114 return false;
115 case ARM::MOVr:
116 case ARM::MOVr_TC:
117 case ARM::tMOVr:
118 case ARM::t2MOVr:
119 return true;
120 }
121 }
122
123 bool
MoveCopyOutOfITBlock(MachineInstr * MI,ARMCC::CondCodes CC,ARMCC::CondCodes OCC,SmallSet<unsigned,4> & Defs,SmallSet<unsigned,4> & Uses)124 Thumb2ITBlockPass::MoveCopyOutOfITBlock(MachineInstr *MI,
125 ARMCC::CondCodes CC, ARMCC::CondCodes OCC,
126 SmallSet<unsigned, 4> &Defs,
127 SmallSet<unsigned, 4> &Uses) {
128 if (!isCopy(MI))
129 return false;
130 // llvm models select's as two-address instructions. That means a copy
131 // is inserted before a t2MOVccr, etc. If the copy is scheduled in
132 // between selects we would end up creating multiple IT blocks.
133 assert(MI->getOperand(0).getSubReg() == 0 &&
134 MI->getOperand(1).getSubReg() == 0 &&
135 "Sub-register indices still around?");
136
137 unsigned DstReg = MI->getOperand(0).getReg();
138 unsigned SrcReg = MI->getOperand(1).getReg();
139
140 // First check if it's safe to move it.
141 if (Uses.count(DstReg) || Defs.count(SrcReg))
142 return false;
143
144 // If the CPSR is defined by this copy, then we don't want to move it. E.g.,
145 // if we have:
146 //
147 // movs r1, r1
148 // rsb r1, 0
149 // movs r2, r2
150 // rsb r2, 0
151 //
152 // we don't want this to be converted to:
153 //
154 // movs r1, r1
155 // movs r2, r2
156 // itt mi
157 // rsb r1, 0
158 // rsb r2, 0
159 //
160 const MCInstrDesc &MCID = MI->getDesc();
161 if (MI->hasOptionalDef() &&
162 MI->getOperand(MCID.getNumOperands() - 1).getReg() == ARM::CPSR)
163 return false;
164
165 // Then peek at the next instruction to see if it's predicated on CC or OCC.
166 // If not, then there is nothing to be gained by moving the copy.
167 MachineBasicBlock::iterator I = MI; ++I;
168 MachineBasicBlock::iterator E = MI->getParent()->end();
169 while (I != E && I->isDebugValue())
170 ++I;
171 if (I != E) {
172 unsigned NPredReg = 0;
173 ARMCC::CondCodes NCC = getITInstrPredicate(*I, NPredReg);
174 if (NCC == CC || NCC == OCC)
175 return true;
176 }
177 return false;
178 }
179
InsertITInstructions(MachineBasicBlock & MBB)180 bool Thumb2ITBlockPass::InsertITInstructions(MachineBasicBlock &MBB) {
181 bool Modified = false;
182
183 SmallSet<unsigned, 4> Defs;
184 SmallSet<unsigned, 4> Uses;
185 MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end();
186 while (MBBI != E) {
187 MachineInstr *MI = &*MBBI;
188 DebugLoc dl = MI->getDebugLoc();
189 unsigned PredReg = 0;
190 ARMCC::CondCodes CC = getITInstrPredicate(*MI, PredReg);
191 if (CC == ARMCC::AL) {
192 ++MBBI;
193 continue;
194 }
195
196 Defs.clear();
197 Uses.clear();
198 TrackDefUses(MI, Defs, Uses, TRI);
199
200 // Insert an IT instruction.
201 MachineInstrBuilder MIB = BuildMI(MBB, MBBI, dl, TII->get(ARM::t2IT))
202 .addImm(CC);
203
204 // Add implicit use of ITSTATE to IT block instructions.
205 MI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
206 true/*isImp*/, false/*isKill*/));
207
208 MachineInstr *LastITMI = MI;
209 MachineBasicBlock::iterator InsertPos = MIB.getInstr();
210 ++MBBI;
211
212 // Form IT block.
213 ARMCC::CondCodes OCC = ARMCC::getOppositeCondition(CC);
214 unsigned Mask = 0, Pos = 3;
215
216 // v8 IT blocks are limited to one conditional op unless -arm-no-restrict-it
217 // is set: skip the loop
218 if (!restrictIT) {
219 // Branches, including tricky ones like LDM_RET, need to end an IT
220 // block so check the instruction we just put in the block.
221 for (; MBBI != E && Pos &&
222 (!MI->isBranch() && !MI->isReturn()) ; ++MBBI) {
223 if (MBBI->isDebugValue())
224 continue;
225
226 MachineInstr *NMI = &*MBBI;
227 MI = NMI;
228
229 unsigned NPredReg = 0;
230 ARMCC::CondCodes NCC = getITInstrPredicate(*NMI, NPredReg);
231 if (NCC == CC || NCC == OCC) {
232 Mask |= (NCC & 1) << Pos;
233 // Add implicit use of ITSTATE.
234 NMI->addOperand(MachineOperand::CreateReg(ARM::ITSTATE, false/*ifDef*/,
235 true/*isImp*/, false/*isKill*/));
236 LastITMI = NMI;
237 } else {
238 if (NCC == ARMCC::AL &&
239 MoveCopyOutOfITBlock(NMI, CC, OCC, Defs, Uses)) {
240 --MBBI;
241 MBB.remove(NMI);
242 MBB.insert(InsertPos, NMI);
243 ClearKillFlags(MI, Uses);
244 ++NumMovedInsts;
245 continue;
246 }
247 break;
248 }
249 TrackDefUses(NMI, Defs, Uses, TRI);
250 --Pos;
251 }
252 }
253
254 // Finalize IT mask.
255 Mask |= (1 << Pos);
256 // Tag along (firstcond[0] << 4) with the mask.
257 Mask |= (CC & 1) << 4;
258 MIB.addImm(Mask);
259
260 // Last instruction in IT block kills ITSTATE.
261 LastITMI->findRegisterUseOperand(ARM::ITSTATE)->setIsKill();
262
263 // Finalize the bundle.
264 finalizeBundle(MBB, InsertPos.getInstrIterator(),
265 ++LastITMI->getIterator());
266
267 Modified = true;
268 ++NumITs;
269 }
270
271 return Modified;
272 }
273
runOnMachineFunction(MachineFunction & Fn)274 bool Thumb2ITBlockPass::runOnMachineFunction(MachineFunction &Fn) {
275 const ARMSubtarget &STI =
276 static_cast<const ARMSubtarget &>(Fn.getSubtarget());
277 if (!STI.isThumb2())
278 return false;
279 AFI = Fn.getInfo<ARMFunctionInfo>();
280 TII = static_cast<const Thumb2InstrInfo *>(STI.getInstrInfo());
281 TRI = STI.getRegisterInfo();
282 restrictIT = STI.restrictIT();
283
284 if (!AFI->isThumbFunction())
285 return false;
286
287 bool Modified = false;
288 for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E; ) {
289 MachineBasicBlock &MBB = *MFI;
290 ++MFI;
291 Modified |= InsertITInstructions(MBB);
292 }
293
294 if (Modified)
295 AFI->setHasITBlocks(true);
296
297 return Modified;
298 }
299
300 /// createThumb2ITBlockPass - Returns an instance of the Thumb2 IT blocks
301 /// insertion pass.
createThumb2ITBlockPass()302 FunctionPass *llvm::createThumb2ITBlockPass() {
303 return new Thumb2ITBlockPass();
304 }
305