1 // Copyright 2015 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "src/compiler/instruction-scheduler.h"
6
7 #include "src/base/adapters.h"
8
9 namespace v8 {
10 namespace internal {
11 namespace compiler {
12
ScheduleGraphNode(Zone * zone,Instruction * instr)13 InstructionScheduler::ScheduleGraphNode::ScheduleGraphNode(
14 Zone* zone,
15 Instruction* instr)
16 : instr_(instr),
17 successors_(zone),
18 unscheduled_predecessors_count_(0),
19 latency_(GetInstructionLatency(instr)),
20 total_latency_(-1),
21 start_cycle_(-1) {
22 }
23
24
AddSuccessor(ScheduleGraphNode * node)25 void InstructionScheduler::ScheduleGraphNode::AddSuccessor(
26 ScheduleGraphNode* node) {
27 successors_.push_back(node);
28 node->unscheduled_predecessors_count_++;
29 }
30
31
InstructionScheduler(Zone * zone,InstructionSequence * sequence)32 InstructionScheduler::InstructionScheduler(Zone* zone,
33 InstructionSequence* sequence)
34 : zone_(zone),
35 sequence_(sequence),
36 graph_(zone),
37 last_side_effect_instr_(nullptr),
38 pending_loads_(zone),
39 last_live_in_reg_marker_(nullptr) {
40 }
41
42
StartBlock(RpoNumber rpo)43 void InstructionScheduler::StartBlock(RpoNumber rpo) {
44 DCHECK(graph_.empty());
45 DCHECK(last_side_effect_instr_ == nullptr);
46 DCHECK(pending_loads_.empty());
47 DCHECK(last_live_in_reg_marker_ == nullptr);
48 sequence()->StartBlock(rpo);
49 }
50
51
EndBlock(RpoNumber rpo)52 void InstructionScheduler::EndBlock(RpoNumber rpo) {
53 ScheduleBlock();
54 sequence()->EndBlock(rpo);
55 graph_.clear();
56 last_side_effect_instr_ = nullptr;
57 pending_loads_.clear();
58 last_live_in_reg_marker_ = nullptr;
59 }
60
61
AddInstruction(Instruction * instr)62 void InstructionScheduler::AddInstruction(Instruction* instr) {
63 ScheduleGraphNode* new_node = new (zone()) ScheduleGraphNode(zone(), instr);
64
65 if (IsBlockTerminator(instr)) {
66 // Make sure that basic block terminators are not moved by adding them
67 // as successor of every instruction.
68 for (auto node : graph_) {
69 node->AddSuccessor(new_node);
70 }
71 } else if (IsFixedRegisterParameter(instr)) {
72 if (last_live_in_reg_marker_ != nullptr) {
73 last_live_in_reg_marker_->AddSuccessor(new_node);
74 }
75 last_live_in_reg_marker_ = new_node;
76 } else {
77 if (last_live_in_reg_marker_ != nullptr) {
78 last_live_in_reg_marker_->AddSuccessor(new_node);
79 }
80
81 // Instructions with side effects and memory operations can't be
82 // reordered with respect to each other.
83 if (HasSideEffect(instr)) {
84 if (last_side_effect_instr_ != nullptr) {
85 last_side_effect_instr_->AddSuccessor(new_node);
86 }
87 for (auto load : pending_loads_) {
88 load->AddSuccessor(new_node);
89 }
90 pending_loads_.clear();
91 last_side_effect_instr_ = new_node;
92 } else if (IsLoadOperation(instr)) {
93 // Load operations can't be reordered with side effects instructions but
94 // independent loads can be reordered with respect to each other.
95 if (last_side_effect_instr_ != nullptr) {
96 last_side_effect_instr_->AddSuccessor(new_node);
97 }
98 pending_loads_.push_back(new_node);
99 }
100
101 // Look for operand dependencies.
102 for (auto node : graph_) {
103 if (HasOperandDependency(node->instruction(), instr)) {
104 node->AddSuccessor(new_node);
105 }
106 }
107 }
108
109 graph_.push_back(new_node);
110 }
111
112
CompareNodes(ScheduleGraphNode * node1,ScheduleGraphNode * node2) const113 bool InstructionScheduler::CompareNodes(ScheduleGraphNode *node1,
114 ScheduleGraphNode *node2) const {
115 return node1->total_latency() > node2->total_latency();
116 }
117
118
ScheduleBlock()119 void InstructionScheduler::ScheduleBlock() {
120 ZoneLinkedList<ScheduleGraphNode*> ready_list(zone());
121
122 // Compute total latencies so that we can schedule the critical path first.
123 ComputeTotalLatencies();
124
125 // Add nodes which don't have dependencies to the ready list.
126 for (auto node : graph_) {
127 if (!node->HasUnscheduledPredecessor()) {
128 ready_list.push_back(node);
129 }
130 }
131
132 // Go through the ready list and schedule the instructions.
133 int cycle = 0;
134 while (!ready_list.empty()) {
135 auto candidate = ready_list.end();
136 for (auto iterator = ready_list.begin(); iterator != ready_list.end();
137 ++iterator) {
138 // Look for the best candidate to schedule.
139 // We only consider instructions that have all their operands ready and
140 // we try to schedule the critical path first (we look for the instruction
141 // with the highest latency on the path to reach the end of the graph).
142 if (cycle >= (*iterator)->start_cycle()) {
143 if ((candidate == ready_list.end()) ||
144 CompareNodes(*iterator, *candidate)) {
145 candidate = iterator;
146 }
147 }
148 }
149
150 if (candidate != ready_list.end()) {
151 sequence()->AddInstruction((*candidate)->instruction());
152
153 for (auto successor : (*candidate)->successors()) {
154 successor->DropUnscheduledPredecessor();
155 successor->set_start_cycle(
156 std::max(successor->start_cycle(),
157 cycle + (*candidate)->latency()));
158
159 if (!successor->HasUnscheduledPredecessor()) {
160 ready_list.push_back(successor);
161 }
162 }
163
164 ready_list.erase(candidate);
165 }
166
167 cycle++;
168 }
169 }
170
171
GetInstructionFlags(const Instruction * instr) const172 int InstructionScheduler::GetInstructionFlags(const Instruction* instr) const {
173 switch (instr->arch_opcode()) {
174 case kArchNop:
175 case kArchStackPointer:
176 case kArchFramePointer:
177 case kArchTruncateDoubleToI:
178 return kNoOpcodeFlags;
179
180 case kArchPrepareCallCFunction:
181 case kArchPrepareTailCall:
182 case kArchCallCFunction:
183 case kArchCallCodeObject:
184 case kArchCallJSFunction:
185 case kArchLazyBailout:
186 return kHasSideEffect;
187
188 case kArchTailCallCodeObject:
189 case kArchTailCallJSFunction:
190 return kHasSideEffect | kIsBlockTerminator;
191
192 case kArchDeoptimize:
193 case kArchJmp:
194 case kArchLookupSwitch:
195 case kArchTableSwitch:
196 case kArchRet:
197 case kArchThrowTerminator:
198 return kIsBlockTerminator;
199
200 case kCheckedLoadInt8:
201 case kCheckedLoadUint8:
202 case kCheckedLoadInt16:
203 case kCheckedLoadUint16:
204 case kCheckedLoadWord32:
205 case kCheckedLoadWord64:
206 case kCheckedLoadFloat32:
207 case kCheckedLoadFloat64:
208 return kIsLoadOperation;
209
210 case kCheckedStoreWord8:
211 case kCheckedStoreWord16:
212 case kCheckedStoreWord32:
213 case kCheckedStoreWord64:
214 case kCheckedStoreFloat32:
215 case kCheckedStoreFloat64:
216 case kArchStoreWithWriteBarrier:
217 return kHasSideEffect;
218
219 #define CASE(Name) case k##Name:
220 TARGET_ARCH_OPCODE_LIST(CASE)
221 #undef CASE
222 return GetTargetInstructionFlags(instr);
223 }
224
225 UNREACHABLE();
226 return kNoOpcodeFlags;
227 }
228
229
HasOperandDependency(const Instruction * instr1,const Instruction * instr2) const230 bool InstructionScheduler::HasOperandDependency(
231 const Instruction* instr1, const Instruction* instr2) const {
232 for (size_t i = 0; i < instr1->OutputCount(); ++i) {
233 for (size_t j = 0; j < instr2->InputCount(); ++j) {
234 const InstructionOperand* output = instr1->OutputAt(i);
235 const InstructionOperand* input = instr2->InputAt(j);
236
237 if (output->IsUnallocated() && input->IsUnallocated() &&
238 (UnallocatedOperand::cast(output)->virtual_register() ==
239 UnallocatedOperand::cast(input)->virtual_register())) {
240 return true;
241 }
242
243 if (output->IsConstant() && input->IsUnallocated() &&
244 (ConstantOperand::cast(output)->virtual_register() ==
245 UnallocatedOperand::cast(input)->virtual_register())) {
246 return true;
247 }
248 }
249 }
250
251 // TODO(bafsa): Do we need to look for anti-dependencies/output-dependencies?
252
253 return false;
254 }
255
256
IsBlockTerminator(const Instruction * instr) const257 bool InstructionScheduler::IsBlockTerminator(const Instruction* instr) const {
258 return ((GetInstructionFlags(instr) & kIsBlockTerminator) ||
259 (instr->flags_mode() == kFlags_branch));
260 }
261
262
ComputeTotalLatencies()263 void InstructionScheduler::ComputeTotalLatencies() {
264 for (auto node : base::Reversed(graph_)) {
265 int max_latency = 0;
266
267 for (auto successor : node->successors()) {
268 DCHECK(successor->total_latency() != -1);
269 if (successor->total_latency() > max_latency) {
270 max_latency = successor->total_latency();
271 }
272 }
273
274 node->set_total_latency(max_latency + node->latency());
275 }
276 }
277
278 } // namespace compiler
279 } // namespace internal
280 } // namespace v8
281