// Copyright 2013 the V8 project authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "src/compiler/scheduler.h" #include #include "src/base/iterator.h" #include "src/builtins/profile-data-reader.h" #include "src/codegen/tick-counter.h" #include "src/compiler/common-operator.h" #include "src/compiler/control-equivalence.h" #include "src/compiler/graph.h" #include "src/compiler/node-marker.h" #include "src/compiler/node-properties.h" #include "src/compiler/node.h" #include "src/utils/bit-vector.h" #include "src/zone/zone-containers.h" namespace v8 { namespace internal { namespace compiler { #define TRACE(...) \ do { \ if (FLAG_trace_turbo_scheduler) PrintF(__VA_ARGS__); \ } while (false) Scheduler::Scheduler(Zone* zone, Graph* graph, Schedule* schedule, Flags flags, size_t node_count_hint, TickCounter* tick_counter, const ProfileDataFromFile* profile_data) : zone_(zone), graph_(graph), schedule_(schedule), flags_(flags), scheduled_nodes_(zone), schedule_root_nodes_(zone), schedule_queue_(zone), node_data_(zone), tick_counter_(tick_counter), profile_data_(profile_data), common_dominator_cache_(zone) { node_data_.reserve(node_count_hint); node_data_.resize(graph->NodeCount(), DefaultSchedulerData()); } Schedule* Scheduler::ComputeSchedule(Zone* zone, Graph* graph, Flags flags, TickCounter* tick_counter, const ProfileDataFromFile* profile_data) { Zone* schedule_zone = (flags & Scheduler::kTempSchedule) ? zone : graph->zone(); // Reserve 10% more space for nodes if node splitting is enabled to try to // avoid resizing the vector since that would triple its zone memory usage. float node_hint_multiplier = (flags & Scheduler::kSplitNodes) ? 1.1 : 1; size_t node_count_hint = node_hint_multiplier * graph->NodeCount(); Schedule* schedule = schedule_zone->New(schedule_zone, node_count_hint); Scheduler scheduler(zone, graph, schedule, flags, node_count_hint, tick_counter, profile_data); scheduler.BuildCFG(); scheduler.ComputeSpecialRPONumbering(); scheduler.GenerateDominatorTree(); scheduler.PrepareUses(); scheduler.ScheduleEarly(); scheduler.ScheduleLate(); scheduler.SealFinalSchedule(); return schedule; } Scheduler::SchedulerData Scheduler::DefaultSchedulerData() { SchedulerData def = {schedule_->start(), 0, kUnknown}; return def; } Scheduler::SchedulerData* Scheduler::GetData(Node* node) { return &node_data_[node->id()]; } Scheduler::Placement Scheduler::InitializePlacement(Node* node) { SchedulerData* data = GetData(node); if (data->placement_ == kFixed) { // Nothing to do for control nodes that have been already fixed in // the schedule. return data->placement_; } DCHECK_EQ(kUnknown, data->placement_); switch (node->opcode()) { case IrOpcode::kParameter: case IrOpcode::kOsrValue: // Parameters and OSR values are always fixed to the start block. data->placement_ = kFixed; break; case IrOpcode::kPhi: case IrOpcode::kEffectPhi: { // Phis and effect phis are fixed if their control inputs are, whereas // otherwise they are coupled to a floating control node. Placement p = GetPlacement(NodeProperties::GetControlInput(node)); data->placement_ = (p == kFixed ? kFixed : kCoupled); break; } default: // Control nodes that were not control-reachable from end may float. data->placement_ = kSchedulable; break; } return data->placement_; } Scheduler::Placement Scheduler::GetPlacement(Node* node) { return GetData(node)->placement_; } bool Scheduler::IsLive(Node* node) { return GetPlacement(node) != kUnknown; } void Scheduler::UpdatePlacement(Node* node, Placement placement) { SchedulerData* data = GetData(node); if (data->placement_ == kUnknown) { // We only update control nodes from {kUnknown} to {kFixed}. Ideally, we // should check that {node} is a control node (including exceptional calls), // but that is expensive. DCHECK_EQ(Scheduler::kFixed, placement); data->placement_ = placement; return; } switch (node->opcode()) { case IrOpcode::kParameter: // Parameters are fixed once and for all. UNREACHABLE(); case IrOpcode::kPhi: case IrOpcode::kEffectPhi: { // Phis and effect phis are coupled to their respective blocks. DCHECK_EQ(Scheduler::kCoupled, data->placement_); DCHECK_EQ(Scheduler::kFixed, placement); Node* control = NodeProperties::GetControlInput(node); BasicBlock* block = schedule_->block(control); schedule_->AddNode(block, node); break; } #define DEFINE_CONTROL_CASE(V) case IrOpcode::k##V: CONTROL_OP_LIST(DEFINE_CONTROL_CASE) #undef DEFINE_CONTROL_CASE { // Control nodes force coupled uses to be placed. for (auto use : node->uses()) { if (GetPlacement(use) == Scheduler::kCoupled) { DCHECK_EQ(node, NodeProperties::GetControlInput(use)); UpdatePlacement(use, placement); } } break; } default: DCHECK_EQ(Scheduler::kSchedulable, data->placement_); DCHECK_EQ(Scheduler::kScheduled, placement); break; } // Reduce the use count of the node's inputs to potentially make them // schedulable. If all the uses of a node have been scheduled, then the node // itself can be scheduled. base::Optional coupled_control_edge = GetCoupledControlEdge(node); for (Edge const edge : node->input_edges()) { DCHECK_EQ(node, edge.from()); if (edge.index() != coupled_control_edge) { DecrementUnscheduledUseCount(edge.to(), node); } } data->placement_ = placement; } base::Optional Scheduler::GetCoupledControlEdge(Node* node) { if (GetPlacement(node) == kCoupled) { return NodeProperties::FirstControlIndex(node); } return {}; } void Scheduler::IncrementUnscheduledUseCount(Node* node, Node* from) { // Tracking use counts for fixed nodes is useless. if (GetPlacement(node) == kFixed) return; // Use count for coupled nodes is summed up on their control. if (GetPlacement(node) == kCoupled) { node = NodeProperties::GetControlInput(node); DCHECK_NE(GetPlacement(node), Placement::kFixed); DCHECK_NE(GetPlacement(node), Placement::kCoupled); } ++(GetData(node)->unscheduled_count_); if (FLAG_trace_turbo_scheduler) { TRACE(" Use count of #%d:%s (used by #%d:%s)++ = %d\n", node->id(), node->op()->mnemonic(), from->id(), from->op()->mnemonic(), GetData(node)->unscheduled_count_); } } void Scheduler::DecrementUnscheduledUseCount(Node* node, Node* from) { // Tracking use counts for fixed nodes is useless. if (GetPlacement(node) == kFixed) return; // Use count for coupled nodes is summed up on their control. if (GetPlacement(node) == kCoupled) { node = NodeProperties::GetControlInput(node); DCHECK_NE(GetPlacement(node), Placement::kFixed); DCHECK_NE(GetPlacement(node), Placement::kCoupled); } DCHECK_LT(0, GetData(node)->unscheduled_count_); --(GetData(node)->unscheduled_count_); if (FLAG_trace_turbo_scheduler) { TRACE(" Use count of #%d:%s (used by #%d:%s)-- = %d\n", node->id(), node->op()->mnemonic(), from->id(), from->op()->mnemonic(), GetData(node)->unscheduled_count_); } if (GetData(node)->unscheduled_count_ == 0) { TRACE(" newly eligible #%d:%s\n", node->id(), node->op()->mnemonic()); schedule_queue_.push(node); } } // ----------------------------------------------------------------------------- // Phase 1: Build control-flow graph. // Internal class to build a control flow graph (i.e the basic blocks and edges // between them within a Schedule) from the node graph. Visits control edges of // the graph backwards from an end node in order to find the connected control // subgraph, needed for scheduling. class CFGBuilder : public ZoneObject { public: CFGBuilder(Zone* zone, Scheduler* scheduler) : zone_(zone), scheduler_(scheduler), schedule_(scheduler->schedule_), queued_(scheduler->graph_, 2), queue_(zone), control_(zone), component_entry_(nullptr), component_start_(nullptr), component_end_(nullptr) {} // Run the control flow graph construction algorithm by walking the graph // backwards from end through control edges, building and connecting the // basic blocks for control nodes. void Run() { ResetDataStructures(); Queue(scheduler_->graph_->end()); while (!queue_.empty()) { // Breadth-first backwards traversal. scheduler_->tick_counter_->TickAndMaybeEnterSafepoint(); Node* node = queue_.front(); queue_.pop(); int max = NodeProperties::PastControlIndex(node); for (int i = NodeProperties::FirstControlIndex(node); i < max; i++) { Queue(node->InputAt(i)); } } for (NodeVector::iterator i = control_.begin(); i != control_.end(); ++i) { ConnectBlocks(*i); // Connect block to its predecessor/successors. } } // Run the control flow graph construction for a minimal control-connected // component ending in {exit} and merge that component into an existing // control flow graph at the bottom of {block}. void Run(BasicBlock* block, Node* exit) { ResetDataStructures(); Queue(exit); component_entry_ = nullptr; component_start_ = block; component_end_ = schedule_->block(exit); scheduler_->equivalence_->Run(exit); while (!queue_.empty()) { // Breadth-first backwards traversal. scheduler_->tick_counter_->TickAndMaybeEnterSafepoint(); Node* node = queue_.front(); queue_.pop(); // Use control dependence equivalence to find a canonical single-entry // single-exit region that makes up a minimal component to be scheduled. if (IsSingleEntrySingleExitRegion(node, exit)) { TRACE("Found SESE at #%d:%s\n", node->id(), node->op()->mnemonic()); DCHECK(!component_entry_); component_entry_ = node; continue; } int max = NodeProperties::PastControlIndex(node); for (int i = NodeProperties::FirstControlIndex(node); i < max; i++) { Queue(node->InputAt(i)); } } DCHECK(component_entry_); for (NodeVector::iterator i = control_.begin(); i != control_.end(); ++i) { ConnectBlocks(*i); // Connect block to its predecessor/successors. } } private: friend class ScheduleLateNodeVisitor; friend class Scheduler; void FixNode(BasicBlock* block, Node* node) { schedule_->AddNode(block, node); scheduler_->UpdatePlacement(node, Scheduler::kFixed); } void Queue(Node* node) { // Mark the connected control nodes as they are queued. if (!queued_.Get(node)) { BuildBlocks(node); queue_.push(node); queued_.Set(node, true); control_.push_back(node); } } void BuildBlocks(Node* node) { switch (node->opcode()) { case IrOpcode::kEnd: FixNode(schedule_->end(), node); break; case IrOpcode::kStart: FixNode(schedule_->start(), node); break; case IrOpcode::kLoop: case IrOpcode::kMerge: BuildBlockForNode(node); break; case IrOpcode::kTerminate: { // Put Terminate in the loop to which it refers. Node* loop = NodeProperties::GetControlInput(node); BasicBlock* block = BuildBlockForNode(loop); FixNode(block, node); break; } case IrOpcode::kBranch: case IrOpcode::kSwitch: BuildBlocksForSuccessors(node); break; #define BUILD_BLOCK_JS_CASE(Name, ...) case IrOpcode::k##Name: JS_OP_LIST(BUILD_BLOCK_JS_CASE) // JS opcodes are just like calls => fall through. #undef BUILD_BLOCK_JS_CASE case IrOpcode::kCall: if (NodeProperties::IsExceptionalCall(node)) { BuildBlocksForSuccessors(node); } break; default: break; } } void ConnectBlocks(Node* node) { switch (node->opcode()) { case IrOpcode::kLoop: case IrOpcode::kMerge: ConnectMerge(node); break; case IrOpcode::kBranch: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectBranch(node); break; case IrOpcode::kSwitch: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectSwitch(node); break; case IrOpcode::kDeoptimize: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectDeoptimize(node); break; case IrOpcode::kTailCall: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectTailCall(node); break; case IrOpcode::kReturn: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectReturn(node); break; case IrOpcode::kThrow: scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectThrow(node); break; #define CONNECT_BLOCK_JS_CASE(Name, ...) case IrOpcode::k##Name: JS_OP_LIST(CONNECT_BLOCK_JS_CASE) // JS opcodes are just like calls => fall through. #undef CONNECT_BLOCK_JS_CASE case IrOpcode::kCall: if (NodeProperties::IsExceptionalCall(node)) { scheduler_->UpdatePlacement(node, Scheduler::kFixed); ConnectCall(node); } break; default: break; } } BasicBlock* BuildBlockForNode(Node* node) { BasicBlock* block = schedule_->block(node); if (block == nullptr) { block = schedule_->NewBasicBlock(); TRACE("Create block id:%d for #%d:%s\n", block->id().ToInt(), node->id(), node->op()->mnemonic()); FixNode(block, node); } return block; } void BuildBlocksForSuccessors(Node* node) { size_t const successor_cnt = node->op()->ControlOutputCount(); Node** successors = zone_->NewArray(successor_cnt); NodeProperties::CollectControlProjections(node, successors, successor_cnt); for (size_t index = 0; index < successor_cnt; ++index) { BuildBlockForNode(successors[index]); } } void CollectSuccessorBlocks(Node* node, BasicBlock** successor_blocks, size_t successor_cnt) { Node** successors = reinterpret_cast(successor_blocks); NodeProperties::CollectControlProjections(node, successors, successor_cnt); for (size_t index = 0; index < successor_cnt; ++index) { successor_blocks[index] = schedule_->block(successors[index]); } } BasicBlock* FindPredecessorBlock(Node* node) { BasicBlock* predecessor_block = nullptr; while (true) { predecessor_block = schedule_->block(node); if (predecessor_block != nullptr) break; node = NodeProperties::GetControlInput(node); } return predecessor_block; } void ConnectCall(Node* call) { BasicBlock* successor_blocks[2]; CollectSuccessorBlocks(call, successor_blocks, arraysize(successor_blocks)); // Consider the exception continuation to be deferred. successor_blocks[1]->set_deferred(true); Node* call_control = NodeProperties::GetControlInput(call); BasicBlock* call_block = FindPredecessorBlock(call_control); TraceConnect(call, call_block, successor_blocks[0]); TraceConnect(call, call_block, successor_blocks[1]); schedule_->AddCall(call_block, call, successor_blocks[0], successor_blocks[1]); } void ConnectBranch(Node* branch) { BasicBlock* successor_blocks[2]; CollectSuccessorBlocks(branch, successor_blocks, arraysize(successor_blocks)); BranchHint hint_from_profile = BranchHint::kNone; if (const ProfileDataFromFile* profile_data = scheduler_->profile_data()) { double block_zero_count = profile_data->GetCounter(successor_blocks[0]->id().ToSize()); double block_one_count = profile_data->GetCounter(successor_blocks[1]->id().ToSize()); // If a branch is visited a non-trivial number of times and substantially // more often than its alternative, then mark it as likely. constexpr double kMinimumCount = 100000; constexpr double kThresholdRatio = 4000; if (block_zero_count > kMinimumCount && block_zero_count / kThresholdRatio > block_one_count) { hint_from_profile = BranchHint::kTrue; } else if (block_one_count > kMinimumCount && block_one_count / kThresholdRatio > block_zero_count) { hint_from_profile = BranchHint::kFalse; } } // Consider branch hints. switch (hint_from_profile) { case BranchHint::kNone: switch (BranchHintOf(branch->op())) { case BranchHint::kNone: break; case BranchHint::kTrue: successor_blocks[1]->set_deferred(true); break; case BranchHint::kFalse: successor_blocks[0]->set_deferred(true); break; } break; case BranchHint::kTrue: successor_blocks[1]->set_deferred(true); break; case BranchHint::kFalse: successor_blocks[0]->set_deferred(true); break; } if (hint_from_profile != BranchHint::kNone && BranchHintOf(branch->op()) != BranchHint::kNone && hint_from_profile != BranchHintOf(branch->op())) { PrintF("Warning: profiling data overrode manual branch hint.\n"); } if (branch == component_entry_) { TraceConnect(branch, component_start_, successor_blocks[0]); TraceConnect(branch, component_start_, successor_blocks[1]); schedule_->InsertBranch(component_start_, component_end_, branch, successor_blocks[0], successor_blocks[1]); } else { Node* branch_control = NodeProperties::GetControlInput(branch); BasicBlock* branch_block = FindPredecessorBlock(branch_control); TraceConnect(branch, branch_block, successor_blocks[0]); TraceConnect(branch, branch_block, successor_blocks[1]); schedule_->AddBranch(branch_block, branch, successor_blocks[0], successor_blocks[1]); } } void ConnectSwitch(Node* sw) { size_t const successor_count = sw->op()->ControlOutputCount(); BasicBlock** successor_blocks = zone_->NewArray(successor_count); CollectSuccessorBlocks(sw, successor_blocks, successor_count); if (sw == component_entry_) { for (size_t index = 0; index < successor_count; ++index) { TraceConnect(sw, component_start_, successor_blocks[index]); } schedule_->InsertSwitch(component_start_, component_end_, sw, successor_blocks, successor_count); } else { Node* switch_control = NodeProperties::GetControlInput(sw); BasicBlock* switch_block = FindPredecessorBlock(switch_control); for (size_t index = 0; index < successor_count; ++index) { TraceConnect(sw, switch_block, successor_blocks[index]); } schedule_->AddSwitch(switch_block, sw, successor_blocks, successor_count); } for (size_t index = 0; index < successor_count; ++index) { if (BranchHintOf(successor_blocks[index]->front()->op()) == BranchHint::kFalse) { successor_blocks[index]->set_deferred(true); } } } void ConnectMerge(Node* merge) { // Don't connect the special merge at the end to its predecessors. if (IsFinalMerge(merge)) return; BasicBlock* block = schedule_->block(merge); DCHECK_NOT_NULL(block); // For all of the merge's control inputs, add a goto at the end to the // merge's basic block. for (Node* const input : merge->inputs()) { BasicBlock* predecessor_block = FindPredecessorBlock(input); TraceConnect(merge, predecessor_block, block); schedule_->AddGoto(predecessor_block, block); } } void ConnectTailCall(Node* call) { Node* call_control = NodeProperties::GetControlInput(call); BasicBlock* call_block = FindPredecessorBlock(call_control); TraceConnect(call, call_block, nullptr); schedule_->AddTailCall(call_block, call); } void ConnectReturn(Node* ret) { Node* return_control = NodeProperties::GetControlInput(ret); BasicBlock* return_block = FindPredecessorBlock(return_control); TraceConnect(ret, return_block, nullptr); schedule_->AddReturn(return_block, ret); } void ConnectDeoptimize(Node* deopt) { Node* deoptimize_control = NodeProperties::GetControlInput(deopt); BasicBlock* deoptimize_block = FindPredecessorBlock(deoptimize_control); TraceConnect(deopt, deoptimize_block, nullptr); schedule_->AddDeoptimize(deoptimize_block, deopt); } void ConnectThrow(Node* thr) { Node* throw_control = NodeProperties::GetControlInput(thr); BasicBlock* throw_block = FindPredecessorBlock(throw_control); TraceConnect(thr, throw_block, nullptr); schedule_->AddThrow(throw_block, thr); } void TraceConnect(Node* node, BasicBlock* block, BasicBlock* succ) { DCHECK_NOT_NULL(block); if (succ == nullptr) { TRACE("Connect #%d:%s, id:%d -> end\n", node->id(), node->op()->mnemonic(), block->id().ToInt()); } else { TRACE("Connect #%d:%s, id:%d -> id:%d\n", node->id(), node->op()->mnemonic(), block->id().ToInt(), succ->id().ToInt()); } } bool IsFinalMerge(Node* node) { return (node->opcode() == IrOpcode::kMerge && node == scheduler_->graph_->end()->InputAt(0)); } bool IsSingleEntrySingleExitRegion(Node* entry, Node* exit) const { size_t entry_class = scheduler_->equivalence_->ClassOf(entry); size_t exit_class = scheduler_->equivalence_->ClassOf(exit); return entry != exit && entry_class == exit_class; } void ResetDataStructures() { control_.clear(); DCHECK(queue_.empty()); DCHECK(control_.empty()); } Zone* zone_; Scheduler* scheduler_; Schedule* schedule_; NodeMarker queued_; // Mark indicating whether node is queued. ZoneQueue queue_; // Queue used for breadth-first traversal. NodeVector control_; // List of encountered control nodes. Node* component_entry_; // Component single-entry node. BasicBlock* component_start_; // Component single-entry block. BasicBlock* component_end_; // Component single-exit block. }; void Scheduler::BuildCFG() { TRACE("--- CREATING CFG -------------------------------------------\n"); // Instantiate a new control equivalence algorithm for the graph. equivalence_ = zone_->New(zone_, graph_); // Build a control-flow graph for the main control-connected component that // is being spanned by the graph's start and end nodes. control_flow_builder_ = zone_->New(zone_, this); control_flow_builder_->Run(); // Initialize per-block data. // Reserve an extra 10% to avoid resizing vector when fusing floating control. scheduled_nodes_.reserve(schedule_->BasicBlockCount() * 1.1); scheduled_nodes_.resize(schedule_->BasicBlockCount()); } // ----------------------------------------------------------------------------- // Phase 2: Compute special RPO and dominator tree. // Compute the special reverse-post-order block ordering, which is essentially // a RPO of the graph where loop bodies are contiguous. Properties: // 1. If block A is a predecessor of B, then A appears before B in the order, // unless B is a loop header and A is in the loop headed at B // (i.e. A -> B is a backedge). // => If block A dominates block B, then A appears before B in the order. // => If block A is a loop header, A appears before all blocks in the loop // headed at A. // 2. All loops are contiguous in the order (i.e. no intervening blocks that // do not belong to the loop.) // Note a simple RPO traversal satisfies (1) but not (2). class SpecialRPONumberer : public ZoneObject { public: SpecialRPONumberer(Zone* zone, Schedule* schedule) : zone_(zone), schedule_(schedule), order_(nullptr), beyond_end_(nullptr), loops_(zone), backedges_(zone), stack_(zone), previous_block_count_(0), empty_(0, zone) {} // Computes the special reverse-post-order for the main control flow graph, // that is for the graph spanned between the schedule's start and end blocks. void ComputeSpecialRPO() { DCHECK_EQ(0, schedule_->end()->SuccessorCount()); DCHECK(!order_); // Main order does not exist yet. ComputeAndInsertSpecialRPO(schedule_->start(), schedule_->end()); } // Computes the special reverse-post-order for a partial control flow graph, // that is for the graph spanned between the given {entry} and {end} blocks, // then updates the existing ordering with this new information. void UpdateSpecialRPO(BasicBlock* entry, BasicBlock* end) { DCHECK(order_); // Main order to be updated is present. ComputeAndInsertSpecialRPO(entry, end); } // Serialize the previously computed order as a special reverse-post-order // numbering for basic blocks into the final schedule. void SerializeRPOIntoSchedule() { int32_t number = 0; for (BasicBlock* b = order_; b != nullptr; b = b->rpo_next()) { b->set_rpo_number(number++); schedule_->rpo_order()->push_back(b); } BeyondEndSentinel()->set_rpo_number(number); } // Print and verify the special reverse-post-order. void PrintAndVerifySpecialRPO() { #if DEBUG if (FLAG_trace_turbo_scheduler) PrintRPO(); VerifySpecialRPO(); #endif } const ZoneVector& GetOutgoingBlocks(BasicBlock* block) { if (HasLoopNumber(block)) { LoopInfo const& loop = loops_[GetLoopNumber(block)]; if (loop.outgoing) return *loop.outgoing; } return empty_; } bool HasLoopBlocks() const { return loops_.size() != 0; } private: using Backedge = std::pair; // Numbering for BasicBlock::rpo_number for this block traversal: static const int kBlockOnStack = -2; static const int kBlockVisited1 = -3; static const int kBlockVisited2 = -4; static const int kBlockUnvisited1 = -1; static const int kBlockUnvisited2 = kBlockVisited1; struct SpecialRPOStackFrame { BasicBlock* block; size_t index; }; struct LoopInfo { BasicBlock* header; ZoneVector* outgoing; BitVector* members; LoopInfo* prev; BasicBlock* end; BasicBlock* start; void AddOutgoing(Zone* zone, BasicBlock* block) { if (outgoing == nullptr) { outgoing = zone->New>(zone); } outgoing->push_back(block); } }; int Push(int depth, BasicBlock* child, int unvisited) { if (child->rpo_number() == unvisited) { stack_[depth].block = child; stack_[depth].index = 0; child->set_rpo_number(kBlockOnStack); return depth + 1; } return depth; } BasicBlock* PushFront(BasicBlock* head, BasicBlock* block) { block->set_rpo_next(head); return block; } static int GetLoopNumber(BasicBlock* block) { return block->loop_number(); } static void SetLoopNumber(BasicBlock* block, int loop_number) { return block->set_loop_number(loop_number); } static bool HasLoopNumber(BasicBlock* block) { return block->loop_number() >= 0; } // We only need this special sentinel because some tests use the schedule's // end block in actual control flow (e.g. with end having successors). BasicBlock* BeyondEndSentinel() { if (beyond_end_ == nullptr) { BasicBlock::Id id = BasicBlock::Id::FromInt(-1); beyond_end_ = schedule_->zone()->New(schedule_->zone(), id); } return beyond_end_; } // Compute special RPO for the control flow graph between {entry} and {end}, // mutating any existing order so that the result is still valid. void ComputeAndInsertSpecialRPO(BasicBlock* entry, BasicBlock* end) { // RPO should not have been serialized for this schedule yet. CHECK_EQ(kBlockUnvisited1, schedule_->start()->loop_number()); CHECK_EQ(kBlockUnvisited1, schedule_->start()->rpo_number()); CHECK_EQ(0, static_cast(schedule_->rpo_order()->size())); // Find correct insertion point within existing order. BasicBlock* insertion_point = entry->rpo_next(); BasicBlock* order = insertion_point; // Perform an iterative RPO traversal using an explicit stack, // recording backedges that form cycles. O(|B|). DCHECK_LT(previous_block_count_, schedule_->BasicBlockCount()); stack_.resize(schedule_->BasicBlockCount() - previous_block_count_); previous_block_count_ = schedule_->BasicBlockCount(); int stack_depth = Push(0, entry, kBlockUnvisited1); int num_loops = static_cast(loops_.size()); while (stack_depth > 0) { int current = stack_depth - 1; SpecialRPOStackFrame* frame = &stack_[current]; if (frame->block != end && frame->index < frame->block->SuccessorCount()) { // Process the next successor. BasicBlock* succ = frame->block->SuccessorAt(frame->index++); if (succ->rpo_number() == kBlockVisited1) continue; if (succ->rpo_number() == kBlockOnStack) { // The successor is on the stack, so this is a backedge (cycle). backedges_.push_back(Backedge(frame->block, frame->index - 1)); if (!HasLoopNumber(succ)) { // Assign a new loop number to the header if it doesn't have one. SetLoopNumber(succ, num_loops++); } } else { // Push the successor onto the stack. DCHECK_EQ(kBlockUnvisited1, succ->rpo_number()); stack_depth = Push(stack_depth, succ, kBlockUnvisited1); } } else { // Finished with all successors; pop the stack and add the block. order = PushFront(order, frame->block); frame->block->set_rpo_number(kBlockVisited1); stack_depth--; } } // If no loops were encountered, then the order we computed was correct. if (num_loops > static_cast(loops_.size())) { // Otherwise, compute the loop information from the backedges in order // to perform a traversal that groups loop bodies together. ComputeLoopInfo(&stack_, num_loops, &backedges_); // Initialize the "loop stack". Note the entry could be a loop header. LoopInfo* loop = HasLoopNumber(entry) ? &loops_[GetLoopNumber(entry)] : nullptr; order = insertion_point; // Perform an iterative post-order traversal, visiting loop bodies before // edges that lead out of loops. Visits each block once, but linking loop // sections together is linear in the loop size, so overall is // O(|B| + max(loop_depth) * max(|loop|)) stack_depth = Push(0, entry, kBlockUnvisited2); while (stack_depth > 0) { SpecialRPOStackFrame* frame = &stack_[stack_depth - 1]; BasicBlock* block = frame->block; BasicBlock* succ = nullptr; if (block != end && frame->index < block->SuccessorCount()) { // Process the next normal successor. succ = block->SuccessorAt(frame->index++); } else if (HasLoopNumber(block)) { // Process additional outgoing edges from the loop header. if (block->rpo_number() == kBlockOnStack) { // Finish the loop body the first time the header is left on the // stack. DCHECK(loop != nullptr && loop->header == block); loop->start = PushFront(order, block); order = loop->end; block->set_rpo_number(kBlockVisited2); // Pop the loop stack and continue visiting outgoing edges within // the context of the outer loop, if any. loop = loop->prev; // We leave the loop header on the stack; the rest of this iteration // and later iterations will go through its outgoing edges list. } // Use the next outgoing edge if there are any. size_t outgoing_index = frame->index - block->SuccessorCount(); LoopInfo* info = &loops_[GetLoopNumber(block)]; DCHECK(loop != info); if (block != entry && info->outgoing != nullptr && outgoing_index < info->outgoing->size()) { succ = info->outgoing->at(outgoing_index); frame->index++; } } if (succ != nullptr) { // Process the next successor. if (succ->rpo_number() == kBlockOnStack) continue; if (succ->rpo_number() == kBlockVisited2) continue; DCHECK_EQ(kBlockUnvisited2, succ->rpo_number()); if (loop != nullptr && !loop->members->Contains(succ->id().ToInt())) { // The successor is not in the current loop or any nested loop. // Add it to the outgoing edges of this loop and visit it later. loop->AddOutgoing(zone_, succ); } else { // Push the successor onto the stack. stack_depth = Push(stack_depth, succ, kBlockUnvisited2); if (HasLoopNumber(succ)) { // Push the inner loop onto the loop stack. DCHECK(GetLoopNumber(succ) < num_loops); LoopInfo* next = &loops_[GetLoopNumber(succ)]; next->end = order; next->prev = loop; loop = next; } } } else { // Finished with all successors of the current block. if (HasLoopNumber(block)) { // If we are going to pop a loop header, then add its entire body. LoopInfo* info = &loops_[GetLoopNumber(block)]; for (BasicBlock* b = info->start; true; b = b->rpo_next()) { if (b->rpo_next() == info->end) { b->set_rpo_next(order); info->end = order; break; } } order = info->start; } else { // Pop a single node off the stack and add it to the order. order = PushFront(order, block); block->set_rpo_number(kBlockVisited2); } stack_depth--; } } } // Publish new order the first time. if (order_ == nullptr) order_ = order; // Compute the correct loop headers and set the correct loop ends. LoopInfo* current_loop = nullptr; BasicBlock* current_header = entry->loop_header(); int32_t loop_depth = entry->loop_depth(); if (entry->IsLoopHeader()) --loop_depth; // Entry might be a loop header. for (BasicBlock* b = order; b != insertion_point; b = b->rpo_next()) { BasicBlock* current = b; // Reset BasicBlock::rpo_number again. current->set_rpo_number(kBlockUnvisited1); // Finish the previous loop(s) if we just exited them. while (current_header != nullptr && current == current_header->loop_end()) { DCHECK(current_header->IsLoopHeader()); DCHECK_NOT_NULL(current_loop); current_loop = current_loop->prev; current_header = current_loop == nullptr ? nullptr : current_loop->header; --loop_depth; } current->set_loop_header(current_header); // Push a new loop onto the stack if this loop is a loop header. if (HasLoopNumber(current)) { ++loop_depth; current_loop = &loops_[GetLoopNumber(current)]; BasicBlock* loop_end = current_loop->end; current->set_loop_end(loop_end == nullptr ? BeyondEndSentinel() : loop_end); current_header = current_loop->header; TRACE("id:%d is a loop header, increment loop depth to %d\n", current->id().ToInt(), loop_depth); } current->set_loop_depth(loop_depth); if (current->loop_header() == nullptr) { TRACE("id:%d is not in a loop (depth == %d)\n", current->id().ToInt(), current->loop_depth()); } else { TRACE("id:%d has loop header id:%d, (depth == %d)\n", current->id().ToInt(), current->loop_header()->id().ToInt(), current->loop_depth()); } } } // Computes loop membership from the backedges of the control flow graph. void ComputeLoopInfo(ZoneVector* queue, size_t num_loops, ZoneVector* backedges) { // Extend existing loop membership vectors. for (LoopInfo& loop : loops_) { loop.members->Resize(static_cast(schedule_->BasicBlockCount()), zone_); } // Extend loop information vector. loops_.resize(num_loops, LoopInfo()); // Compute loop membership starting from backedges. // O(max(loop_depth) * max(|loop|) for (size_t i = 0; i < backedges->size(); i++) { BasicBlock* member = backedges->at(i).first; BasicBlock* header = member->SuccessorAt(backedges->at(i).second); size_t loop_num = GetLoopNumber(header); if (loops_[loop_num].header == nullptr) { loops_[loop_num].header = header; loops_[loop_num].members = zone_->New( static_cast(schedule_->BasicBlockCount()), zone_); } int queue_length = 0; if (member != header) { // As long as the header doesn't have a backedge to itself, // Push the member onto the queue and process its predecessors. if (!loops_[loop_num].members->Contains(member->id().ToInt())) { loops_[loop_num].members->Add(member->id().ToInt()); } (*queue)[queue_length++].block = member; } // Propagate loop membership backwards. All predecessors of M up to the // loop header H are members of the loop too. O(|blocks between M and H|). while (queue_length > 0) { BasicBlock* block = (*queue)[--queue_length].block; for (size_t j = 0; j < block->PredecessorCount(); j++) { BasicBlock* pred = block->PredecessorAt(j); if (pred != header) { if (!loops_[loop_num].members->Contains(pred->id().ToInt())) { loops_[loop_num].members->Add(pred->id().ToInt()); (*queue)[queue_length++].block = pred; } } } } } } #if DEBUG void PrintRPO() { StdoutStream os; os << "RPO with " << loops_.size() << " loops"; if (loops_.size() > 0) { os << " ("; for (size_t i = 0; i < loops_.size(); i++) { if (i > 0) os << " "; os << "id:" << loops_[i].header->id(); } os << ")"; } os << ":\n"; for (BasicBlock* block = order_; block != nullptr; block = block->rpo_next()) { os << std::setw(5) << "B" << block->rpo_number() << ":"; for (size_t i = 0; i < loops_.size(); i++) { bool range = loops_[i].header->LoopContains(block); bool membership = loops_[i].header != block && range; os << (membership ? " |" : " "); os << (range ? "x" : " "); } os << " id:" << block->id() << ": "; if (block->loop_end() != nullptr) { os << " range: [B" << block->rpo_number() << ", B" << block->loop_end()->rpo_number() << ")"; } if (block->loop_header() != nullptr) { os << " header: id:" << block->loop_header()->id(); } if (block->loop_depth() > 0) { os << " depth: " << block->loop_depth(); } os << "\n"; } } void VerifySpecialRPO() { BasicBlockVector* order = schedule_->rpo_order(); DCHECK_LT(0, order->size()); DCHECK_EQ(0, (*order)[0]->id().ToInt()); // entry should be first. for (size_t i = 0; i < loops_.size(); i++) { LoopInfo* loop = &loops_[i]; BasicBlock* header = loop->header; BasicBlock* end = header->loop_end(); DCHECK_NOT_NULL(header); DCHECK_LE(0, header->rpo_number()); DCHECK_LT(header->rpo_number(), order->size()); DCHECK_NOT_NULL(end); DCHECK_LE(end->rpo_number(), order->size()); DCHECK_GT(end->rpo_number(), header->rpo_number()); DCHECK_NE(header->loop_header(), header); // Verify the start ... end list relationship. int links = 0; BasicBlock* block = loop->start; DCHECK_EQ(header, block); bool end_found; while (true) { if (block == nullptr || block == loop->end) { end_found = (loop->end == block); break; } // The list should be in same order as the final result. DCHECK(block->rpo_number() == links + header->rpo_number()); links++; block = block->rpo_next(); DCHECK_LT(links, static_cast(2 * order->size())); // cycle? } DCHECK_LT(0, links); DCHECK_EQ(links, end->rpo_number() - header->rpo_number()); DCHECK(end_found); // Check loop depth of the header. int loop_depth = 0; for (LoopInfo* outer = loop; outer != nullptr; outer = outer->prev) { loop_depth++; } DCHECK_EQ(loop_depth, header->loop_depth()); // Check the contiguousness of loops. int count = 0; for (int j = 0; j < static_cast(order->size()); j++) { block = order->at(j); DCHECK_EQ(block->rpo_number(), j); if (j < header->rpo_number() || j >= end->rpo_number()) { DCHECK(!header->LoopContains(block)); } else { DCHECK(header->LoopContains(block)); DCHECK_GE(block->loop_depth(), loop_depth); count++; } } DCHECK_EQ(links, count); } } #endif // DEBUG Zone* zone_; Schedule* schedule_; BasicBlock* order_; BasicBlock* beyond_end_; ZoneVector loops_; ZoneVector backedges_; ZoneVector stack_; size_t previous_block_count_; ZoneVector const empty_; }; BasicBlockVector* Scheduler::ComputeSpecialRPO(Zone* zone, Schedule* schedule) { SpecialRPONumberer numberer(zone, schedule); numberer.ComputeSpecialRPO(); numberer.SerializeRPOIntoSchedule(); numberer.PrintAndVerifySpecialRPO(); return schedule->rpo_order(); } void Scheduler::ComputeSpecialRPONumbering() { TRACE("--- COMPUTING SPECIAL RPO ----------------------------------\n"); // Compute the special reverse-post-order for basic blocks. special_rpo_ = zone_->New(zone_, schedule_); special_rpo_->ComputeSpecialRPO(); } BasicBlock* Scheduler::GetCommonDominatorIfCached(BasicBlock* b1, BasicBlock* b2) { auto entry1 = common_dominator_cache_.find(b1->id().ToInt()); if (entry1 == common_dominator_cache_.end()) return nullptr; auto entry2 = entry1->second->find(b2->id().ToInt()); if (entry2 == entry1->second->end()) return nullptr; return entry2->second; } BasicBlock* Scheduler::GetCommonDominator(BasicBlock* b1, BasicBlock* b2) { // A very common fast case: if (b1 == b2) return b1; // Try to find the common dominator by walking, if there is a chance of // finding it quickly. constexpr int kCacheGranularity = 63; STATIC_ASSERT((kCacheGranularity & (kCacheGranularity + 1)) == 0); int depth_difference = b1->dominator_depth() - b2->dominator_depth(); if (depth_difference > -kCacheGranularity && depth_difference < kCacheGranularity) { for (int i = 0; i < kCacheGranularity; i++) { if (b1->dominator_depth() < b2->dominator_depth()) { b2 = b2->dominator(); } else { b1 = b1->dominator(); } if (b1 == b2) return b1; } // We might fall out of the loop here if the dominator tree has several // deep "parallel" subtrees. } // If it'd be a long walk, take the bus instead (i.e. use the cache). // To keep memory consumption low, there'll be a bus stop every 64 blocks. // First, walk to the nearest bus stop. if (b1->dominator_depth() < b2->dominator_depth()) std::swap(b1, b2); while ((b1->dominator_depth() & kCacheGranularity) != 0) { if (V8_LIKELY(b1->dominator_depth() > b2->dominator_depth())) { b1 = b1->dominator(); } else { b2 = b2->dominator(); } if (b1 == b2) return b1; } // Then, walk from bus stop to bus stop until we either find a bus (i.e. an // existing cache entry) or the result. Make a list of any empty bus stops // we'd like to populate for next time. constexpr int kMaxNewCacheEntries = 2 * 50; // Must be even. // This array stores a flattened list of pairs, e.g. if after finding the // {result}, we want to cache [(B11, B12) -> result, (B21, B22) -> result], // then we store [11, 12, 21, 22] here. int new_cache_entries[kMaxNewCacheEntries]; // Next free slot in {new_cache_entries}. int new_cache_entries_cursor = 0; while (b1 != b2) { if ((b1->dominator_depth() & kCacheGranularity) == 0) { BasicBlock* maybe_cache_hit = GetCommonDominatorIfCached(b1, b2); if (maybe_cache_hit != nullptr) { b1 = b2 = maybe_cache_hit; break; } else if (new_cache_entries_cursor < kMaxNewCacheEntries) { new_cache_entries[new_cache_entries_cursor++] = b1->id().ToInt(); new_cache_entries[new_cache_entries_cursor++] = b2->id().ToInt(); } } if (V8_LIKELY(b1->dominator_depth() > b2->dominator_depth())) { b1 = b1->dominator(); } else { b2 = b2->dominator(); } } // Lastly, create new cache entries we noted down earlier. BasicBlock* result = b1; for (int i = 0; i < new_cache_entries_cursor;) { int id1 = new_cache_entries[i++]; int id2 = new_cache_entries[i++]; ZoneMap* mapping; auto entry = common_dominator_cache_.find(id1); if (entry == common_dominator_cache_.end()) { mapping = zone_->New>(zone_); common_dominator_cache_[id1] = mapping; } else { mapping = entry->second; } // If there was an existing entry, we would have found it earlier. DCHECK_EQ(mapping->find(id2), mapping->end()); mapping->insert({id2, result}); } return result; } void Scheduler::PropagateImmediateDominators(BasicBlock* block) { for (/*nop*/; block != nullptr; block = block->rpo_next()) { auto pred = block->predecessors().begin(); auto end = block->predecessors().end(); DCHECK(pred != end); // All blocks except start have predecessors. BasicBlock* dominator = *pred; bool deferred = dominator->deferred(); // For multiple predecessors, walk up the dominator tree until a common // dominator is found. Visitation order guarantees that all predecessors // except for backwards edges have been visited. // We use a one-element cache for previously-seen dominators. This gets // hit a lot for functions that have long chains of diamonds, and in // those cases turns quadratic into linear complexity. BasicBlock* cache = nullptr; for (++pred; pred != end; ++pred) { // Don't examine backwards edges. if ((*pred)->dominator_depth() < 0) continue; if ((*pred)->dominator_depth() > 3 && ((*pred)->dominator()->dominator() == cache || (*pred)->dominator()->dominator()->dominator() == cache)) { // Nothing to do, the last iteration covered this case. DCHECK_EQ(dominator, BasicBlock::GetCommonDominator(dominator, *pred)); } else { dominator = BasicBlock::GetCommonDominator(dominator, *pred); } cache = (*pred)->dominator(); deferred = deferred & (*pred)->deferred(); } block->set_dominator(dominator); block->set_dominator_depth(dominator->dominator_depth() + 1); block->set_deferred(deferred | block->deferred()); TRACE("Block id:%d's idom is id:%d, depth = %d\n", block->id().ToInt(), dominator->id().ToInt(), block->dominator_depth()); } } void Scheduler::GenerateDominatorTree(Schedule* schedule) { // Seed start block to be the first dominator. schedule->start()->set_dominator_depth(0); // Build the block dominator tree resulting from the above seed. PropagateImmediateDominators(schedule->start()->rpo_next()); } void Scheduler::GenerateDominatorTree() { TRACE("--- IMMEDIATE BLOCK DOMINATORS -----------------------------\n"); GenerateDominatorTree(schedule_); } // ----------------------------------------------------------------------------- // Phase 3: Prepare use counts for nodes. class PrepareUsesVisitor { public: explicit PrepareUsesVisitor(Scheduler* scheduler, Graph* graph, Zone* zone) : scheduler_(scheduler), schedule_(scheduler->schedule_), graph_(graph), visited_(graph_->NodeCount(), false, zone), stack_(zone) {} void Run() { InitializePlacement(graph_->end()); while (!stack_.empty()) { Node* node = stack_.top(); stack_.pop(); VisitInputs(node); } } private: void InitializePlacement(Node* node) { TRACE("Pre #%d:%s\n", node->id(), node->op()->mnemonic()); DCHECK(!Visited(node)); if (scheduler_->InitializePlacement(node) == Scheduler::kFixed) { // Fixed nodes are always roots for schedule late. scheduler_->schedule_root_nodes_.push_back(node); if (!schedule_->IsScheduled(node)) { // Make sure root nodes are scheduled in their respective blocks. TRACE("Scheduling fixed position node #%d:%s\n", node->id(), node->op()->mnemonic()); IrOpcode::Value opcode = node->opcode(); BasicBlock* block = opcode == IrOpcode::kParameter ? schedule_->start() : schedule_->block(NodeProperties::GetControlInput(node)); DCHECK_NOT_NULL(block); schedule_->AddNode(block, node); } } stack_.push(node); visited_[node->id()] = true; } void VisitInputs(Node* node) { DCHECK_NE(scheduler_->GetPlacement(node), Scheduler::kUnknown); bool is_scheduled = schedule_->IsScheduled(node); base::Optional coupled_control_edge = scheduler_->GetCoupledControlEdge(node); for (auto edge : node->input_edges()) { Node* to = edge.to(); DCHECK_EQ(node, edge.from()); if (!Visited(to)) { InitializePlacement(to); } TRACE("PostEdge #%d:%s->#%d:%s\n", node->id(), node->op()->mnemonic(), to->id(), to->op()->mnemonic()); DCHECK_NE(scheduler_->GetPlacement(to), Scheduler::kUnknown); if (!is_scheduled && edge.index() != coupled_control_edge) { scheduler_->IncrementUnscheduledUseCount(to, node); } } } bool Visited(Node* node) { return visited_[node->id()]; } Scheduler* scheduler_; Schedule* schedule_; Graph* graph_; BoolVector visited_; ZoneStack stack_; }; void Scheduler::PrepareUses() { TRACE("--- PREPARE USES -------------------------------------------\n"); // Count the uses of every node, which is used to ensure that all of a // node's uses are scheduled before the node itself. PrepareUsesVisitor prepare_uses(this, graph_, zone_); prepare_uses.Run(); } // ----------------------------------------------------------------------------- // Phase 4: Schedule nodes early. class ScheduleEarlyNodeVisitor { public: ScheduleEarlyNodeVisitor(Zone* zone, Scheduler* scheduler) : scheduler_(scheduler), schedule_(scheduler->schedule_), queue_(zone) {} // Run the schedule early algorithm on a set of fixed root nodes. void Run(NodeVector* roots) { for (Node* const root : *roots) { queue_.push(root); } while (!queue_.empty()) { scheduler_->tick_counter_->TickAndMaybeEnterSafepoint(); VisitNode(queue_.front()); queue_.pop(); } } private: // Visits one node from the queue and propagates its current schedule early // position to all uses. This in turn might push more nodes onto the queue. void VisitNode(Node* node) { Scheduler::SchedulerData* data = scheduler_->GetData(node); // Fixed nodes already know their schedule early position. if (scheduler_->GetPlacement(node) == Scheduler::kFixed) { data->minimum_block_ = schedule_->block(node); TRACE("Fixing #%d:%s minimum_block = id:%d, dominator_depth = %d\n", node->id(), node->op()->mnemonic(), data->minimum_block_->id().ToInt(), data->minimum_block_->dominator_depth()); } // No need to propagate unconstrained schedule early positions. if (data->minimum_block_ == schedule_->start()) return; // Propagate schedule early position. DCHECK_NOT_NULL(data->minimum_block_); for (auto use : node->uses()) { if (scheduler_->IsLive(use)) { PropagateMinimumPositionToNode(data->minimum_block_, use); } } } // Propagates {block} as another minimum position into the given {node}. This // has the net effect of computing the minimum dominator block of {node} that // still post-dominates all inputs to {node} when the queue is processed. void PropagateMinimumPositionToNode(BasicBlock* block, Node* node) { Scheduler::SchedulerData* data = scheduler_->GetData(node); // No need to propagate to fixed node, it's guaranteed to be a root. if (scheduler_->GetPlacement(node) == Scheduler::kFixed) return; // Coupled nodes influence schedule early position of their control. if (scheduler_->GetPlacement(node) == Scheduler::kCoupled) { Node* control = NodeProperties::GetControlInput(node); PropagateMinimumPositionToNode(block, control); } // Propagate new position if it is deeper down the dominator tree than the // current. Note that all inputs need to have minimum block position inside // the dominator chain of {node}'s minimum block position. DCHECK(InsideSameDominatorChain(block, data->minimum_block_)); if (block->dominator_depth() > data->minimum_block_->dominator_depth()) { data->minimum_block_ = block; queue_.push(node); TRACE("Propagating #%d:%s minimum_block = id:%d, dominator_depth = %d\n", node->id(), node->op()->mnemonic(), data->minimum_block_->id().ToInt(), data->minimum_block_->dominator_depth()); } } #if DEBUG bool InsideSameDominatorChain(BasicBlock* b1, BasicBlock* b2) { BasicBlock* dominator = BasicBlock::GetCommonDominator(b1, b2); return dominator == b1 || dominator == b2; } #endif Scheduler* scheduler_; Schedule* schedule_; ZoneQueue queue_; }; void Scheduler::ScheduleEarly() { if (!special_rpo_->HasLoopBlocks()) { TRACE("--- NO LOOPS SO SKIPPING SCHEDULE EARLY --------------------\n"); return; } TRACE("--- SCHEDULE EARLY -----------------------------------------\n"); if (FLAG_trace_turbo_scheduler) { TRACE("roots: "); for (Node* node : schedule_root_nodes_) { TRACE("#%d:%s ", node->id(), node->op()->mnemonic()); } TRACE("\n"); } // Compute the minimum block for each node thereby determining the earliest // position each node could be placed within a valid schedule. ScheduleEarlyNodeVisitor schedule_early_visitor(zone_, this); schedule_early_visitor.Run(&schedule_root_nodes_); } // ----------------------------------------------------------------------------- // Phase 5: Schedule nodes late. class ScheduleLateNodeVisitor { public: ScheduleLateNodeVisitor(Zone* zone, Scheduler* scheduler) : zone_(zone), scheduler_(scheduler), schedule_(scheduler_->schedule_), marked_(scheduler->zone_), marking_queue_(scheduler->zone_) {} // Run the schedule late algorithm on a set of fixed root nodes. void Run(NodeVector* roots) { for (Node* const root : *roots) { ProcessQueue(root); } } private: void ProcessQueue(Node* root) { ZoneQueue* queue = &(scheduler_->schedule_queue_); for (Node* node : root->inputs()) { // Don't schedule coupled nodes on their own. if (scheduler_->GetPlacement(node) == Scheduler::kCoupled) { node = NodeProperties::GetControlInput(node); } // Test schedulability condition by looking at unscheduled use count. if (scheduler_->GetData(node)->unscheduled_count_ != 0) continue; queue->push(node); do { scheduler_->tick_counter_->TickAndMaybeEnterSafepoint(); Node* const n = queue->front(); queue->pop(); VisitNode(n); } while (!queue->empty()); } } // Visits one node from the queue of schedulable nodes and determines its // schedule late position. Also hoists nodes out of loops to find a more // optimal scheduling position. void VisitNode(Node* node) { DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); // Don't schedule nodes that are already scheduled. if (schedule_->IsScheduled(node)) return; DCHECK_EQ(Scheduler::kSchedulable, scheduler_->GetPlacement(node)); // Determine the dominating block for all of the uses of this node. It is // the latest block that this node can be scheduled in. TRACE("Scheduling #%d:%s\n", node->id(), node->op()->mnemonic()); BasicBlock* block = GetCommonDominatorOfUses(node); DCHECK_NOT_NULL(block); // The schedule early block dominates the schedule late block. BasicBlock* min_block = scheduler_->GetData(node)->minimum_block_; DCHECK_EQ(min_block, BasicBlock::GetCommonDominator(block, min_block)); TRACE( "Schedule late of #%d:%s is id:%d at loop depth %d, minimum = id:%d\n", node->id(), node->op()->mnemonic(), block->id().ToInt(), block->loop_depth(), min_block->id().ToInt()); // Hoist nodes out of loops if possible. Nodes can be hoisted iteratively // into enclosing loop pre-headers until they would precede their schedule // early position. BasicBlock* hoist_block = GetHoistBlock(block); if (hoist_block && hoist_block->dominator_depth() >= min_block->dominator_depth()) { DCHECK(scheduler_->special_rpo_->HasLoopBlocks()); do { TRACE(" hoisting #%d:%s to block id:%d\n", node->id(), node->op()->mnemonic(), hoist_block->id().ToInt()); DCHECK_LT(hoist_block->loop_depth(), block->loop_depth()); block = hoist_block; hoist_block = GetHoistBlock(hoist_block); } while (hoist_block && hoist_block->dominator_depth() >= min_block->dominator_depth()); } else if (scheduler_->flags_ & Scheduler::kSplitNodes) { // Split the {node} if beneficial and return the new {block} for it. block = SplitNode(block, node); } // Schedule the node or a floating control structure. if (IrOpcode::IsMergeOpcode(node->opcode())) { ScheduleFloatingControl(block, node); } else if (node->opcode() == IrOpcode::kFinishRegion) { ScheduleRegion(block, node); } else { ScheduleNode(block, node); } } bool IsMarked(BasicBlock* block) const { DCHECK_LT(block->id().ToSize(), marked_.size()); return marked_[block->id().ToSize()]; } void Mark(BasicBlock* block) { marked_[block->id().ToSize()] = true; } // Mark {block} and push its non-marked predecessor on the marking queue. void MarkBlock(BasicBlock* block) { DCHECK_LT(block->id().ToSize(), marked_.size()); Mark(block); for (BasicBlock* pred_block : block->predecessors()) { if (IsMarked(pred_block)) continue; marking_queue_.push_back(pred_block); } } BasicBlock* SplitNode(BasicBlock* block, Node* node) { // For now, we limit splitting to pure nodes. if (!node->op()->HasProperty(Operator::kPure)) return block; // TODO(titzer): fix the special case of splitting of projections. if (node->opcode() == IrOpcode::kProjection) return block; // The {block} is common dominator of all uses of {node}, so we cannot // split anything unless the {block} has at least two successors. DCHECK_EQ(block, GetCommonDominatorOfUses(node)); if (block->SuccessorCount() < 2) return block; // Clear marking bits. DCHECK(marking_queue_.empty()); std::fill(marked_.begin(), marked_.end(), false); marked_.resize(schedule_->BasicBlockCount() + 1, false); // Check if the {node} has uses in {block}. for (Edge edge : node->use_edges()) { if (!scheduler_->IsLive(edge.from())) continue; BasicBlock* use_block = GetBlockForUse(edge); if (use_block == nullptr || IsMarked(use_block)) continue; if (use_block == block) { TRACE(" not splitting #%d:%s, it is used in id:%d\n", node->id(), node->op()->mnemonic(), block->id().ToInt()); marking_queue_.clear(); return block; } MarkBlock(use_block); } // Compute transitive marking closure; a block is marked if all its // successors are marked. do { BasicBlock* top_block = marking_queue_.front(); marking_queue_.pop_front(); if (IsMarked(top_block)) continue; bool marked = true; for (BasicBlock* successor : top_block->successors()) { if (!IsMarked(successor)) { marked = false; break; } } if (marked) MarkBlock(top_block); } while (!marking_queue_.empty()); // If the (common dominator) {block} is marked, we know that all paths from // {block} to the end contain at least one use of {node}, and hence there's // no point in splitting the {node} in this case. if (IsMarked(block)) { TRACE(" not splitting #%d:%s, its common dominator id:%d is perfect\n", node->id(), node->op()->mnemonic(), block->id().ToInt()); return block; } // Split {node} for uses according to the previously computed marking // closure. Every marking partition has a unique dominator, which get's a // copy of the {node} with the exception of the first partition, which get's // the {node} itself. ZoneMap dominators(scheduler_->zone_); for (Edge edge : node->use_edges()) { if (!scheduler_->IsLive(edge.from())) continue; BasicBlock* use_block = GetBlockForUse(edge); if (use_block == nullptr) continue; while (IsMarked(use_block->dominator())) { use_block = use_block->dominator(); } auto& use_node = dominators[use_block]; if (use_node == nullptr) { if (dominators.size() == 1u) { // Place the {node} at {use_block}. block = use_block; use_node = node; TRACE(" pushing #%d:%s down to id:%d\n", node->id(), node->op()->mnemonic(), block->id().ToInt()); } else { // Place a copy of {node} at {use_block}. use_node = CloneNode(node); TRACE(" cloning #%d:%s for id:%d\n", use_node->id(), use_node->op()->mnemonic(), use_block->id().ToInt()); scheduler_->schedule_queue_.push(use_node); } } edge.UpdateTo(use_node); } return block; } BasicBlock* GetHoistBlock(BasicBlock* block) { if (!scheduler_->special_rpo_->HasLoopBlocks()) return nullptr; if (block->IsLoopHeader()) return block->dominator(); // We have to check to make sure that the {block} dominates all // of the outgoing blocks. If it doesn't, then there is a path // out of the loop which does not execute this {block}, so we // can't hoist operations from this {block} out of the loop, as // that would introduce additional computations. if (BasicBlock* header_block = block->loop_header()) { for (BasicBlock* outgoing_block : scheduler_->special_rpo_->GetOutgoingBlocks(header_block)) { if (scheduler_->GetCommonDominator(block, outgoing_block) != block) { return nullptr; } } return header_block->dominator(); } return nullptr; } BasicBlock* GetCommonDominatorOfUses(Node* node) { BasicBlock* block = nullptr; for (Edge edge : node->use_edges()) { if (!scheduler_->IsLive(edge.from())) continue; BasicBlock* use_block = GetBlockForUse(edge); block = block == nullptr ? use_block : use_block == nullptr ? block : scheduler_->GetCommonDominator(block, use_block); } return block; } BasicBlock* FindPredecessorBlock(Node* node) { return scheduler_->control_flow_builder_->FindPredecessorBlock(node); } BasicBlock* GetBlockForUse(Edge edge) { // TODO(titzer): ignore uses from dead nodes (not visited in PrepareUses()). // Dead uses only occur if the graph is not trimmed before scheduling. Node* use = edge.from(); if (IrOpcode::IsPhiOpcode(use->opcode())) { // If the use is from a coupled (i.e. floating) phi, compute the common // dominator of its uses. This will not recurse more than one level. if (scheduler_->GetPlacement(use) == Scheduler::kCoupled) { TRACE(" inspecting uses of coupled #%d:%s\n", use->id(), use->op()->mnemonic()); // TODO(titzer): reenable once above TODO is addressed. // DCHECK_EQ(edge.to(), NodeProperties::GetControlInput(use)); return GetCommonDominatorOfUses(use); } // If the use is from a fixed (i.e. non-floating) phi, we use the // predecessor block of the corresponding control input to the merge. if (scheduler_->GetPlacement(use) == Scheduler::kFixed) { TRACE(" input@%d into a fixed phi #%d:%s\n", edge.index(), use->id(), use->op()->mnemonic()); Node* merge = NodeProperties::GetControlInput(use, 0); DCHECK(IrOpcode::IsMergeOpcode(merge->opcode())); Node* input = NodeProperties::GetControlInput(merge, edge.index()); return FindPredecessorBlock(input); } } else if (IrOpcode::IsMergeOpcode(use->opcode())) { // If the use is from a fixed (i.e. non-floating) merge, we use the // predecessor block of the current input to the merge. if (scheduler_->GetPlacement(use) == Scheduler::kFixed) { TRACE(" input@%d into a fixed merge #%d:%s\n", edge.index(), use->id(), use->op()->mnemonic()); return FindPredecessorBlock(edge.to()); } } BasicBlock* result = schedule_->block(use); if (result == nullptr) return nullptr; TRACE(" must dominate use #%d:%s in id:%d\n", use->id(), use->op()->mnemonic(), result->id().ToInt()); return result; } void ScheduleFloatingControl(BasicBlock* block, Node* node) { scheduler_->FuseFloatingControl(block, node); } void ScheduleRegion(BasicBlock* block, Node* region_end) { // We only allow regions of instructions connected into a linear // effect chain. The only value allowed to be produced by a node // in the chain must be the value consumed by the FinishRegion node. // We schedule back to front; we first schedule FinishRegion. CHECK_EQ(IrOpcode::kFinishRegion, region_end->opcode()); ScheduleNode(block, region_end); // Schedule the chain. Node* node = NodeProperties::GetEffectInput(region_end); while (node->opcode() != IrOpcode::kBeginRegion) { DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); DCHECK_EQ(1, node->op()->EffectInputCount()); DCHECK_EQ(1, node->op()->EffectOutputCount()); DCHECK_EQ(0, node->op()->ControlOutputCount()); // The value output (if there is any) must be consumed // by the EndRegion node. DCHECK(node->op()->ValueOutputCount() == 0 || node == region_end->InputAt(0)); ScheduleNode(block, node); node = NodeProperties::GetEffectInput(node); } // Schedule the BeginRegion node. DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); ScheduleNode(block, node); } void ScheduleNode(BasicBlock* block, Node* node) { schedule_->PlanNode(block, node); size_t block_id = block->id().ToSize(); if (!scheduler_->scheduled_nodes_[block_id]) { scheduler_->scheduled_nodes_[block_id] = zone_->New(zone_); } scheduler_->scheduled_nodes_[block_id]->push_back(node); scheduler_->UpdatePlacement(node, Scheduler::kScheduled); } Node* CloneNode(Node* node) { int const input_count = node->InputCount(); base::Optional coupled_control_edge = scheduler_->GetCoupledControlEdge(node); for (int index = 0; index < input_count; ++index) { if (index != coupled_control_edge) { Node* const input = node->InputAt(index); scheduler_->IncrementUnscheduledUseCount(input, node); } } Node* const copy = scheduler_->graph_->CloneNode(node); TRACE(("clone #%d:%s -> #%d\n"), node->id(), node->op()->mnemonic(), copy->id()); scheduler_->node_data_.resize(copy->id() + 1, scheduler_->DefaultSchedulerData()); scheduler_->node_data_[copy->id()] = scheduler_->node_data_[node->id()]; return copy; } Zone* zone_; Scheduler* scheduler_; Schedule* schedule_; BoolVector marked_; ZoneDeque marking_queue_; }; void Scheduler::ScheduleLate() { TRACE("--- SCHEDULE LATE ------------------------------------------\n"); if (FLAG_trace_turbo_scheduler) { TRACE("roots: "); for (Node* node : schedule_root_nodes_) { TRACE("#%d:%s ", node->id(), node->op()->mnemonic()); } TRACE("\n"); } // Schedule: Places nodes in dominator block of all their uses. ScheduleLateNodeVisitor schedule_late_visitor(zone_, this); schedule_late_visitor.Run(&schedule_root_nodes_); } // ----------------------------------------------------------------------------- // Phase 6: Seal the final schedule. void Scheduler::SealFinalSchedule() { TRACE("--- SEAL FINAL SCHEDULE ------------------------------------\n"); // Serialize the assembly order and reverse-post-order numbering. special_rpo_->SerializeRPOIntoSchedule(); special_rpo_->PrintAndVerifySpecialRPO(); // Add collected nodes for basic blocks to their blocks in the right order. int block_num = 0; for (NodeVector* nodes : scheduled_nodes_) { BasicBlock::Id id = BasicBlock::Id::FromInt(block_num++); BasicBlock* block = schedule_->GetBlockById(id); if (nodes) { for (Node* node : base::Reversed(*nodes)) { schedule_->AddNode(block, node); } } } } // ----------------------------------------------------------------------------- void Scheduler::FuseFloatingControl(BasicBlock* block, Node* node) { TRACE("--- FUSE FLOATING CONTROL ----------------------------------\n"); if (FLAG_trace_turbo_scheduler) { StdoutStream{} << "Schedule before control flow fusion:\n" << *schedule_; } // Iterate on phase 1: Build control-flow graph. control_flow_builder_->Run(block, node); // Iterate on phase 2: Compute special RPO and dominator tree. special_rpo_->UpdateSpecialRPO(block, schedule_->block(node)); // TODO(turbofan): Currently "iterate on" means "re-run". Fix that. for (BasicBlock* b = block->rpo_next(); b != nullptr; b = b->rpo_next()) { b->set_dominator_depth(-1); b->set_dominator(nullptr); } PropagateImmediateDominators(block->rpo_next()); // Iterate on phase 4: Schedule nodes early. // TODO(turbofan): The following loop gathering the propagation roots is a // temporary solution and should be merged into the rest of the scheduler as // soon as the approach settled for all floating loops. NodeVector propagation_roots(control_flow_builder_->control_); for (Node* control : control_flow_builder_->control_) { for (Node* use : control->uses()) { if (NodeProperties::IsPhi(use) && IsLive(use)) { propagation_roots.push_back(use); } } } if (FLAG_trace_turbo_scheduler) { TRACE("propagation roots: "); for (Node* r : propagation_roots) { TRACE("#%d:%s ", r->id(), r->op()->mnemonic()); } TRACE("\n"); } ScheduleEarlyNodeVisitor schedule_early_visitor(zone_, this); schedule_early_visitor.Run(&propagation_roots); // Move previously planned nodes. // TODO(turbofan): Improve that by supporting bulk moves. scheduled_nodes_.resize(schedule_->BasicBlockCount()); MovePlannedNodes(block, schedule_->block(node)); if (FLAG_trace_turbo_scheduler) { StdoutStream{} << "Schedule after control flow fusion:\n" << *schedule_; } } void Scheduler::MovePlannedNodes(BasicBlock* from, BasicBlock* to) { TRACE("Move planned nodes from id:%d to id:%d\n", from->id().ToInt(), to->id().ToInt()); NodeVector* from_nodes = scheduled_nodes_[from->id().ToSize()]; NodeVector* to_nodes = scheduled_nodes_[to->id().ToSize()]; if (!from_nodes) return; for (Node* const node : *from_nodes) { schedule_->SetBlockForNode(to, node); } if (to_nodes) { to_nodes->insert(to_nodes->end(), from_nodes->begin(), from_nodes->end()); from_nodes->clear(); } else { std::swap(scheduled_nodes_[from->id().ToSize()], scheduled_nodes_[to->id().ToSize()]); } } #undef TRACE } // namespace compiler } // namespace internal } // namespace v8