| // Copyright 2013 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "src/compiler/scheduler.h" |
| |
| #include <iomanip> |
| |
| #include "src/base/adapters.h" |
| #include "src/bit-vector.h" |
| #include "src/compiler/common-operator.h" |
| #include "src/compiler/control-equivalence.h" |
| #include "src/compiler/graph.h" |
| #include "src/compiler/node-marker.h" |
| #include "src/compiler/node-properties.h" |
| #include "src/compiler/node.h" |
| #include "src/zone/zone-containers.h" |
| |
| namespace v8 { |
| namespace internal { |
| namespace compiler { |
| |
| #define TRACE(...) \ |
| do { \ |
| if (FLAG_trace_turbo_scheduler) PrintF(__VA_ARGS__); \ |
| } while (false) |
| |
| Scheduler::Scheduler(Zone* zone, Graph* graph, Schedule* schedule, Flags flags, |
| size_t node_count_hint) |
| : zone_(zone), |
| graph_(graph), |
| schedule_(schedule), |
| flags_(flags), |
| scheduled_nodes_(zone), |
| schedule_root_nodes_(zone), |
| schedule_queue_(zone), |
| node_data_(zone) { |
| node_data_.reserve(node_count_hint); |
| node_data_.resize(graph->NodeCount(), DefaultSchedulerData()); |
| } |
| |
| Schedule* Scheduler::ComputeSchedule(Zone* zone, Graph* graph, Flags flags) { |
| Zone* schedule_zone = |
| (flags & Scheduler::kTempSchedule) ? zone : graph->zone(); |
| |
| // Reserve 10% more space for nodes if node splitting is enabled to try to |
| // avoid resizing the vector since that would triple its zone memory usage. |
| float node_hint_multiplier = (flags & Scheduler::kSplitNodes) ? 1.1 : 1; |
| size_t node_count_hint = node_hint_multiplier * graph->NodeCount(); |
| |
| Schedule* schedule = |
| new (schedule_zone) Schedule(schedule_zone, node_count_hint); |
| Scheduler scheduler(zone, graph, schedule, flags, node_count_hint); |
| |
| scheduler.BuildCFG(); |
| scheduler.ComputeSpecialRPONumbering(); |
| scheduler.GenerateImmediateDominatorTree(); |
| |
| scheduler.PrepareUses(); |
| scheduler.ScheduleEarly(); |
| scheduler.ScheduleLate(); |
| |
| scheduler.SealFinalSchedule(); |
| |
| return schedule; |
| } |
| |
| |
| Scheduler::SchedulerData Scheduler::DefaultSchedulerData() { |
| SchedulerData def = {schedule_->start(), 0, kUnknown}; |
| return def; |
| } |
| |
| |
| Scheduler::SchedulerData* Scheduler::GetData(Node* node) { |
| return &node_data_[node->id()]; |
| } |
| |
| Scheduler::Placement Scheduler::InitializePlacement(Node* node) { |
| SchedulerData* data = GetData(node); |
| if (data->placement_ == kFixed) { |
| // Nothing to do for control nodes that have been already fixed in |
| // the schedule. |
| return data->placement_; |
| } |
| DCHECK_EQ(kUnknown, data->placement_); |
| switch (node->opcode()) { |
| case IrOpcode::kParameter: |
| case IrOpcode::kOsrValue: |
| // Parameters and OSR values are always fixed to the start block. |
| data->placement_ = kFixed; |
| break; |
| case IrOpcode::kPhi: |
| case IrOpcode::kEffectPhi: { |
| // Phis and effect phis are fixed if their control inputs are, whereas |
| // otherwise they are coupled to a floating control node. |
| Placement p = GetPlacement(NodeProperties::GetControlInput(node)); |
| data->placement_ = (p == kFixed ? kFixed : kCoupled); |
| break; |
| } |
| #define DEFINE_CONTROL_CASE(V) case IrOpcode::k##V: |
| CONTROL_OP_LIST(DEFINE_CONTROL_CASE) |
| #undef DEFINE_CONTROL_CASE |
| { |
| // Control nodes that were not control-reachable from end may float. |
| data->placement_ = kSchedulable; |
| break; |
| } |
| default: |
| data->placement_ = kSchedulable; |
| break; |
| } |
| return data->placement_; |
| } |
| |
| Scheduler::Placement Scheduler::GetPlacement(Node* node) { |
| return GetData(node)->placement_; |
| } |
| |
| bool Scheduler::IsLive(Node* node) { return GetPlacement(node) != kUnknown; } |
| |
| void Scheduler::UpdatePlacement(Node* node, Placement placement) { |
| SchedulerData* data = GetData(node); |
| if (data->placement_ == kUnknown) { |
| // We only update control nodes from {kUnknown} to {kFixed}. Ideally, we |
| // should check that {node} is a control node (including exceptional calls), |
| // but that is expensive. |
| DCHECK_EQ(Scheduler::kFixed, placement); |
| data->placement_ = placement; |
| return; |
| } |
| |
| switch (node->opcode()) { |
| case IrOpcode::kParameter: |
| // Parameters are fixed once and for all. |
| UNREACHABLE(); |
| break; |
| case IrOpcode::kPhi: |
| case IrOpcode::kEffectPhi: { |
| // Phis and effect phis are coupled to their respective blocks. |
| DCHECK_EQ(Scheduler::kCoupled, data->placement_); |
| DCHECK_EQ(Scheduler::kFixed, placement); |
| Node* control = NodeProperties::GetControlInput(node); |
| BasicBlock* block = schedule_->block(control); |
| schedule_->AddNode(block, node); |
| break; |
| } |
| #define DEFINE_CONTROL_CASE(V) case IrOpcode::k##V: |
| CONTROL_OP_LIST(DEFINE_CONTROL_CASE) |
| #undef DEFINE_CONTROL_CASE |
| { |
| // Control nodes force coupled uses to be placed. |
| for (auto use : node->uses()) { |
| if (GetPlacement(use) == Scheduler::kCoupled) { |
| DCHECK_EQ(node, NodeProperties::GetControlInput(use)); |
| UpdatePlacement(use, placement); |
| } |
| } |
| break; |
| } |
| default: |
| DCHECK_EQ(Scheduler::kSchedulable, data->placement_); |
| DCHECK_EQ(Scheduler::kScheduled, placement); |
| break; |
| } |
| // Reduce the use count of the node's inputs to potentially make them |
| // schedulable. If all the uses of a node have been scheduled, then the node |
| // itself can be scheduled. |
| for (Edge const edge : node->input_edges()) { |
| DecrementUnscheduledUseCount(edge.to(), edge.index(), edge.from()); |
| } |
| data->placement_ = placement; |
| } |
| |
| |
| bool Scheduler::IsCoupledControlEdge(Node* node, int index) { |
| return GetPlacement(node) == kCoupled && |
| NodeProperties::FirstControlIndex(node) == index; |
| } |
| |
| |
| void Scheduler::IncrementUnscheduledUseCount(Node* node, int index, |
| Node* from) { |
| // Make sure that control edges from coupled nodes are not counted. |
| if (IsCoupledControlEdge(from, index)) return; |
| |
| // Tracking use counts for fixed nodes is useless. |
| if (GetPlacement(node) == kFixed) return; |
| |
| // Use count for coupled nodes is summed up on their control. |
| if (GetPlacement(node) == kCoupled) { |
| Node* control = NodeProperties::GetControlInput(node); |
| return IncrementUnscheduledUseCount(control, index, from); |
| } |
| |
| ++(GetData(node)->unscheduled_count_); |
| if (FLAG_trace_turbo_scheduler) { |
| TRACE(" Use count of #%d:%s (used by #%d:%s)++ = %d\n", node->id(), |
| node->op()->mnemonic(), from->id(), from->op()->mnemonic(), |
| GetData(node)->unscheduled_count_); |
| } |
| } |
| |
| |
| void Scheduler::DecrementUnscheduledUseCount(Node* node, int index, |
| Node* from) { |
| // Make sure that control edges from coupled nodes are not counted. |
| if (IsCoupledControlEdge(from, index)) return; |
| |
| // Tracking use counts for fixed nodes is useless. |
| if (GetPlacement(node) == kFixed) return; |
| |
| // Use count for coupled nodes is summed up on their control. |
| if (GetPlacement(node) == kCoupled) { |
| Node* control = NodeProperties::GetControlInput(node); |
| return DecrementUnscheduledUseCount(control, index, from); |
| } |
| |
| DCHECK_LT(0, GetData(node)->unscheduled_count_); |
| --(GetData(node)->unscheduled_count_); |
| if (FLAG_trace_turbo_scheduler) { |
| TRACE(" Use count of #%d:%s (used by #%d:%s)-- = %d\n", node->id(), |
| node->op()->mnemonic(), from->id(), from->op()->mnemonic(), |
| GetData(node)->unscheduled_count_); |
| } |
| if (GetData(node)->unscheduled_count_ == 0) { |
| TRACE(" newly eligible #%d:%s\n", node->id(), node->op()->mnemonic()); |
| schedule_queue_.push(node); |
| } |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 1: Build control-flow graph. |
| |
| |
| // Internal class to build a control flow graph (i.e the basic blocks and edges |
| // between them within a Schedule) from the node graph. Visits control edges of |
| // the graph backwards from an end node in order to find the connected control |
| // subgraph, needed for scheduling. |
| class CFGBuilder : public ZoneObject { |
| public: |
| CFGBuilder(Zone* zone, Scheduler* scheduler) |
| : zone_(zone), |
| scheduler_(scheduler), |
| schedule_(scheduler->schedule_), |
| queued_(scheduler->graph_, 2), |
| queue_(zone), |
| control_(zone), |
| component_entry_(nullptr), |
| component_start_(nullptr), |
| component_end_(nullptr) {} |
| |
| // Run the control flow graph construction algorithm by walking the graph |
| // backwards from end through control edges, building and connecting the |
| // basic blocks for control nodes. |
| void Run() { |
| ResetDataStructures(); |
| Queue(scheduler_->graph_->end()); |
| |
| while (!queue_.empty()) { // Breadth-first backwards traversal. |
| Node* node = queue_.front(); |
| queue_.pop(); |
| int max = NodeProperties::PastControlIndex(node); |
| for (int i = NodeProperties::FirstControlIndex(node); i < max; i++) { |
| Queue(node->InputAt(i)); |
| } |
| } |
| |
| for (NodeVector::iterator i = control_.begin(); i != control_.end(); ++i) { |
| ConnectBlocks(*i); // Connect block to its predecessor/successors. |
| } |
| } |
| |
| // Run the control flow graph construction for a minimal control-connected |
| // component ending in {exit} and merge that component into an existing |
| // control flow graph at the bottom of {block}. |
| void Run(BasicBlock* block, Node* exit) { |
| ResetDataStructures(); |
| Queue(exit); |
| |
| component_entry_ = nullptr; |
| component_start_ = block; |
| component_end_ = schedule_->block(exit); |
| scheduler_->equivalence_->Run(exit); |
| while (!queue_.empty()) { // Breadth-first backwards traversal. |
| Node* node = queue_.front(); |
| queue_.pop(); |
| |
| // Use control dependence equivalence to find a canonical single-entry |
| // single-exit region that makes up a minimal component to be scheduled. |
| if (IsSingleEntrySingleExitRegion(node, exit)) { |
| TRACE("Found SESE at #%d:%s\n", node->id(), node->op()->mnemonic()); |
| DCHECK(!component_entry_); |
| component_entry_ = node; |
| continue; |
| } |
| |
| int max = NodeProperties::PastControlIndex(node); |
| for (int i = NodeProperties::FirstControlIndex(node); i < max; i++) { |
| Queue(node->InputAt(i)); |
| } |
| } |
| DCHECK(component_entry_); |
| |
| for (NodeVector::iterator i = control_.begin(); i != control_.end(); ++i) { |
| ConnectBlocks(*i); // Connect block to its predecessor/successors. |
| } |
| } |
| |
| private: |
| friend class ScheduleLateNodeVisitor; |
| friend class Scheduler; |
| |
| void FixNode(BasicBlock* block, Node* node) { |
| schedule_->AddNode(block, node); |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| } |
| |
| void Queue(Node* node) { |
| // Mark the connected control nodes as they are queued. |
| if (!queued_.Get(node)) { |
| BuildBlocks(node); |
| queue_.push(node); |
| queued_.Set(node, true); |
| control_.push_back(node); |
| } |
| } |
| |
| void BuildBlocks(Node* node) { |
| switch (node->opcode()) { |
| case IrOpcode::kEnd: |
| FixNode(schedule_->end(), node); |
| break; |
| case IrOpcode::kStart: |
| FixNode(schedule_->start(), node); |
| break; |
| case IrOpcode::kLoop: |
| case IrOpcode::kMerge: |
| BuildBlockForNode(node); |
| break; |
| case IrOpcode::kTerminate: { |
| // Put Terminate in the loop to which it refers. |
| Node* loop = NodeProperties::GetControlInput(node); |
| BasicBlock* block = BuildBlockForNode(loop); |
| FixNode(block, node); |
| break; |
| } |
| case IrOpcode::kBranch: |
| case IrOpcode::kSwitch: |
| BuildBlocksForSuccessors(node); |
| break; |
| #define BUILD_BLOCK_JS_CASE(Name) case IrOpcode::k##Name: |
| JS_OP_LIST(BUILD_BLOCK_JS_CASE) |
| // JS opcodes are just like calls => fall through. |
| #undef BUILD_BLOCK_JS_CASE |
| case IrOpcode::kCall: |
| case IrOpcode::kCallWithCallerSavedRegisters: |
| if (NodeProperties::IsExceptionalCall(node)) { |
| BuildBlocksForSuccessors(node); |
| } |
| break; |
| default: |
| break; |
| } |
| } |
| |
| void ConnectBlocks(Node* node) { |
| switch (node->opcode()) { |
| case IrOpcode::kLoop: |
| case IrOpcode::kMerge: |
| ConnectMerge(node); |
| break; |
| case IrOpcode::kBranch: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectBranch(node); |
| break; |
| case IrOpcode::kSwitch: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectSwitch(node); |
| break; |
| case IrOpcode::kDeoptimize: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectDeoptimize(node); |
| break; |
| case IrOpcode::kTailCall: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectTailCall(node); |
| break; |
| case IrOpcode::kReturn: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectReturn(node); |
| break; |
| case IrOpcode::kThrow: |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectThrow(node); |
| break; |
| #define CONNECT_BLOCK_JS_CASE(Name) case IrOpcode::k##Name: |
| JS_OP_LIST(CONNECT_BLOCK_JS_CASE) |
| // JS opcodes are just like calls => fall through. |
| #undef CONNECT_BLOCK_JS_CASE |
| case IrOpcode::kCall: |
| case IrOpcode::kCallWithCallerSavedRegisters: |
| if (NodeProperties::IsExceptionalCall(node)) { |
| scheduler_->UpdatePlacement(node, Scheduler::kFixed); |
| ConnectCall(node); |
| } |
| break; |
| default: |
| break; |
| } |
| } |
| |
| BasicBlock* BuildBlockForNode(Node* node) { |
| BasicBlock* block = schedule_->block(node); |
| if (block == nullptr) { |
| block = schedule_->NewBasicBlock(); |
| TRACE("Create block id:%d for #%d:%s\n", block->id().ToInt(), node->id(), |
| node->op()->mnemonic()); |
| FixNode(block, node); |
| } |
| return block; |
| } |
| |
| void BuildBlocksForSuccessors(Node* node) { |
| size_t const successor_cnt = node->op()->ControlOutputCount(); |
| Node** successors = zone_->NewArray<Node*>(successor_cnt); |
| NodeProperties::CollectControlProjections(node, successors, successor_cnt); |
| for (size_t index = 0; index < successor_cnt; ++index) { |
| BuildBlockForNode(successors[index]); |
| } |
| } |
| |
| void CollectSuccessorBlocks(Node* node, BasicBlock** successor_blocks, |
| size_t successor_cnt) { |
| Node** successors = reinterpret_cast<Node**>(successor_blocks); |
| NodeProperties::CollectControlProjections(node, successors, successor_cnt); |
| for (size_t index = 0; index < successor_cnt; ++index) { |
| successor_blocks[index] = schedule_->block(successors[index]); |
| } |
| } |
| |
| BasicBlock* FindPredecessorBlock(Node* node) { |
| BasicBlock* predecessor_block = nullptr; |
| while (true) { |
| predecessor_block = schedule_->block(node); |
| if (predecessor_block != nullptr) break; |
| node = NodeProperties::GetControlInput(node); |
| } |
| return predecessor_block; |
| } |
| |
| void ConnectCall(Node* call) { |
| BasicBlock* successor_blocks[2]; |
| CollectSuccessorBlocks(call, successor_blocks, arraysize(successor_blocks)); |
| |
| // Consider the exception continuation to be deferred. |
| successor_blocks[1]->set_deferred(true); |
| |
| Node* call_control = NodeProperties::GetControlInput(call); |
| BasicBlock* call_block = FindPredecessorBlock(call_control); |
| TraceConnect(call, call_block, successor_blocks[0]); |
| TraceConnect(call, call_block, successor_blocks[1]); |
| schedule_->AddCall(call_block, call, successor_blocks[0], |
| successor_blocks[1]); |
| } |
| |
| void ConnectBranch(Node* branch) { |
| BasicBlock* successor_blocks[2]; |
| CollectSuccessorBlocks(branch, successor_blocks, |
| arraysize(successor_blocks)); |
| |
| // Consider branch hints. |
| switch (BranchHintOf(branch->op())) { |
| case BranchHint::kNone: |
| break; |
| case BranchHint::kTrue: |
| successor_blocks[1]->set_deferred(true); |
| break; |
| case BranchHint::kFalse: |
| successor_blocks[0]->set_deferred(true); |
| break; |
| } |
| |
| if (branch == component_entry_) { |
| TraceConnect(branch, component_start_, successor_blocks[0]); |
| TraceConnect(branch, component_start_, successor_blocks[1]); |
| schedule_->InsertBranch(component_start_, component_end_, branch, |
| successor_blocks[0], successor_blocks[1]); |
| } else { |
| Node* branch_control = NodeProperties::GetControlInput(branch); |
| BasicBlock* branch_block = FindPredecessorBlock(branch_control); |
| TraceConnect(branch, branch_block, successor_blocks[0]); |
| TraceConnect(branch, branch_block, successor_blocks[1]); |
| schedule_->AddBranch(branch_block, branch, successor_blocks[0], |
| successor_blocks[1]); |
| } |
| } |
| |
| void ConnectSwitch(Node* sw) { |
| size_t const successor_count = sw->op()->ControlOutputCount(); |
| BasicBlock** successor_blocks = |
| zone_->NewArray<BasicBlock*>(successor_count); |
| CollectSuccessorBlocks(sw, successor_blocks, successor_count); |
| |
| if (sw == component_entry_) { |
| for (size_t index = 0; index < successor_count; ++index) { |
| TraceConnect(sw, component_start_, successor_blocks[index]); |
| } |
| schedule_->InsertSwitch(component_start_, component_end_, sw, |
| successor_blocks, successor_count); |
| } else { |
| Node* switch_control = NodeProperties::GetControlInput(sw); |
| BasicBlock* switch_block = FindPredecessorBlock(switch_control); |
| for (size_t index = 0; index < successor_count; ++index) { |
| TraceConnect(sw, switch_block, successor_blocks[index]); |
| } |
| schedule_->AddSwitch(switch_block, sw, successor_blocks, successor_count); |
| } |
| } |
| |
| void ConnectMerge(Node* merge) { |
| // Don't connect the special merge at the end to its predecessors. |
| if (IsFinalMerge(merge)) return; |
| |
| BasicBlock* block = schedule_->block(merge); |
| DCHECK_NOT_NULL(block); |
| // For all of the merge's control inputs, add a goto at the end to the |
| // merge's basic block. |
| for (Node* const input : merge->inputs()) { |
| BasicBlock* predecessor_block = FindPredecessorBlock(input); |
| TraceConnect(merge, predecessor_block, block); |
| schedule_->AddGoto(predecessor_block, block); |
| } |
| } |
| |
| void ConnectTailCall(Node* call) { |
| Node* call_control = NodeProperties::GetControlInput(call); |
| BasicBlock* call_block = FindPredecessorBlock(call_control); |
| TraceConnect(call, call_block, nullptr); |
| schedule_->AddTailCall(call_block, call); |
| } |
| |
| void ConnectReturn(Node* ret) { |
| Node* return_control = NodeProperties::GetControlInput(ret); |
| BasicBlock* return_block = FindPredecessorBlock(return_control); |
| TraceConnect(ret, return_block, nullptr); |
| schedule_->AddReturn(return_block, ret); |
| } |
| |
| void ConnectDeoptimize(Node* deopt) { |
| Node* deoptimize_control = NodeProperties::GetControlInput(deopt); |
| BasicBlock* deoptimize_block = FindPredecessorBlock(deoptimize_control); |
| TraceConnect(deopt, deoptimize_block, nullptr); |
| schedule_->AddDeoptimize(deoptimize_block, deopt); |
| } |
| |
| void ConnectThrow(Node* thr) { |
| Node* throw_control = NodeProperties::GetControlInput(thr); |
| BasicBlock* throw_block = FindPredecessorBlock(throw_control); |
| TraceConnect(thr, throw_block, nullptr); |
| schedule_->AddThrow(throw_block, thr); |
| } |
| |
| void TraceConnect(Node* node, BasicBlock* block, BasicBlock* succ) { |
| DCHECK_NOT_NULL(block); |
| if (succ == nullptr) { |
| TRACE("Connect #%d:%s, id:%d -> end\n", node->id(), |
| node->op()->mnemonic(), block->id().ToInt()); |
| } else { |
| TRACE("Connect #%d:%s, id:%d -> id:%d\n", node->id(), |
| node->op()->mnemonic(), block->id().ToInt(), succ->id().ToInt()); |
| } |
| } |
| |
| bool IsFinalMerge(Node* node) { |
| return (node->opcode() == IrOpcode::kMerge && |
| node == scheduler_->graph_->end()->InputAt(0)); |
| } |
| |
| bool IsSingleEntrySingleExitRegion(Node* entry, Node* exit) const { |
| size_t entry_class = scheduler_->equivalence_->ClassOf(entry); |
| size_t exit_class = scheduler_->equivalence_->ClassOf(exit); |
| return entry != exit && entry_class == exit_class; |
| } |
| |
| void ResetDataStructures() { |
| control_.clear(); |
| DCHECK(queue_.empty()); |
| DCHECK(control_.empty()); |
| } |
| |
| Zone* zone_; |
| Scheduler* scheduler_; |
| Schedule* schedule_; |
| NodeMarker<bool> queued_; // Mark indicating whether node is queued. |
| ZoneQueue<Node*> queue_; // Queue used for breadth-first traversal. |
| NodeVector control_; // List of encountered control nodes. |
| Node* component_entry_; // Component single-entry node. |
| BasicBlock* component_start_; // Component single-entry block. |
| BasicBlock* component_end_; // Component single-exit block. |
| }; |
| |
| |
| void Scheduler::BuildCFG() { |
| TRACE("--- CREATING CFG -------------------------------------------\n"); |
| |
| // Instantiate a new control equivalence algorithm for the graph. |
| equivalence_ = new (zone_) ControlEquivalence(zone_, graph_); |
| |
| // Build a control-flow graph for the main control-connected component that |
| // is being spanned by the graph's start and end nodes. |
| control_flow_builder_ = new (zone_) CFGBuilder(zone_, this); |
| control_flow_builder_->Run(); |
| |
| // Initialize per-block data. |
| // Reserve an extra 10% to avoid resizing vector when fusing floating control. |
| scheduled_nodes_.reserve(schedule_->BasicBlockCount() * 1.1); |
| scheduled_nodes_.resize(schedule_->BasicBlockCount()); |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 2: Compute special RPO and dominator tree. |
| |
| |
| // Compute the special reverse-post-order block ordering, which is essentially |
| // a RPO of the graph where loop bodies are contiguous. Properties: |
| // 1. If block A is a predecessor of B, then A appears before B in the order, |
| // unless B is a loop header and A is in the loop headed at B |
| // (i.e. A -> B is a backedge). |
| // => If block A dominates block B, then A appears before B in the order. |
| // => If block A is a loop header, A appears before all blocks in the loop |
| // headed at A. |
| // 2. All loops are contiguous in the order (i.e. no intervening blocks that |
| // do not belong to the loop.) |
| // Note a simple RPO traversal satisfies (1) but not (2). |
| class SpecialRPONumberer : public ZoneObject { |
| public: |
| SpecialRPONumberer(Zone* zone, Schedule* schedule) |
| : zone_(zone), |
| schedule_(schedule), |
| order_(nullptr), |
| beyond_end_(nullptr), |
| loops_(zone), |
| backedges_(zone), |
| stack_(zone), |
| previous_block_count_(0), |
| empty_(0, zone) {} |
| |
| // Computes the special reverse-post-order for the main control flow graph, |
| // that is for the graph spanned between the schedule's start and end blocks. |
| void ComputeSpecialRPO() { |
| DCHECK_EQ(0, schedule_->end()->SuccessorCount()); |
| DCHECK(!order_); // Main order does not exist yet. |
| ComputeAndInsertSpecialRPO(schedule_->start(), schedule_->end()); |
| } |
| |
| // Computes the special reverse-post-order for a partial control flow graph, |
| // that is for the graph spanned between the given {entry} and {end} blocks, |
| // then updates the existing ordering with this new information. |
| void UpdateSpecialRPO(BasicBlock* entry, BasicBlock* end) { |
| DCHECK(order_); // Main order to be updated is present. |
| ComputeAndInsertSpecialRPO(entry, end); |
| } |
| |
| // Serialize the previously computed order as a special reverse-post-order |
| // numbering for basic blocks into the final schedule. |
| void SerializeRPOIntoSchedule() { |
| int32_t number = 0; |
| for (BasicBlock* b = order_; b != nullptr; b = b->rpo_next()) { |
| b->set_rpo_number(number++); |
| schedule_->rpo_order()->push_back(b); |
| } |
| BeyondEndSentinel()->set_rpo_number(number); |
| } |
| |
| // Print and verify the special reverse-post-order. |
| void PrintAndVerifySpecialRPO() { |
| #if DEBUG |
| if (FLAG_trace_turbo_scheduler) PrintRPO(); |
| VerifySpecialRPO(); |
| #endif |
| } |
| |
| const ZoneVector<BasicBlock*>& GetOutgoingBlocks(BasicBlock* block) { |
| if (HasLoopNumber(block)) { |
| LoopInfo const& loop = loops_[GetLoopNumber(block)]; |
| if (loop.outgoing) return *loop.outgoing; |
| } |
| return empty_; |
| } |
| |
| private: |
| typedef std::pair<BasicBlock*, size_t> Backedge; |
| |
| // Numbering for BasicBlock::rpo_number for this block traversal: |
| static const int kBlockOnStack = -2; |
| static const int kBlockVisited1 = -3; |
| static const int kBlockVisited2 = -4; |
| static const int kBlockUnvisited1 = -1; |
| static const int kBlockUnvisited2 = kBlockVisited1; |
| |
| struct SpecialRPOStackFrame { |
| BasicBlock* block; |
| size_t index; |
| }; |
| |
| struct LoopInfo { |
| BasicBlock* header; |
| ZoneVector<BasicBlock*>* outgoing; |
| BitVector* members; |
| LoopInfo* prev; |
| BasicBlock* end; |
| BasicBlock* start; |
| |
| void AddOutgoing(Zone* zone, BasicBlock* block) { |
| if (outgoing == nullptr) { |
| outgoing = new (zone->New(sizeof(ZoneVector<BasicBlock*>))) |
| ZoneVector<BasicBlock*>(zone); |
| } |
| outgoing->push_back(block); |
| } |
| }; |
| |
| int Push(ZoneVector<SpecialRPOStackFrame>& stack, int depth, |
| BasicBlock* child, int unvisited) { |
| if (child->rpo_number() == unvisited) { |
| stack[depth].block = child; |
| stack[depth].index = 0; |
| child->set_rpo_number(kBlockOnStack); |
| return depth + 1; |
| } |
| return depth; |
| } |
| |
| BasicBlock* PushFront(BasicBlock* head, BasicBlock* block) { |
| block->set_rpo_next(head); |
| return block; |
| } |
| |
| static int GetLoopNumber(BasicBlock* block) { return block->loop_number(); } |
| static void SetLoopNumber(BasicBlock* block, int loop_number) { |
| return block->set_loop_number(loop_number); |
| } |
| static bool HasLoopNumber(BasicBlock* block) { |
| return block->loop_number() >= 0; |
| } |
| |
| // TODO(mstarzinger): We only need this special sentinel because some tests |
| // use the schedule's end block in actual control flow (e.g. with end having |
| // successors). Once this has been cleaned up we can use the end block here. |
| BasicBlock* BeyondEndSentinel() { |
| if (beyond_end_ == nullptr) { |
| BasicBlock::Id id = BasicBlock::Id::FromInt(-1); |
| beyond_end_ = new (schedule_->zone()) BasicBlock(schedule_->zone(), id); |
| } |
| return beyond_end_; |
| } |
| |
| // Compute special RPO for the control flow graph between {entry} and {end}, |
| // mutating any existing order so that the result is still valid. |
| void ComputeAndInsertSpecialRPO(BasicBlock* entry, BasicBlock* end) { |
| // RPO should not have been serialized for this schedule yet. |
| CHECK_EQ(kBlockUnvisited1, schedule_->start()->loop_number()); |
| CHECK_EQ(kBlockUnvisited1, schedule_->start()->rpo_number()); |
| CHECK_EQ(0, static_cast<int>(schedule_->rpo_order()->size())); |
| |
| // Find correct insertion point within existing order. |
| BasicBlock* insertion_point = entry->rpo_next(); |
| BasicBlock* order = insertion_point; |
| |
| // Perform an iterative RPO traversal using an explicit stack, |
| // recording backedges that form cycles. O(|B|). |
| DCHECK_LT(previous_block_count_, schedule_->BasicBlockCount()); |
| stack_.resize(schedule_->BasicBlockCount() - previous_block_count_); |
| previous_block_count_ = schedule_->BasicBlockCount(); |
| int stack_depth = Push(stack_, 0, entry, kBlockUnvisited1); |
| int num_loops = static_cast<int>(loops_.size()); |
| |
| while (stack_depth > 0) { |
| int current = stack_depth - 1; |
| SpecialRPOStackFrame* frame = &stack_[current]; |
| |
| if (frame->block != end && |
| frame->index < frame->block->SuccessorCount()) { |
| // Process the next successor. |
| BasicBlock* succ = frame->block->SuccessorAt(frame->index++); |
| if (succ->rpo_number() == kBlockVisited1) continue; |
| if (succ->rpo_number() == kBlockOnStack) { |
| // The successor is on the stack, so this is a backedge (cycle). |
| backedges_.push_back(Backedge(frame->block, frame->index - 1)); |
| if (!HasLoopNumber(succ)) { |
| // Assign a new loop number to the header if it doesn't have one. |
| SetLoopNumber(succ, num_loops++); |
| } |
| } else { |
| // Push the successor onto the stack. |
| DCHECK_EQ(kBlockUnvisited1, succ->rpo_number()); |
| stack_depth = Push(stack_, stack_depth, succ, kBlockUnvisited1); |
| } |
| } else { |
| // Finished with all successors; pop the stack and add the block. |
| order = PushFront(order, frame->block); |
| frame->block->set_rpo_number(kBlockVisited1); |
| stack_depth--; |
| } |
| } |
| |
| // If no loops were encountered, then the order we computed was correct. |
| if (num_loops > static_cast<int>(loops_.size())) { |
| // Otherwise, compute the loop information from the backedges in order |
| // to perform a traversal that groups loop bodies together. |
| ComputeLoopInfo(stack_, num_loops, &backedges_); |
| |
| // Initialize the "loop stack". Note the entry could be a loop header. |
| LoopInfo* loop = |
| HasLoopNumber(entry) ? &loops_[GetLoopNumber(entry)] : nullptr; |
| order = insertion_point; |
| |
| // Perform an iterative post-order traversal, visiting loop bodies before |
| // edges that lead out of loops. Visits each block once, but linking loop |
| // sections together is linear in the loop size, so overall is |
| // O(|B| + max(loop_depth) * max(|loop|)) |
| stack_depth = Push(stack_, 0, entry, kBlockUnvisited2); |
| while (stack_depth > 0) { |
| SpecialRPOStackFrame* frame = &stack_[stack_depth - 1]; |
| BasicBlock* block = frame->block; |
| BasicBlock* succ = nullptr; |
| |
| if (block != end && frame->index < block->SuccessorCount()) { |
| // Process the next normal successor. |
| succ = block->SuccessorAt(frame->index++); |
| } else if (HasLoopNumber(block)) { |
| // Process additional outgoing edges from the loop header. |
| if (block->rpo_number() == kBlockOnStack) { |
| // Finish the loop body the first time the header is left on the |
| // stack. |
| DCHECK(loop != nullptr && loop->header == block); |
| loop->start = PushFront(order, block); |
| order = loop->end; |
| block->set_rpo_number(kBlockVisited2); |
| // Pop the loop stack and continue visiting outgoing edges within |
| // the context of the outer loop, if any. |
| loop = loop->prev; |
| // We leave the loop header on the stack; the rest of this iteration |
| // and later iterations will go through its outgoing edges list. |
| } |
| |
| // Use the next outgoing edge if there are any. |
| size_t outgoing_index = frame->index - block->SuccessorCount(); |
| LoopInfo* info = &loops_[GetLoopNumber(block)]; |
| DCHECK(loop != info); |
| if (block != entry && info->outgoing != nullptr && |
| outgoing_index < info->outgoing->size()) { |
| succ = info->outgoing->at(outgoing_index); |
| frame->index++; |
| } |
| } |
| |
| if (succ != nullptr) { |
| // Process the next successor. |
| if (succ->rpo_number() == kBlockOnStack) continue; |
| if (succ->rpo_number() == kBlockVisited2) continue; |
| DCHECK_EQ(kBlockUnvisited2, succ->rpo_number()); |
| if (loop != nullptr && !loop->members->Contains(succ->id().ToInt())) { |
| // The successor is not in the current loop or any nested loop. |
| // Add it to the outgoing edges of this loop and visit it later. |
| loop->AddOutgoing(zone_, succ); |
| } else { |
| // Push the successor onto the stack. |
| stack_depth = Push(stack_, stack_depth, succ, kBlockUnvisited2); |
| if (HasLoopNumber(succ)) { |
| // Push the inner loop onto the loop stack. |
| DCHECK(GetLoopNumber(succ) < num_loops); |
| LoopInfo* next = &loops_[GetLoopNumber(succ)]; |
| next->end = order; |
| next->prev = loop; |
| loop = next; |
| } |
| } |
| } else { |
| // Finished with all successors of the current block. |
| if (HasLoopNumber(block)) { |
| // If we are going to pop a loop header, then add its entire body. |
| LoopInfo* info = &loops_[GetLoopNumber(block)]; |
| for (BasicBlock* b = info->start; true; b = b->rpo_next()) { |
| if (b->rpo_next() == info->end) { |
| b->set_rpo_next(order); |
| info->end = order; |
| break; |
| } |
| } |
| order = info->start; |
| } else { |
| // Pop a single node off the stack and add it to the order. |
| order = PushFront(order, block); |
| block->set_rpo_number(kBlockVisited2); |
| } |
| stack_depth--; |
| } |
| } |
| } |
| |
| // Publish new order the first time. |
| if (order_ == nullptr) order_ = order; |
| |
| // Compute the correct loop headers and set the correct loop ends. |
| LoopInfo* current_loop = nullptr; |
| BasicBlock* current_header = entry->loop_header(); |
| int32_t loop_depth = entry->loop_depth(); |
| if (entry->IsLoopHeader()) --loop_depth; // Entry might be a loop header. |
| for (BasicBlock* b = order; b != insertion_point; b = b->rpo_next()) { |
| BasicBlock* current = b; |
| |
| // Reset BasicBlock::rpo_number again. |
| current->set_rpo_number(kBlockUnvisited1); |
| |
| // Finish the previous loop(s) if we just exited them. |
| while (current_header != nullptr && |
| current == current_header->loop_end()) { |
| DCHECK(current_header->IsLoopHeader()); |
| DCHECK_NOT_NULL(current_loop); |
| current_loop = current_loop->prev; |
| current_header = |
| current_loop == nullptr ? nullptr : current_loop->header; |
| --loop_depth; |
| } |
| current->set_loop_header(current_header); |
| |
| // Push a new loop onto the stack if this loop is a loop header. |
| if (HasLoopNumber(current)) { |
| ++loop_depth; |
| current_loop = &loops_[GetLoopNumber(current)]; |
| BasicBlock* end = current_loop->end; |
| current->set_loop_end(end == nullptr ? BeyondEndSentinel() : end); |
| current_header = current_loop->header; |
| TRACE("id:%d is a loop header, increment loop depth to %d\n", |
| current->id().ToInt(), loop_depth); |
| } |
| |
| current->set_loop_depth(loop_depth); |
| |
| if (current->loop_header() == nullptr) { |
| TRACE("id:%d is not in a loop (depth == %d)\n", current->id().ToInt(), |
| current->loop_depth()); |
| } else { |
| TRACE("id:%d has loop header id:%d, (depth == %d)\n", |
| current->id().ToInt(), current->loop_header()->id().ToInt(), |
| current->loop_depth()); |
| } |
| } |
| } |
| |
| // Computes loop membership from the backedges of the control flow graph. |
| void ComputeLoopInfo(ZoneVector<SpecialRPOStackFrame>& queue, |
| size_t num_loops, ZoneVector<Backedge>* backedges) { |
| // Extend existing loop membership vectors. |
| for (LoopInfo& loop : loops_) { |
| loop.members->Resize(static_cast<int>(schedule_->BasicBlockCount()), |
| zone_); |
| } |
| |
| // Extend loop information vector. |
| loops_.resize(num_loops, LoopInfo()); |
| |
| // Compute loop membership starting from backedges. |
| // O(max(loop_depth) * max(|loop|) |
| for (size_t i = 0; i < backedges->size(); i++) { |
| BasicBlock* member = backedges->at(i).first; |
| BasicBlock* header = member->SuccessorAt(backedges->at(i).second); |
| size_t loop_num = GetLoopNumber(header); |
| if (loops_[loop_num].header == nullptr) { |
| loops_[loop_num].header = header; |
| loops_[loop_num].members = new (zone_) |
| BitVector(static_cast<int>(schedule_->BasicBlockCount()), zone_); |
| } |
| |
| int queue_length = 0; |
| if (member != header) { |
| // As long as the header doesn't have a backedge to itself, |
| // Push the member onto the queue and process its predecessors. |
| if (!loops_[loop_num].members->Contains(member->id().ToInt())) { |
| loops_[loop_num].members->Add(member->id().ToInt()); |
| } |
| queue[queue_length++].block = member; |
| } |
| |
| // Propagate loop membership backwards. All predecessors of M up to the |
| // loop header H are members of the loop too. O(|blocks between M and H|). |
| while (queue_length > 0) { |
| BasicBlock* block = queue[--queue_length].block; |
| for (size_t i = 0; i < block->PredecessorCount(); i++) { |
| BasicBlock* pred = block->PredecessorAt(i); |
| if (pred != header) { |
| if (!loops_[loop_num].members->Contains(pred->id().ToInt())) { |
| loops_[loop_num].members->Add(pred->id().ToInt()); |
| queue[queue_length++].block = pred; |
| } |
| } |
| } |
| } |
| } |
| } |
| |
| #if DEBUG |
| void PrintRPO() { |
| OFStream os(stdout); |
| os << "RPO with " << loops_.size() << " loops"; |
| if (loops_.size() > 0) { |
| os << " ("; |
| for (size_t i = 0; i < loops_.size(); i++) { |
| if (i > 0) os << " "; |
| os << "id:" << loops_[i].header->id(); |
| } |
| os << ")"; |
| } |
| os << ":\n"; |
| |
| for (BasicBlock* block = order_; block != nullptr; |
| block = block->rpo_next()) { |
| os << std::setw(5) << "B" << block->rpo_number() << ":"; |
| for (size_t i = 0; i < loops_.size(); i++) { |
| bool range = loops_[i].header->LoopContains(block); |
| bool membership = loops_[i].header != block && range; |
| os << (membership ? " |" : " "); |
| os << (range ? "x" : " "); |
| } |
| os << " id:" << block->id() << ": "; |
| if (block->loop_end() != nullptr) { |
| os << " range: [B" << block->rpo_number() << ", B" |
| << block->loop_end()->rpo_number() << ")"; |
| } |
| if (block->loop_header() != nullptr) { |
| os << " header: id:" << block->loop_header()->id(); |
| } |
| if (block->loop_depth() > 0) { |
| os << " depth: " << block->loop_depth(); |
| } |
| os << "\n"; |
| } |
| } |
| |
| void VerifySpecialRPO() { |
| BasicBlockVector* order = schedule_->rpo_order(); |
| DCHECK_LT(0, order->size()); |
| DCHECK_EQ(0, (*order)[0]->id().ToInt()); // entry should be first. |
| |
| for (size_t i = 0; i < loops_.size(); i++) { |
| LoopInfo* loop = &loops_[i]; |
| BasicBlock* header = loop->header; |
| BasicBlock* end = header->loop_end(); |
| |
| DCHECK_NOT_NULL(header); |
| DCHECK_LE(0, header->rpo_number()); |
| DCHECK_LT(header->rpo_number(), order->size()); |
| DCHECK_NOT_NULL(end); |
| DCHECK_LE(end->rpo_number(), order->size()); |
| DCHECK_GT(end->rpo_number(), header->rpo_number()); |
| DCHECK_NE(header->loop_header(), header); |
| |
| // Verify the start ... end list relationship. |
| int links = 0; |
| BasicBlock* block = loop->start; |
| DCHECK_EQ(header, block); |
| bool end_found; |
| while (true) { |
| if (block == nullptr || block == loop->end) { |
| end_found = (loop->end == block); |
| break; |
| } |
| // The list should be in same order as the final result. |
| DCHECK(block->rpo_number() == links + header->rpo_number()); |
| links++; |
| block = block->rpo_next(); |
| DCHECK_LT(links, static_cast<int>(2 * order->size())); // cycle? |
| } |
| DCHECK_LT(0, links); |
| DCHECK_EQ(links, end->rpo_number() - header->rpo_number()); |
| DCHECK(end_found); |
| |
| // Check loop depth of the header. |
| int loop_depth = 0; |
| for (LoopInfo* outer = loop; outer != nullptr; outer = outer->prev) { |
| loop_depth++; |
| } |
| DCHECK_EQ(loop_depth, header->loop_depth()); |
| |
| // Check the contiguousness of loops. |
| int count = 0; |
| for (int j = 0; j < static_cast<int>(order->size()); j++) { |
| BasicBlock* block = order->at(j); |
| DCHECK_EQ(block->rpo_number(), j); |
| if (j < header->rpo_number() || j >= end->rpo_number()) { |
| DCHECK(!header->LoopContains(block)); |
| } else { |
| DCHECK(header->LoopContains(block)); |
| DCHECK_GE(block->loop_depth(), loop_depth); |
| count++; |
| } |
| } |
| DCHECK_EQ(links, count); |
| } |
| } |
| #endif // DEBUG |
| |
| Zone* zone_; |
| Schedule* schedule_; |
| BasicBlock* order_; |
| BasicBlock* beyond_end_; |
| ZoneVector<LoopInfo> loops_; |
| ZoneVector<Backedge> backedges_; |
| ZoneVector<SpecialRPOStackFrame> stack_; |
| size_t previous_block_count_; |
| ZoneVector<BasicBlock*> const empty_; |
| }; |
| |
| |
| BasicBlockVector* Scheduler::ComputeSpecialRPO(Zone* zone, Schedule* schedule) { |
| SpecialRPONumberer numberer(zone, schedule); |
| numberer.ComputeSpecialRPO(); |
| numberer.SerializeRPOIntoSchedule(); |
| numberer.PrintAndVerifySpecialRPO(); |
| return schedule->rpo_order(); |
| } |
| |
| |
| void Scheduler::ComputeSpecialRPONumbering() { |
| TRACE("--- COMPUTING SPECIAL RPO ----------------------------------\n"); |
| |
| // Compute the special reverse-post-order for basic blocks. |
| special_rpo_ = new (zone_) SpecialRPONumberer(zone_, schedule_); |
| special_rpo_->ComputeSpecialRPO(); |
| } |
| |
| |
| void Scheduler::PropagateImmediateDominators(BasicBlock* block) { |
| for (/*nop*/; block != nullptr; block = block->rpo_next()) { |
| auto pred = block->predecessors().begin(); |
| auto end = block->predecessors().end(); |
| DCHECK(pred != end); // All blocks except start have predecessors. |
| BasicBlock* dominator = *pred; |
| bool deferred = dominator->deferred(); |
| // For multiple predecessors, walk up the dominator tree until a common |
| // dominator is found. Visitation order guarantees that all predecessors |
| // except for backwards edges have been visited. |
| for (++pred; pred != end; ++pred) { |
| // Don't examine backwards edges. |
| if ((*pred)->dominator_depth() < 0) continue; |
| dominator = BasicBlock::GetCommonDominator(dominator, *pred); |
| deferred = deferred & (*pred)->deferred(); |
| } |
| block->set_dominator(dominator); |
| block->set_dominator_depth(dominator->dominator_depth() + 1); |
| block->set_deferred(deferred | block->deferred()); |
| TRACE("Block id:%d's idom is id:%d, depth = %d\n", block->id().ToInt(), |
| dominator->id().ToInt(), block->dominator_depth()); |
| } |
| } |
| |
| |
| void Scheduler::GenerateImmediateDominatorTree() { |
| TRACE("--- IMMEDIATE BLOCK DOMINATORS -----------------------------\n"); |
| |
| // Seed start block to be the first dominator. |
| schedule_->start()->set_dominator_depth(0); |
| |
| // Build the block dominator tree resulting from the above seed. |
| PropagateImmediateDominators(schedule_->start()->rpo_next()); |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 3: Prepare use counts for nodes. |
| |
| |
| class PrepareUsesVisitor { |
| public: |
| explicit PrepareUsesVisitor(Scheduler* scheduler) |
| : scheduler_(scheduler), schedule_(scheduler->schedule_) {} |
| |
| void Pre(Node* node) { |
| if (scheduler_->InitializePlacement(node) == Scheduler::kFixed) { |
| // Fixed nodes are always roots for schedule late. |
| scheduler_->schedule_root_nodes_.push_back(node); |
| if (!schedule_->IsScheduled(node)) { |
| // Make sure root nodes are scheduled in their respective blocks. |
| TRACE("Scheduling fixed position node #%d:%s\n", node->id(), |
| node->op()->mnemonic()); |
| IrOpcode::Value opcode = node->opcode(); |
| BasicBlock* block = |
| opcode == IrOpcode::kParameter |
| ? schedule_->start() |
| : schedule_->block(NodeProperties::GetControlInput(node)); |
| DCHECK_NOT_NULL(block); |
| schedule_->AddNode(block, node); |
| } |
| } |
| } |
| |
| void PostEdge(Node* from, int index, Node* to) { |
| // If the edge is from an unscheduled node, then tally it in the use count |
| // for all of its inputs. The same criterion will be used in ScheduleLate |
| // for decrementing use counts. |
| if (!schedule_->IsScheduled(from)) { |
| DCHECK_NE(Scheduler::kFixed, scheduler_->GetPlacement(from)); |
| scheduler_->IncrementUnscheduledUseCount(to, index, from); |
| } |
| } |
| |
| private: |
| Scheduler* scheduler_; |
| Schedule* schedule_; |
| }; |
| |
| |
| void Scheduler::PrepareUses() { |
| TRACE("--- PREPARE USES -------------------------------------------\n"); |
| |
| // Count the uses of every node, which is used to ensure that all of a |
| // node's uses are scheduled before the node itself. |
| PrepareUsesVisitor prepare_uses(this); |
| |
| // TODO(turbofan): simplify the careful pre/post ordering here. |
| BoolVector visited(graph_->NodeCount(), false, zone_); |
| ZoneStack<Node::InputEdges::iterator> stack(zone_); |
| Node* node = graph_->end(); |
| prepare_uses.Pre(node); |
| visited[node->id()] = true; |
| stack.push(node->input_edges().begin()); |
| while (!stack.empty()) { |
| Edge edge = *stack.top(); |
| Node* node = edge.to(); |
| if (visited[node->id()]) { |
| prepare_uses.PostEdge(edge.from(), edge.index(), edge.to()); |
| if (++stack.top() == edge.from()->input_edges().end()) stack.pop(); |
| } else { |
| prepare_uses.Pre(node); |
| visited[node->id()] = true; |
| if (node->InputCount() > 0) stack.push(node->input_edges().begin()); |
| } |
| } |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 4: Schedule nodes early. |
| |
| |
| class ScheduleEarlyNodeVisitor { |
| public: |
| ScheduleEarlyNodeVisitor(Zone* zone, Scheduler* scheduler) |
| : scheduler_(scheduler), schedule_(scheduler->schedule_), queue_(zone) {} |
| |
| // Run the schedule early algorithm on a set of fixed root nodes. |
| void Run(NodeVector* roots) { |
| for (Node* const root : *roots) { |
| queue_.push(root); |
| while (!queue_.empty()) { |
| VisitNode(queue_.front()); |
| queue_.pop(); |
| } |
| } |
| } |
| |
| private: |
| // Visits one node from the queue and propagates its current schedule early |
| // position to all uses. This in turn might push more nodes onto the queue. |
| void VisitNode(Node* node) { |
| Scheduler::SchedulerData* data = scheduler_->GetData(node); |
| |
| // Fixed nodes already know their schedule early position. |
| if (scheduler_->GetPlacement(node) == Scheduler::kFixed) { |
| data->minimum_block_ = schedule_->block(node); |
| TRACE("Fixing #%d:%s minimum_block = id:%d, dominator_depth = %d\n", |
| node->id(), node->op()->mnemonic(), |
| data->minimum_block_->id().ToInt(), |
| data->minimum_block_->dominator_depth()); |
| } |
| |
| // No need to propagate unconstrained schedule early positions. |
| if (data->minimum_block_ == schedule_->start()) return; |
| |
| // Propagate schedule early position. |
| DCHECK_NOT_NULL(data->minimum_block_); |
| for (auto use : node->uses()) { |
| if (scheduler_->IsLive(use)) { |
| PropagateMinimumPositionToNode(data->minimum_block_, use); |
| } |
| } |
| } |
| |
| // Propagates {block} as another minimum position into the given {node}. This |
| // has the net effect of computing the minimum dominator block of {node} that |
| // still post-dominates all inputs to {node} when the queue is processed. |
| void PropagateMinimumPositionToNode(BasicBlock* block, Node* node) { |
| Scheduler::SchedulerData* data = scheduler_->GetData(node); |
| |
| // No need to propagate to fixed node, it's guaranteed to be a root. |
| if (scheduler_->GetPlacement(node) == Scheduler::kFixed) return; |
| |
| // Coupled nodes influence schedule early position of their control. |
| if (scheduler_->GetPlacement(node) == Scheduler::kCoupled) { |
| Node* control = NodeProperties::GetControlInput(node); |
| PropagateMinimumPositionToNode(block, control); |
| } |
| |
| // Propagate new position if it is deeper down the dominator tree than the |
| // current. Note that all inputs need to have minimum block position inside |
| // the dominator chain of {node}'s minimum block position. |
| DCHECK(InsideSameDominatorChain(block, data->minimum_block_)); |
| if (block->dominator_depth() > data->minimum_block_->dominator_depth()) { |
| data->minimum_block_ = block; |
| queue_.push(node); |
| TRACE("Propagating #%d:%s minimum_block = id:%d, dominator_depth = %d\n", |
| node->id(), node->op()->mnemonic(), |
| data->minimum_block_->id().ToInt(), |
| data->minimum_block_->dominator_depth()); |
| } |
| } |
| |
| #if DEBUG |
| bool InsideSameDominatorChain(BasicBlock* b1, BasicBlock* b2) { |
| BasicBlock* dominator = BasicBlock::GetCommonDominator(b1, b2); |
| return dominator == b1 || dominator == b2; |
| } |
| #endif |
| |
| Scheduler* scheduler_; |
| Schedule* schedule_; |
| ZoneQueue<Node*> queue_; |
| }; |
| |
| |
| void Scheduler::ScheduleEarly() { |
| TRACE("--- SCHEDULE EARLY -----------------------------------------\n"); |
| if (FLAG_trace_turbo_scheduler) { |
| TRACE("roots: "); |
| for (Node* node : schedule_root_nodes_) { |
| TRACE("#%d:%s ", node->id(), node->op()->mnemonic()); |
| } |
| TRACE("\n"); |
| } |
| |
| // Compute the minimum block for each node thereby determining the earliest |
| // position each node could be placed within a valid schedule. |
| ScheduleEarlyNodeVisitor schedule_early_visitor(zone_, this); |
| schedule_early_visitor.Run(&schedule_root_nodes_); |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 5: Schedule nodes late. |
| |
| |
| class ScheduleLateNodeVisitor { |
| public: |
| ScheduleLateNodeVisitor(Zone* zone, Scheduler* scheduler) |
| : zone_(zone), |
| scheduler_(scheduler), |
| schedule_(scheduler_->schedule_), |
| marked_(scheduler->zone_), |
| marking_queue_(scheduler->zone_) {} |
| |
| // Run the schedule late algorithm on a set of fixed root nodes. |
| void Run(NodeVector* roots) { |
| for (Node* const root : *roots) { |
| ProcessQueue(root); |
| } |
| } |
| |
| private: |
| void ProcessQueue(Node* root) { |
| ZoneQueue<Node*>* queue = &(scheduler_->schedule_queue_); |
| for (Node* node : root->inputs()) { |
| // Don't schedule coupled nodes on their own. |
| if (scheduler_->GetPlacement(node) == Scheduler::kCoupled) { |
| node = NodeProperties::GetControlInput(node); |
| } |
| |
| // Test schedulability condition by looking at unscheduled use count. |
| if (scheduler_->GetData(node)->unscheduled_count_ != 0) continue; |
| |
| queue->push(node); |
| do { |
| Node* const node = queue->front(); |
| queue->pop(); |
| VisitNode(node); |
| } while (!queue->empty()); |
| } |
| } |
| |
| // Visits one node from the queue of schedulable nodes and determines its |
| // schedule late position. Also hoists nodes out of loops to find a more |
| // optimal scheduling position. |
| void VisitNode(Node* node) { |
| DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); |
| |
| // Don't schedule nodes that are already scheduled. |
| if (schedule_->IsScheduled(node)) return; |
| DCHECK_EQ(Scheduler::kSchedulable, scheduler_->GetPlacement(node)); |
| |
| // Determine the dominating block for all of the uses of this node. It is |
| // the latest block that this node can be scheduled in. |
| TRACE("Scheduling #%d:%s\n", node->id(), node->op()->mnemonic()); |
| BasicBlock* block = GetCommonDominatorOfUses(node); |
| DCHECK_NOT_NULL(block); |
| |
| // The schedule early block dominates the schedule late block. |
| BasicBlock* min_block = scheduler_->GetData(node)->minimum_block_; |
| DCHECK_EQ(min_block, BasicBlock::GetCommonDominator(block, min_block)); |
| TRACE( |
| "Schedule late of #%d:%s is id:%d at loop depth %d, minimum = id:%d\n", |
| node->id(), node->op()->mnemonic(), block->id().ToInt(), |
| block->loop_depth(), min_block->id().ToInt()); |
| |
| // Hoist nodes out of loops if possible. Nodes can be hoisted iteratively |
| // into enclosing loop pre-headers until they would precede their schedule |
| // early position. |
| BasicBlock* hoist_block = GetHoistBlock(block); |
| if (hoist_block && |
| hoist_block->dominator_depth() >= min_block->dominator_depth()) { |
| do { |
| TRACE(" hoisting #%d:%s to block id:%d\n", node->id(), |
| node->op()->mnemonic(), hoist_block->id().ToInt()); |
| DCHECK_LT(hoist_block->loop_depth(), block->loop_depth()); |
| block = hoist_block; |
| hoist_block = GetHoistBlock(hoist_block); |
| } while (hoist_block && |
| hoist_block->dominator_depth() >= min_block->dominator_depth()); |
| } else if (scheduler_->flags_ & Scheduler::kSplitNodes) { |
| // Split the {node} if beneficial and return the new {block} for it. |
| block = SplitNode(block, node); |
| } |
| |
| // Schedule the node or a floating control structure. |
| if (IrOpcode::IsMergeOpcode(node->opcode())) { |
| ScheduleFloatingControl(block, node); |
| } else if (node->opcode() == IrOpcode::kFinishRegion) { |
| ScheduleRegion(block, node); |
| } else { |
| ScheduleNode(block, node); |
| } |
| } |
| |
| // Mark {block} and push its non-marked predecessor on the marking queue. |
| void MarkBlock(BasicBlock* block) { |
| DCHECK_LT(block->id().ToSize(), marked_.size()); |
| marked_[block->id().ToSize()] = true; |
| for (BasicBlock* pred_block : block->predecessors()) { |
| DCHECK_LT(pred_block->id().ToSize(), marked_.size()); |
| if (marked_[pred_block->id().ToSize()]) continue; |
| marking_queue_.push_back(pred_block); |
| } |
| } |
| |
| BasicBlock* SplitNode(BasicBlock* block, Node* node) { |
| // For now, we limit splitting to pure nodes. |
| if (!node->op()->HasProperty(Operator::kPure)) return block; |
| // TODO(titzer): fix the special case of splitting of projections. |
| if (node->opcode() == IrOpcode::kProjection) return block; |
| |
| // The {block} is common dominator of all uses of {node}, so we cannot |
| // split anything unless the {block} has at least two successors. |
| DCHECK_EQ(block, GetCommonDominatorOfUses(node)); |
| if (block->SuccessorCount() < 2) return block; |
| |
| // Clear marking bits. |
| DCHECK(marking_queue_.empty()); |
| std::fill(marked_.begin(), marked_.end(), false); |
| marked_.resize(schedule_->BasicBlockCount() + 1, false); |
| |
| // Check if the {node} has uses in {block}. |
| for (Edge edge : node->use_edges()) { |
| if (!scheduler_->IsLive(edge.from())) continue; |
| BasicBlock* use_block = GetBlockForUse(edge); |
| if (use_block == nullptr || marked_[use_block->id().ToSize()]) continue; |
| if (use_block == block) { |
| TRACE(" not splitting #%d:%s, it is used in id:%d\n", node->id(), |
| node->op()->mnemonic(), block->id().ToInt()); |
| marking_queue_.clear(); |
| return block; |
| } |
| MarkBlock(use_block); |
| } |
| |
| // Compute transitive marking closure; a block is marked if all its |
| // successors are marked. |
| do { |
| BasicBlock* top_block = marking_queue_.front(); |
| marking_queue_.pop_front(); |
| if (marked_[top_block->id().ToSize()]) continue; |
| bool marked = true; |
| for (BasicBlock* successor : top_block->successors()) { |
| if (!marked_[successor->id().ToSize()]) { |
| marked = false; |
| break; |
| } |
| } |
| if (marked) MarkBlock(top_block); |
| } while (!marking_queue_.empty()); |
| |
| // If the (common dominator) {block} is marked, we know that all paths from |
| // {block} to the end contain at least one use of {node}, and hence there's |
| // no point in splitting the {node} in this case. |
| if (marked_[block->id().ToSize()]) { |
| TRACE(" not splitting #%d:%s, its common dominator id:%d is perfect\n", |
| node->id(), node->op()->mnemonic(), block->id().ToInt()); |
| return block; |
| } |
| |
| // Split {node} for uses according to the previously computed marking |
| // closure. Every marking partition has a unique dominator, which get's a |
| // copy of the {node} with the exception of the first partition, which get's |
| // the {node} itself. |
| ZoneMap<BasicBlock*, Node*> dominators(scheduler_->zone_); |
| for (Edge edge : node->use_edges()) { |
| if (!scheduler_->IsLive(edge.from())) continue; |
| BasicBlock* use_block = GetBlockForUse(edge); |
| if (use_block == nullptr) continue; |
| while (marked_[use_block->dominator()->id().ToSize()]) { |
| use_block = use_block->dominator(); |
| } |
| auto& use_node = dominators[use_block]; |
| if (use_node == nullptr) { |
| if (dominators.size() == 1u) { |
| // Place the {node} at {use_block}. |
| block = use_block; |
| use_node = node; |
| TRACE(" pushing #%d:%s down to id:%d\n", node->id(), |
| node->op()->mnemonic(), block->id().ToInt()); |
| } else { |
| // Place a copy of {node} at {use_block}. |
| use_node = CloneNode(node); |
| TRACE(" cloning #%d:%s for id:%d\n", use_node->id(), |
| use_node->op()->mnemonic(), use_block->id().ToInt()); |
| scheduler_->schedule_queue_.push(use_node); |
| } |
| } |
| edge.UpdateTo(use_node); |
| } |
| return block; |
| } |
| |
| BasicBlock* GetHoistBlock(BasicBlock* block) { |
| if (block->IsLoopHeader()) return block->dominator(); |
| // We have to check to make sure that the {block} dominates all |
| // of the outgoing blocks. If it doesn't, then there is a path |
| // out of the loop which does not execute this {block}, so we |
| // can't hoist operations from this {block} out of the loop, as |
| // that would introduce additional computations. |
| if (BasicBlock* header_block = block->loop_header()) { |
| for (BasicBlock* outgoing_block : |
| scheduler_->special_rpo_->GetOutgoingBlocks(header_block)) { |
| if (BasicBlock::GetCommonDominator(block, outgoing_block) != block) { |
| return nullptr; |
| } |
| } |
| return header_block->dominator(); |
| } |
| return nullptr; |
| } |
| |
| BasicBlock* GetCommonDominatorOfUses(Node* node) { |
| BasicBlock* block = nullptr; |
| for (Edge edge : node->use_edges()) { |
| if (!scheduler_->IsLive(edge.from())) continue; |
| BasicBlock* use_block = GetBlockForUse(edge); |
| block = block == nullptr |
| ? use_block |
| : use_block == nullptr |
| ? block |
| : BasicBlock::GetCommonDominator(block, use_block); |
| } |
| return block; |
| } |
| |
| BasicBlock* FindPredecessorBlock(Node* node) { |
| return scheduler_->control_flow_builder_->FindPredecessorBlock(node); |
| } |
| |
| BasicBlock* GetBlockForUse(Edge edge) { |
| // TODO(titzer): ignore uses from dead nodes (not visited in PrepareUses()). |
| // Dead uses only occur if the graph is not trimmed before scheduling. |
| Node* use = edge.from(); |
| if (IrOpcode::IsPhiOpcode(use->opcode())) { |
| // If the use is from a coupled (i.e. floating) phi, compute the common |
| // dominator of its uses. This will not recurse more than one level. |
| if (scheduler_->GetPlacement(use) == Scheduler::kCoupled) { |
| TRACE(" inspecting uses of coupled #%d:%s\n", use->id(), |
| use->op()->mnemonic()); |
| // TODO(titzer): reenable once above TODO is addressed. |
| // DCHECK_EQ(edge.to(), NodeProperties::GetControlInput(use)); |
| return GetCommonDominatorOfUses(use); |
| } |
| // If the use is from a fixed (i.e. non-floating) phi, we use the |
| // predecessor block of the corresponding control input to the merge. |
| if (scheduler_->GetPlacement(use) == Scheduler::kFixed) { |
| TRACE(" input@%d into a fixed phi #%d:%s\n", edge.index(), use->id(), |
| use->op()->mnemonic()); |
| Node* merge = NodeProperties::GetControlInput(use, 0); |
| DCHECK(IrOpcode::IsMergeOpcode(merge->opcode())); |
| Node* input = NodeProperties::GetControlInput(merge, edge.index()); |
| return FindPredecessorBlock(input); |
| } |
| } else if (IrOpcode::IsMergeOpcode(use->opcode())) { |
| // If the use is from a fixed (i.e. non-floating) merge, we use the |
| // predecessor block of the current input to the merge. |
| if (scheduler_->GetPlacement(use) == Scheduler::kFixed) { |
| TRACE(" input@%d into a fixed merge #%d:%s\n", edge.index(), use->id(), |
| use->op()->mnemonic()); |
| return FindPredecessorBlock(edge.to()); |
| } |
| } |
| BasicBlock* result = schedule_->block(use); |
| if (result == nullptr) return nullptr; |
| TRACE(" must dominate use #%d:%s in id:%d\n", use->id(), |
| use->op()->mnemonic(), result->id().ToInt()); |
| return result; |
| } |
| |
| void ScheduleFloatingControl(BasicBlock* block, Node* node) { |
| scheduler_->FuseFloatingControl(block, node); |
| } |
| |
| void ScheduleRegion(BasicBlock* block, Node* region_end) { |
| // We only allow regions of instructions connected into a linear |
| // effect chain. The only value allowed to be produced by a node |
| // in the chain must be the value consumed by the FinishRegion node. |
| |
| // We schedule back to front; we first schedule FinishRegion. |
| CHECK_EQ(IrOpcode::kFinishRegion, region_end->opcode()); |
| ScheduleNode(block, region_end); |
| |
| // Schedule the chain. |
| Node* node = NodeProperties::GetEffectInput(region_end); |
| while (node->opcode() != IrOpcode::kBeginRegion) { |
| DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); |
| DCHECK_EQ(1, node->op()->EffectInputCount()); |
| DCHECK_EQ(1, node->op()->EffectOutputCount()); |
| DCHECK_EQ(0, node->op()->ControlOutputCount()); |
| // The value output (if there is any) must be consumed |
| // by the EndRegion node. |
| DCHECK(node->op()->ValueOutputCount() == 0 || |
| node == region_end->InputAt(0)); |
| ScheduleNode(block, node); |
| node = NodeProperties::GetEffectInput(node); |
| } |
| // Schedule the BeginRegion node. |
| DCHECK_EQ(0, scheduler_->GetData(node)->unscheduled_count_); |
| ScheduleNode(block, node); |
| } |
| |
| void ScheduleNode(BasicBlock* block, Node* node) { |
| schedule_->PlanNode(block, node); |
| size_t block_id = block->id().ToSize(); |
| if (!scheduler_->scheduled_nodes_[block_id]) { |
| scheduler_->scheduled_nodes_[block_id] = |
| new (zone_->New(sizeof(NodeVector))) NodeVector(zone_); |
| } |
| scheduler_->scheduled_nodes_[block_id]->push_back(node); |
| scheduler_->UpdatePlacement(node, Scheduler::kScheduled); |
| } |
| |
| Node* CloneNode(Node* node) { |
| int const input_count = node->InputCount(); |
| for (int index = 0; index < input_count; ++index) { |
| Node* const input = node->InputAt(index); |
| scheduler_->IncrementUnscheduledUseCount(input, index, node); |
| } |
| Node* const copy = scheduler_->graph_->CloneNode(node); |
| TRACE(("clone #%d:%s -> #%d\n"), node->id(), node->op()->mnemonic(), |
| copy->id()); |
| scheduler_->node_data_.resize(copy->id() + 1, |
| scheduler_->DefaultSchedulerData()); |
| scheduler_->node_data_[copy->id()] = scheduler_->node_data_[node->id()]; |
| return copy; |
| } |
| |
| Zone* zone_; |
| Scheduler* scheduler_; |
| Schedule* schedule_; |
| BoolVector marked_; |
| ZoneDeque<BasicBlock*> marking_queue_; |
| }; |
| |
| |
| void Scheduler::ScheduleLate() { |
| TRACE("--- SCHEDULE LATE ------------------------------------------\n"); |
| if (FLAG_trace_turbo_scheduler) { |
| TRACE("roots: "); |
| for (Node* node : schedule_root_nodes_) { |
| TRACE("#%d:%s ", node->id(), node->op()->mnemonic()); |
| } |
| TRACE("\n"); |
| } |
| |
| // Schedule: Places nodes in dominator block of all their uses. |
| ScheduleLateNodeVisitor schedule_late_visitor(zone_, this); |
| schedule_late_visitor.Run(&schedule_root_nodes_); |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| // Phase 6: Seal the final schedule. |
| |
| |
| void Scheduler::SealFinalSchedule() { |
| TRACE("--- SEAL FINAL SCHEDULE ------------------------------------\n"); |
| |
| // Serialize the assembly order and reverse-post-order numbering. |
| special_rpo_->SerializeRPOIntoSchedule(); |
| special_rpo_->PrintAndVerifySpecialRPO(); |
| |
| // Add collected nodes for basic blocks to their blocks in the right order. |
| int block_num = 0; |
| for (NodeVector* nodes : scheduled_nodes_) { |
| BasicBlock::Id id = BasicBlock::Id::FromInt(block_num++); |
| BasicBlock* block = schedule_->GetBlockById(id); |
| if (nodes) { |
| for (Node* node : base::Reversed(*nodes)) { |
| schedule_->AddNode(block, node); |
| } |
| } |
| } |
| } |
| |
| |
| // ----------------------------------------------------------------------------- |
| |
| |
| void Scheduler::FuseFloatingControl(BasicBlock* block, Node* node) { |
| TRACE("--- FUSE FLOATING CONTROL ----------------------------------\n"); |
| if (FLAG_trace_turbo_scheduler) { |
| OFStream os(stdout); |
| os << "Schedule before control flow fusion:\n" << *schedule_; |
| } |
| |
| // Iterate on phase 1: Build control-flow graph. |
| control_flow_builder_->Run(block, node); |
| |
| // Iterate on phase 2: Compute special RPO and dominator tree. |
| special_rpo_->UpdateSpecialRPO(block, schedule_->block(node)); |
| // TODO(mstarzinger): Currently "iterate on" means "re-run". Fix that. |
| for (BasicBlock* b = block->rpo_next(); b != nullptr; b = b->rpo_next()) { |
| b->set_dominator_depth(-1); |
| b->set_dominator(nullptr); |
| } |
| PropagateImmediateDominators(block->rpo_next()); |
| |
| // Iterate on phase 4: Schedule nodes early. |
| // TODO(mstarzinger): The following loop gathering the propagation roots is a |
| // temporary solution and should be merged into the rest of the scheduler as |
| // soon as the approach settled for all floating loops. |
| NodeVector propagation_roots(control_flow_builder_->control_); |
| for (Node* node : control_flow_builder_->control_) { |
| for (Node* use : node->uses()) { |
| if (NodeProperties::IsPhi(use) && IsLive(use)) { |
| propagation_roots.push_back(use); |
| } |
| } |
| } |
| if (FLAG_trace_turbo_scheduler) { |
| TRACE("propagation roots: "); |
| for (Node* node : propagation_roots) { |
| TRACE("#%d:%s ", node->id(), node->op()->mnemonic()); |
| } |
| TRACE("\n"); |
| } |
| ScheduleEarlyNodeVisitor schedule_early_visitor(zone_, this); |
| schedule_early_visitor.Run(&propagation_roots); |
| |
| // Move previously planned nodes. |
| // TODO(mstarzinger): Improve that by supporting bulk moves. |
| scheduled_nodes_.resize(schedule_->BasicBlockCount()); |
| MovePlannedNodes(block, schedule_->block(node)); |
| |
| if (FLAG_trace_turbo_scheduler) { |
| OFStream os(stdout); |
| os << "Schedule after control flow fusion:\n" << *schedule_; |
| } |
| } |
| |
| |
| void Scheduler::MovePlannedNodes(BasicBlock* from, BasicBlock* to) { |
| TRACE("Move planned nodes from id:%d to id:%d\n", from->id().ToInt(), |
| to->id().ToInt()); |
| NodeVector* from_nodes = scheduled_nodes_[from->id().ToSize()]; |
| NodeVector* to_nodes = scheduled_nodes_[to->id().ToSize()]; |
| if (!from_nodes) return; |
| |
| for (Node* const node : *from_nodes) { |
| schedule_->SetBlockForNode(to, node); |
| } |
| if (to_nodes) { |
| to_nodes->insert(to_nodes->end(), from_nodes->begin(), from_nodes->end()); |
| from_nodes->clear(); |
| } else { |
| std::swap(scheduled_nodes_[from->id().ToSize()], |
| scheduled_nodes_[to->id().ToSize()]); |
| } |
| } |
| |
| #undef TRACE |
| |
| } // namespace compiler |
| } // namespace internal |
| } // namespace v8 |