| // Copyright 2014 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "src/compiler/loop-analysis.h" |
| |
| #include "src/codegen/tick-counter.h" |
| #include "src/compiler/graph.h" |
| #include "src/compiler/node-marker.h" |
| #include "src/compiler/node-properties.h" |
| #include "src/compiler/node.h" |
| #include "src/zone/zone.h" |
| |
| namespace v8 { |
| namespace internal { |
| |
| class TickCounter; |
| |
| namespace compiler { |
| |
| #define OFFSET(x) ((x)&0x1F) |
| #define BIT(x) (1u << OFFSET(x)) |
| #define INDEX(x) ((x) >> 5) |
| |
| // Temporary information for each node during marking. |
| struct NodeInfo { |
| Node* node; |
| NodeInfo* next; // link in chaining loop members |
| }; |
| |
| |
| // Temporary loop info needed during traversal and building the loop tree. |
| struct TempLoopInfo { |
| Node* header; |
| NodeInfo* header_list; |
| NodeInfo* exit_list; |
| NodeInfo* body_list; |
| LoopTree::Loop* loop; |
| }; |
| |
| |
| // Encapsulation of the loop finding algorithm. |
| // ----------------------------------------------------------------------------- |
| // Conceptually, the contents of a loop are those nodes that are "between" the |
| // loop header and the backedges of the loop. Graphs in the soup of nodes can |
| // form improper cycles, so standard loop finding algorithms that work on CFGs |
| // aren't sufficient. However, in valid TurboFan graphs, all cycles involve |
| // either a {Loop} node or a phi. The {Loop} node itself and its accompanying |
| // phis are treated together as a set referred to here as the loop header. |
| // This loop finding algorithm works by traversing the graph in two directions, |
| // first from nodes to their inputs, starting at {end}, then in the reverse |
| // direction, from nodes to their uses, starting at loop headers. |
| // 1 bit per loop per node per direction are required during the marking phase. |
| // To handle nested loops correctly, the algorithm must filter some reachability |
| // marks on edges into/out-of the loop header nodes. |
| class LoopFinderImpl { |
| public: |
| LoopFinderImpl(Graph* graph, LoopTree* loop_tree, TickCounter* tick_counter, |
| Zone* zone) |
| : zone_(zone), |
| end_(graph->end()), |
| queue_(zone), |
| queued_(graph, 2), |
| info_(graph->NodeCount(), {nullptr, nullptr}, zone), |
| loops_(zone), |
| loop_num_(graph->NodeCount(), -1, zone), |
| loop_tree_(loop_tree), |
| loops_found_(0), |
| width_(0), |
| backward_(nullptr), |
| forward_(nullptr), |
| tick_counter_(tick_counter) {} |
| |
| void Run() { |
| PropagateBackward(); |
| PropagateForward(); |
| FinishLoopTree(); |
| } |
| |
| void Print() { |
| // Print out the results. |
| for (NodeInfo& ni : info_) { |
| if (ni.node == nullptr) continue; |
| for (int i = 1; i <= loops_found_; i++) { |
| int index = ni.node->id() * width_ + INDEX(i); |
| bool marked_forward = forward_[index] & BIT(i); |
| bool marked_backward = backward_[index] & BIT(i); |
| if (marked_forward && marked_backward) { |
| PrintF("X"); |
| } else if (marked_forward) { |
| PrintF(">"); |
| } else if (marked_backward) { |
| PrintF("<"); |
| } else { |
| PrintF(" "); |
| } |
| } |
| PrintF(" #%d:%s\n", ni.node->id(), ni.node->op()->mnemonic()); |
| } |
| |
| int i = 0; |
| for (TempLoopInfo& li : loops_) { |
| PrintF("Loop %d headed at #%d\n", i, li.header->id()); |
| i++; |
| } |
| |
| for (LoopTree::Loop* loop : loop_tree_->outer_loops_) { |
| PrintLoop(loop); |
| } |
| } |
| |
| private: |
| Zone* zone_; |
| Node* end_; |
| NodeDeque queue_; |
| NodeMarker<bool> queued_; |
| ZoneVector<NodeInfo> info_; |
| ZoneVector<TempLoopInfo> loops_; |
| ZoneVector<int> loop_num_; |
| LoopTree* loop_tree_; |
| int loops_found_; |
| int width_; |
| uint32_t* backward_; |
| uint32_t* forward_; |
| TickCounter* const tick_counter_; |
| |
| int num_nodes() { |
| return static_cast<int>(loop_tree_->node_to_loop_num_.size()); |
| } |
| |
| // Tb = Tb | (Fb - loop_filter) |
| bool PropagateBackwardMarks(Node* from, Node* to, int loop_filter) { |
| if (from == to) return false; |
| uint32_t* fp = &backward_[from->id() * width_]; |
| uint32_t* tp = &backward_[to->id() * width_]; |
| bool change = false; |
| for (int i = 0; i < width_; i++) { |
| uint32_t mask = i == INDEX(loop_filter) ? ~BIT(loop_filter) : 0xFFFFFFFF; |
| uint32_t prev = tp[i]; |
| uint32_t next = prev | (fp[i] & mask); |
| tp[i] = next; |
| if (!change && (prev != next)) change = true; |
| } |
| return change; |
| } |
| |
| // Tb = Tb | B |
| bool SetBackwardMark(Node* to, int loop_num) { |
| uint32_t* tp = &backward_[to->id() * width_ + INDEX(loop_num)]; |
| uint32_t prev = tp[0]; |
| uint32_t next = prev | BIT(loop_num); |
| tp[0] = next; |
| return next != prev; |
| } |
| |
| // Tf = Tf | B |
| bool SetForwardMark(Node* to, int loop_num) { |
| uint32_t* tp = &forward_[to->id() * width_ + INDEX(loop_num)]; |
| uint32_t prev = tp[0]; |
| uint32_t next = prev | BIT(loop_num); |
| tp[0] = next; |
| return next != prev; |
| } |
| |
| // Tf = Tf | (Ff & Tb) |
| bool PropagateForwardMarks(Node* from, Node* to) { |
| if (from == to) return false; |
| bool change = false; |
| int findex = from->id() * width_; |
| int tindex = to->id() * width_; |
| for (int i = 0; i < width_; i++) { |
| uint32_t marks = backward_[tindex + i] & forward_[findex + i]; |
| uint32_t prev = forward_[tindex + i]; |
| uint32_t next = prev | marks; |
| forward_[tindex + i] = next; |
| if (!change && (prev != next)) change = true; |
| } |
| return change; |
| } |
| |
| bool IsInLoop(Node* node, int loop_num) { |
| int offset = node->id() * width_ + INDEX(loop_num); |
| return backward_[offset] & forward_[offset] & BIT(loop_num); |
| } |
| |
| // Propagate marks backward from loop headers. |
| void PropagateBackward() { |
| ResizeBackwardMarks(); |
| SetBackwardMark(end_, 0); |
| Queue(end_); |
| |
| while (!queue_.empty()) { |
| tick_counter_->TickAndMaybeEnterSafepoint(); |
| Node* node = queue_.front(); |
| info(node); |
| queue_.pop_front(); |
| queued_.Set(node, false); |
| |
| int loop_num = -1; |
| // Setup loop headers first. |
| if (node->opcode() == IrOpcode::kLoop) { |
| // found the loop node first. |
| loop_num = CreateLoopInfo(node); |
| } else if (NodeProperties::IsPhi(node)) { |
| // found a phi first. |
| Node* merge = node->InputAt(node->InputCount() - 1); |
| if (merge->opcode() == IrOpcode::kLoop) { |
| loop_num = CreateLoopInfo(merge); |
| } |
| } else if (node->opcode() == IrOpcode::kLoopExit) { |
| // Intentionally ignore return value. Loop exit node marks |
| // are propagated normally. |
| CreateLoopInfo(node->InputAt(1)); |
| } else if (node->opcode() == IrOpcode::kLoopExitValue || |
| node->opcode() == IrOpcode::kLoopExitEffect) { |
| Node* loop_exit = NodeProperties::GetControlInput(node); |
| // Intentionally ignore return value. Loop exit node marks |
| // are propagated normally. |
| CreateLoopInfo(loop_exit->InputAt(1)); |
| } |
| |
| // Propagate marks backwards from this node. |
| for (int i = 0; i < node->InputCount(); i++) { |
| Node* input = node->InputAt(i); |
| if (IsBackedge(node, i)) { |
| // Only propagate the loop mark on backedges. |
| if (SetBackwardMark(input, loop_num)) Queue(input); |
| } else { |
| // Entry or normal edge. Propagate all marks except loop_num. |
| if (PropagateBackwardMarks(node, input, loop_num)) Queue(input); |
| } |
| } |
| } |
| } |
| |
| // Make a new loop if necessary for the given node. |
| int CreateLoopInfo(Node* node) { |
| DCHECK_EQ(IrOpcode::kLoop, node->opcode()); |
| int loop_num = LoopNum(node); |
| if (loop_num > 0) return loop_num; |
| |
| loop_num = ++loops_found_; |
| if (INDEX(loop_num) >= width_) ResizeBackwardMarks(); |
| |
| // Create a new loop. |
| loops_.push_back({node, nullptr, nullptr, nullptr, nullptr}); |
| loop_tree_->NewLoop(); |
| SetLoopMarkForLoopHeader(node, loop_num); |
| return loop_num; |
| } |
| |
| void SetLoopMark(Node* node, int loop_num) { |
| info(node); // create the NodeInfo |
| SetBackwardMark(node, loop_num); |
| loop_tree_->node_to_loop_num_[node->id()] = loop_num; |
| } |
| |
| void SetLoopMarkForLoopHeader(Node* node, int loop_num) { |
| DCHECK_EQ(IrOpcode::kLoop, node->opcode()); |
| SetLoopMark(node, loop_num); |
| for (Node* use : node->uses()) { |
| if (NodeProperties::IsPhi(use)) { |
| SetLoopMark(use, loop_num); |
| } |
| |
| // Do not keep the loop alive if it does not have any backedges. |
| if (node->InputCount() <= 1) continue; |
| |
| if (use->opcode() == IrOpcode::kLoopExit) { |
| SetLoopMark(use, loop_num); |
| for (Node* exit_use : use->uses()) { |
| if (exit_use->opcode() == IrOpcode::kLoopExitValue || |
| exit_use->opcode() == IrOpcode::kLoopExitEffect) { |
| SetLoopMark(exit_use, loop_num); |
| } |
| } |
| } |
| } |
| } |
| |
| void ResizeBackwardMarks() { |
| int new_width = width_ + 1; |
| int max = num_nodes(); |
| uint32_t* new_backward = zone_->NewArray<uint32_t>(new_width * max); |
| memset(new_backward, 0, new_width * max * sizeof(uint32_t)); |
| if (width_ > 0) { // copy old matrix data. |
| for (int i = 0; i < max; i++) { |
| uint32_t* np = &new_backward[i * new_width]; |
| uint32_t* op = &backward_[i * width_]; |
| for (int j = 0; j < width_; j++) np[j] = op[j]; |
| } |
| } |
| width_ = new_width; |
| backward_ = new_backward; |
| } |
| |
| void ResizeForwardMarks() { |
| int max = num_nodes(); |
| forward_ = zone_->NewArray<uint32_t>(width_ * max); |
| memset(forward_, 0, width_ * max * sizeof(uint32_t)); |
| } |
| |
| // Propagate marks forward from loops. |
| void PropagateForward() { |
| ResizeForwardMarks(); |
| for (TempLoopInfo& li : loops_) { |
| SetForwardMark(li.header, LoopNum(li.header)); |
| Queue(li.header); |
| } |
| // Propagate forward on paths that were backward reachable from backedges. |
| while (!queue_.empty()) { |
| tick_counter_->TickAndMaybeEnterSafepoint(); |
| Node* node = queue_.front(); |
| queue_.pop_front(); |
| queued_.Set(node, false); |
| for (Edge edge : node->use_edges()) { |
| Node* use = edge.from(); |
| if (!IsBackedge(use, edge.index())) { |
| if (PropagateForwardMarks(node, use)) Queue(use); |
| } |
| } |
| } |
| } |
| |
| bool IsLoopHeaderNode(Node* node) { |
| return node->opcode() == IrOpcode::kLoop || NodeProperties::IsPhi(node); |
| } |
| |
| bool IsLoopExitNode(Node* node) { |
| return node->opcode() == IrOpcode::kLoopExit || |
| node->opcode() == IrOpcode::kLoopExitValue || |
| node->opcode() == IrOpcode::kLoopExitEffect; |
| } |
| |
| bool IsBackedge(Node* use, int index) { |
| if (LoopNum(use) <= 0) return false; |
| if (NodeProperties::IsPhi(use)) { |
| return index != NodeProperties::FirstControlIndex(use) && |
| index != kAssumedLoopEntryIndex; |
| } else if (use->opcode() == IrOpcode::kLoop) { |
| return index != kAssumedLoopEntryIndex; |
| } |
| DCHECK(IsLoopExitNode(use)); |
| return false; |
| } |
| |
| int LoopNum(Node* node) { return loop_tree_->node_to_loop_num_[node->id()]; } |
| |
| NodeInfo& info(Node* node) { |
| NodeInfo& i = info_[node->id()]; |
| if (i.node == nullptr) i.node = node; |
| return i; |
| } |
| |
| void Queue(Node* node) { |
| if (!queued_.Get(node)) { |
| queue_.push_back(node); |
| queued_.Set(node, true); |
| } |
| } |
| |
| void AddNodeToLoop(NodeInfo* node_info, TempLoopInfo* loop, int loop_num) { |
| if (LoopNum(node_info->node) == loop_num) { |
| if (IsLoopHeaderNode(node_info->node)) { |
| node_info->next = loop->header_list; |
| loop->header_list = node_info; |
| } else { |
| DCHECK(IsLoopExitNode(node_info->node)); |
| node_info->next = loop->exit_list; |
| loop->exit_list = node_info; |
| } |
| } else { |
| node_info->next = loop->body_list; |
| loop->body_list = node_info; |
| } |
| } |
| |
| void FinishLoopTree() { |
| DCHECK(loops_found_ == static_cast<int>(loops_.size())); |
| DCHECK(loops_found_ == static_cast<int>(loop_tree_->all_loops_.size())); |
| |
| // Degenerate cases. |
| if (loops_found_ == 0) return; |
| if (loops_found_ == 1) return FinishSingleLoop(); |
| |
| for (int i = 1; i <= loops_found_; i++) ConnectLoopTree(i); |
| |
| size_t count = 0; |
| // Place the node into the innermost nested loop of which it is a member. |
| for (NodeInfo& ni : info_) { |
| if (ni.node == nullptr) continue; |
| |
| TempLoopInfo* innermost = nullptr; |
| int innermost_index = 0; |
| int pos = ni.node->id() * width_; |
| // Search the marks word by word. |
| for (int i = 0; i < width_; i++) { |
| uint32_t marks = backward_[pos + i] & forward_[pos + i]; |
| |
| for (int j = 0; j < 32; j++) { |
| if (marks & (1u << j)) { |
| int loop_num = i * 32 + j; |
| if (loop_num == 0) continue; |
| TempLoopInfo* loop = &loops_[loop_num - 1]; |
| if (innermost == nullptr || |
| loop->loop->depth_ > innermost->loop->depth_) { |
| innermost = loop; |
| innermost_index = loop_num; |
| } |
| } |
| } |
| } |
| if (innermost == nullptr) continue; |
| |
| // Return statements should never be found by forward or backward walk. |
| CHECK(ni.node->opcode() != IrOpcode::kReturn); |
| |
| AddNodeToLoop(&ni, innermost, innermost_index); |
| count++; |
| } |
| |
| // Serialize the node lists for loops into the loop tree. |
| loop_tree_->loop_nodes_.reserve(count); |
| for (LoopTree::Loop* loop : loop_tree_->outer_loops_) { |
| SerializeLoop(loop); |
| } |
| } |
| |
| // Handle the simpler case of a single loop (no checks for nesting necessary). |
| void FinishSingleLoop() { |
| // Place nodes into the loop header and body. |
| TempLoopInfo* li = &loops_[0]; |
| li->loop = &loop_tree_->all_loops_[0]; |
| loop_tree_->SetParent(nullptr, li->loop); |
| size_t count = 0; |
| for (NodeInfo& ni : info_) { |
| if (ni.node == nullptr || !IsInLoop(ni.node, 1)) continue; |
| |
| // Return statements should never be found by forward or backward walk. |
| CHECK(ni.node->opcode() != IrOpcode::kReturn); |
| |
| AddNodeToLoop(&ni, li, 1); |
| count++; |
| } |
| |
| // Serialize the node lists for the loop into the loop tree. |
| loop_tree_->loop_nodes_.reserve(count); |
| SerializeLoop(li->loop); |
| } |
| |
| // Recursively serialize the list of header nodes and body nodes |
| // so that nested loops occupy nested intervals. |
| void SerializeLoop(LoopTree::Loop* loop) { |
| int loop_num = loop_tree_->LoopNum(loop); |
| TempLoopInfo& li = loops_[loop_num - 1]; |
| |
| // Serialize the header. |
| loop->header_start_ = static_cast<int>(loop_tree_->loop_nodes_.size()); |
| for (NodeInfo* ni = li.header_list; ni != nullptr; ni = ni->next) { |
| loop_tree_->loop_nodes_.push_back(ni->node); |
| loop_tree_->node_to_loop_num_[ni->node->id()] = loop_num; |
| } |
| |
| // Serialize the body. |
| loop->body_start_ = static_cast<int>(loop_tree_->loop_nodes_.size()); |
| for (NodeInfo* ni = li.body_list; ni != nullptr; ni = ni->next) { |
| loop_tree_->loop_nodes_.push_back(ni->node); |
| loop_tree_->node_to_loop_num_[ni->node->id()] = loop_num; |
| } |
| |
| // Serialize nested loops. |
| for (LoopTree::Loop* child : loop->children_) SerializeLoop(child); |
| |
| // Serialize the exits. |
| loop->exits_start_ = static_cast<int>(loop_tree_->loop_nodes_.size()); |
| for (NodeInfo* ni = li.exit_list; ni != nullptr; ni = ni->next) { |
| loop_tree_->loop_nodes_.push_back(ni->node); |
| loop_tree_->node_to_loop_num_[ni->node->id()] = loop_num; |
| } |
| |
| loop->exits_end_ = static_cast<int>(loop_tree_->loop_nodes_.size()); |
| } |
| |
| // Connect the LoopTree loops to their parents recursively. |
| LoopTree::Loop* ConnectLoopTree(int loop_num) { |
| TempLoopInfo& li = loops_[loop_num - 1]; |
| if (li.loop != nullptr) return li.loop; |
| |
| NodeInfo& ni = info(li.header); |
| LoopTree::Loop* parent = nullptr; |
| for (int i = 1; i <= loops_found_; i++) { |
| if (i == loop_num) continue; |
| if (IsInLoop(ni.node, i)) { |
| // recursively create potential parent loops first. |
| LoopTree::Loop* upper = ConnectLoopTree(i); |
| if (parent == nullptr || upper->depth_ > parent->depth_) { |
| parent = upper; |
| } |
| } |
| } |
| li.loop = &loop_tree_->all_loops_[loop_num - 1]; |
| loop_tree_->SetParent(parent, li.loop); |
| return li.loop; |
| } |
| |
| void PrintLoop(LoopTree::Loop* loop) { |
| for (int i = 0; i < loop->depth_; i++) PrintF(" "); |
| PrintF("Loop depth = %d ", loop->depth_); |
| int i = loop->header_start_; |
| while (i < loop->body_start_) { |
| PrintF(" H#%d", loop_tree_->loop_nodes_[i++]->id()); |
| } |
| while (i < loop->exits_start_) { |
| PrintF(" B#%d", loop_tree_->loop_nodes_[i++]->id()); |
| } |
| while (i < loop->exits_end_) { |
| PrintF(" E#%d", loop_tree_->loop_nodes_[i++]->id()); |
| } |
| PrintF("\n"); |
| for (LoopTree::Loop* child : loop->children_) PrintLoop(child); |
| } |
| }; |
| |
| LoopTree* LoopFinder::BuildLoopTree(Graph* graph, TickCounter* tick_counter, |
| Zone* zone) { |
| LoopTree* loop_tree = |
| graph->zone()->New<LoopTree>(graph->NodeCount(), graph->zone()); |
| LoopFinderImpl finder(graph, loop_tree, tick_counter, zone); |
| finder.Run(); |
| if (FLAG_trace_turbo_loop) { |
| finder.Print(); |
| } |
| return loop_tree; |
| } |
| |
| Node* LoopTree::HeaderNode(Loop* loop) { |
| Node* first = *HeaderNodes(loop).begin(); |
| if (first->opcode() == IrOpcode::kLoop) return first; |
| DCHECK(IrOpcode::IsPhiOpcode(first->opcode())); |
| Node* header = NodeProperties::GetControlInput(first); |
| DCHECK_EQ(IrOpcode::kLoop, header->opcode()); |
| return header; |
| } |
| |
| } // namespace compiler |
| } // namespace internal |
| } // namespace v8 |