// Source Code of havlakloopfinder.HavlakLoopFinder

// Copyright 2011 Google Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.


//======================================================
// Main Algorithm
//======================================================


/**
 * The Havlak loop finding algorithm.
 *
 * @author rhundt
 */
package havlakloopfinder;


import cfg.BasicBlock;
import cfg.CFG;


import lsg.LSG;
import lsg.SimpleLoop;


import java.util.*;


/**
 * class HavlakLoopFinder
 *
 * This class encapsulates the complete finder algorithm
 */
public class HavlakLoopFinder {


  public HavlakLoopFinder(CFG cfg, LSG lsg) {
    this.cfg = cfg;
    this.lsg = lsg;
  }


  public long getMaxMillis() {
    return maxMillis;
  }


  public long getMinMillis() {
    return minMillis;
  }


  /**
   * enum BasicBlockClass
   *
   * Basic Blocks and Loops are being classified as regular, irreducible,
   * and so on. This enum contains a symbolic name for all these
   * classifications.
   *
   * findLoops() stores one of these values per DFS number in its type[]
   * array. The declaration order is left untouched because reordering would
   * change the constants' ordinals.
   */
  public enum BasicBlockClass {
    /** Uninitialized. Not assigned anywhere in this file. */
    BB_TOP,          // uninitialized
    /** A regular basic block; the initial classification of every node. */
    BB_NONHEADER,    // a regular BB
    /** Header of a loop that was reached through at least one backedge from another node. */
    BB_REDUCIBLE,    // reducible loop
    /** Node with a backedge to itself (single basic block loop). */
    BB_SELF,         // single BB loop
    /** Header of a loop that has an entry avoiding the header. */
    BB_IRREDUCIBLE,  // irreducible loop
    /** Slot whose node was never reached by the depth-first traversal. */
    BB_DEAD,         // a dead BB
    /** Sentinel. Not assigned anywhere in this file. */
    BB_LAST          // Sentinel
  }




  /**
   * class UnionFindNode
   *
   * The algorithm uses the Union/Find algorithm to collapse
   * complete loops into a single node. These nodes and the
   * corresponding functionality are implemented with this class
   */
  public class UnionFindNode {


    public UnionFindNode() {
    }


    // Initialize this node.
    //
    public void initNode(BasicBlock bb, int dfsNumber) {
      this.parent     = this;
      this.bb         = bb;
      this.dfsNumber  = dfsNumber;
      this.loop       = null;
    }


    // Union/Find Algorithm - The find routine.
    //
    // Implemented with Path Compression (inner loops are only
    // visited and collapsed once, however, deep nests would still
    // result in significant traversals).
    //
    public UnionFindNode findSet() {


      List<UnionFindNode> nodeList = new ArrayList<UnionFindNode>(2);


      UnionFindNode node = this;
      while (node != node.getParent()) {
        if (node.getParent() != node.getParent().getParent()) {
          nodeList.add(node);
        }
        node = node.getParent();
      }


      // Path Compression, all nodes' parents point to the 1st level parent.
      int len = nodeList.size();
      for (int i = 0; i < len; i++) {
      // for (UnionFindNode iter : nodeList)
        UnionFindNode iter = nodeList.get(i);
        iter.setParent(node.getParent());
      }
      return node;
    }


    // Union/Find Algorithm - The union routine.
    //
    // Trivial. Assigning parent pointer is enough,
    // we rely on path compression.
    //
    void union(UnionFindNode basicBlock) {
      setParent(basicBlock);
    }


    // Getters/Setters
    //
    UnionFindNode getParent() {
      return parent;
    }
    BasicBlock    getBb() {
      return bb;
    }
    SimpleLoop    getLoop() {
      return loop;
    }
    int           getDfsNumber() {
      return dfsNumber;
    }


    void          setParent(UnionFindNode parent) {
      this.parent = parent;
    }
    void          setLoop(SimpleLoop loop) {
      this.loop = loop;
    }


    private UnionFindNode parent;
    private BasicBlock    bb;
    private SimpleLoop    loop;
    private int           dfsNumber;
  }


  //
  // Constants
  //
  // Marker for uninitialized nodes. findLoops() stores this value in the
  // 'number' map for every basic block before the depth-first traversal;
  // blocks that still map to it afterwards were never reached.
  static final int UNVISITED = Integer.MAX_VALUE;


  // Safeguard against pathologic algorithm behavior. findLoops() returns
  // early when a node's set of non-back predecessors grows beyond this size.
  static final int MAXNONBACKPREDS = (32 * 1024);


  //
  // IsAncestor
  //
  // As described in the paper, determine whether a node 'w' is a
  // "true" ancestor for node 'v'.
  //
  // Dominance can be tested quickly using a pre-order trick
  // for depth-first spanning trees. This is why DFS is the first
  // thing we run below.
  //
  boolean isAncestor(int w, int v, int[] last) {
    return ((w <= v) && (v <= last[w]));
  }


  static class IntegerSet implements Iterable<Integer> {
    int[] arr;
    int size;
    static int total = 0;
    static int resize = 0;
    static {
      Runtime.getRuntime().addShutdownHook(new Thread() {
          @Override public void run() {
            System.out.println(total + " = total");
            System.out.println(resize + " = resize");
          }
        });
    }
    IntegerSet() {
      total++;
      arr = new int[2];
      size = 0;
    }
    boolean add(int e) {
      for (int i = 0; i < size; i++) {
        if (arr[i] == e) {
          return false;
        }
      }
      if (size == arr.length) {
        resize++;
        int[] old = arr;
        arr = new int[arr.length << 1];
        System.arraycopy(old, 0, arr, 0, old.length);
      }
      arr[size] = e;
      size++;
      return true;
    }


    int size() { return size; }
    @Override public Iterator<Integer> iterator() {
      return new Iterator<Integer>() {
        int curr = 0;
        @Override public boolean hasNext() {
          return curr != size;
        }
        @Override public Integer next() {
          return arr[curr++];
        }
        @Override public void remove() {
          throw new UnsupportedOperationException();
        }
      };
    }
    IntegerSet clear() {size = 0; return this;}
  }


  static class IntegerList implements Iterable<Integer> {
    int[] arr;
    int size;
    static int total = 0;
    static int resize = 0;
    static {
      Runtime.getRuntime().addShutdownHook(new Thread() {
          @Override public void run() {
            System.out.println(total + " = total");
            System.out.println(resize + " = resize");
          }
        });
    }
    IntegerList() {
      total++;
      arr = new int[2];
      size = 0;
    }
    IntegerList clear() {size = 0; return this;}
    int get(int i) {
      return arr[i];
    }
    boolean add(int e) {
      if (size == arr.length) {
        resize++;
        int[] old = arr;
        arr = new int[arr.length << 1];
        System.arraycopy(old, 0, arr, 0, old.length);
      }
      arr[size] = e;
      size++;
      return true;
    }


    int size() { return size; }
    @Override public Iterator<Integer> iterator() {
      return new Iterator<Integer>() {
        int curr = 0;
        @Override public boolean hasNext() {
          return curr != size;
        }
        @Override public Integer next() {
          return arr[curr++];
        }
        @Override public void remove() {
          throw new UnsupportedOperationException();
        }
      };
    }
  }


  //
  // DFS - Depth-First-Search
  //
  // DESCRIPTION:
  // Simple depth first traversal along out edges with node numbering.
  //
  int doDFS(BasicBlock             currentNode,
            UnionFindNode[]          nodes,
            Map<BasicBlock, Integer> number,
            int[]                    last,
            final int current) {
    nodes[current].initNode(currentNode, current);
    number.put(currentNode, current);


    int lastid = current;
    // for (BasicBlock target : currentNode.getOutEdges()) {
    int len = currentNode.getOutEdges().size();
    for (int i = 0; i < len; i++) {
      BasicBlock target = currentNode.getOutEdges().get(i);
      if (number.get(target) == UNVISITED) {
        lastid = doDFS(target, nodes, number, last, lastid + 1);
      }
    }
    last[number.get(currentNode)] = lastid;
    return lastid;
  }


  // Working state of findLoops(). All of it is static, i.e. shared by every
  // HavlakLoopFinder instance and reused from one findLoops() call to the
  // next. NOTE(review): no synchronization is visible in this file, so
  // concurrent findLoops() calls would presumably interfere - confirm
  // before using from multiple threads.

  // Per DFS number: DFS numbers of predecessors reached via non-backedges.
  static List<IntegerSet>       nonBackPreds = new ArrayList<IntegerSet>(2);
  // Per DFS number: DFS numbers of predecessors reached via backedges.
  static List<IntegerList>      backPreds = new ArrayList<IntegerList>(2);
  // Basic block -> DFS number (UNVISITED until the traversal reaches it).
  static Map<BasicBlock, Integer> number = new HashMap<BasicBlock, Integer>();
  // Length of the arrays below; they are reallocated only when a larger CFG arrives.
  static int                      maxSize = 0;
  // Per DFS number: DFS number of the loop header the node was merged into.
  static int[]                    header;
  // Per DFS number: classification of the node.
  static BasicBlockClass[]        type;
  // Per DFS number: highest DFS number inside the node's DFS subtree.
  static int[]                    last;
  // Per DFS number: the Union/Find node for that basic block.
  static UnionFindNode[]          nodes;
  // Pools of sets/lists handed back at the end of findLoops() for reuse.
  static LinkedList<IntegerSet> freeListSet = new LinkedList<IntegerSet>();
  static LinkedList<IntegerList> freeListList = new LinkedList<IntegerList>();




  //
  // findLoops
  //
  // Find loops and build loop forest using Havlak's algorithm, which
  // is derived from Tarjan. Variable names and step numbering have
  // been chosen to be identical to the nomenclature in Havlak's
  // paper (which, in turn, is similar to the one used by Tarjan).
  //
  // Outline:
  //   - return immediately if the CFG has no start basic block;
  //   - reset the shared static working state and size it for this CFG;
  //   - Step a: number the blocks with a depth-first traversal;
  //   - Step b: split every node's predecessors into backedge and
  //     non-backedge sources;
  //   - Steps c-e: visit the nodes in reverse DFS order, collect each
  //     loop body, classify the header and register a SimpleLoop with
  //     the LSG;
  //   - update the min/max timing statistics and hand the per-node
  //     sets and lists back to the free lists.
  //
  // All working state lives in static fields, so it is shared between
  // instances and calls.
  //
  public void findLoops() {
    // Nothing to analyze without an entry block.
    if (cfg.getStartBasicBlock() == null) {
      return;
    }


    long                     startMillis = System.currentTimeMillis();


    int                      size = cfg.getNumNodes();


    // Reset the shared collections; the arrays are reallocated only when
    // this CFG is larger than any seen before, otherwise they are reused
    // and only their first 'size' slots are touched.
    nonBackPreds.clear();
    backPreds.clear();
    number.clear();
    if (size > maxSize) {
      header = new int[size];
      type = new BasicBlockClass[size];
      last = new int[size];
      nodes = new UnionFindNode[size];
      maxSize = size;
    }
    /*
    Former per-call allocation, replaced by the reused static state above:

    List<Set<Integer>>       nonBackPreds = new ArrayList<Set<Integer>>();
    List<List<Integer>>      backPreds = new ArrayList<List<Integer>>();


    Map<BasicBlock, Integer> number = new HashMap<BasicBlock, Integer>();
    int[]                    header = new int[size];
    BasicBlockClass[]        type = new BasicBlockClass[size];
    int[]                    last = new int[size];
    UnionFindNode[]          nodes = new UnionFindNode[size];
    */


    // One predecessor set/list and one fresh Union/Find node per slot.
    // Sets and lists are taken from the free lists when available (and
    // cleared), otherwise newly allocated.
    for (int i = 0; i < size; ++i) {
      nonBackPreds.add(freeListSet.size() == 0 ? new IntegerSet() : freeListSet.removeFirst().clear());
      backPreds.add(freeListList.size() == 0 ? new IntegerList() : freeListList.removeFirst().clear());
      nodes[i] = new UnionFindNode();
    }


    // Step a:
    //   - initialize all nodes as unvisited.
    //   - depth-first traversal and numbering.
    //   - unreached BB's are marked as dead.
    //
    for (BasicBlock bbIter : cfg.getBasicBlocks().values()) {
      number.put(bbIter, UNVISITED);
    }


    doDFS(cfg.getStartBasicBlock(), nodes, number, last, 0);


    // Step b:
    //   - iterate over all nodes.
    //
    //   A backedge comes from a descendant in the DFS tree, and non-backedges
    //   from non-descendants (following Tarjan).
    //
    //   - check incoming edges 'v' and add them to either
    //     - the list of backedges (backPreds) or
    //     - the list of non-backedges (nonBackPreds)
    //
    for (int w = 0; w < size; w++) {
      header[w] = 0;
      type[w] = BasicBlockClass.BB_NONHEADER;


      // Slots the traversal never initialized still have a null block.
      BasicBlock nodeW = nodes[w].getBb();
      if (nodeW == null) {
        type[w] = BasicBlockClass.BB_DEAD;
        continue;  // dead BB
      }


      if (nodeW.getNumPred() > 0) {
        int len1 = nodeW.getInEdges().size();
        for (int i = 0; i < len1; i++) {
          // for (BasicBlock nodeV : nodeW.getInEdges()) {
          BasicBlock nodeV = nodeW.getInEdges().get(i);
          int v = number.get(nodeV);
          if (v == UNVISITED) {
            continue;  // dead node
          }


          // v inside w's DFS subtree => the edge v -> w is a backedge.
          if (isAncestor(w, v, last)) {
            backPreds.get(w).add(v);
          } else {
            nonBackPreds.get(w).add(v);
          }
        }
      }
    }


    // Start node is root of all other loops.
    header[0] = 0;


    // Step c:
    //
    // The outer loop, unchanged from Tarjan. It does nothing except
    // for those nodes which are the destinations of backedges.
    // For a header node w, we chase backward from the sources of the
    // backedges adding nodes to the set P, representing the body of
    // the loop headed by w.
    //
    // By running through the nodes in reverse of the DFST preorder,
    // we ensure that inner loop headers will be processed before the
    // headers for surrounding loops.
    //
    for (int w = size - 1; w >= 0; w--) {
      // this is 'P' in Havlak's paper
      LinkedList<UnionFindNode> nodePool = new LinkedList<UnionFindNode>();


      BasicBlock  nodeW = nodes[w].getBb();
      if (nodeW == null) {
        continue;  // dead BB
      }


      // Step d:
      // Seed P with the set representatives of the backedge sources; a
      // backedge from w to itself marks w as a self loop instead.
      int len = backPreds.get(w).size();
      for (int i = 0; i < len; i++) {
        int v = backPreds.get(w).get(i);
           // for (int v : backPreds.get(w)) {
        if (v != w) {
          nodePool.add(nodes[v].findSet());
        } else {
          type[w] = BasicBlockClass.BB_SELF;
        }
      }


      // Copy nodePool to workList.
      //
      LinkedList<UnionFindNode> workList = new LinkedList<UnionFindNode>();


      for (UnionFindNode niter : nodePool)
        workList.add(niter);


      // Any backedge source other than w itself makes w a loop header;
      // this overrides a BB_SELF mark set above.
      if (nodePool.size() != 0) {
        type[w] = BasicBlockClass.BB_REDUCIBLE;
      }


      // work the list...
      //
      while (!workList.isEmpty()) {
        UnionFindNode x = workList.getFirst();
        workList.removeFirst();


        // Step e:
        //
        // Step e represents the main difference from Tarjan's method.
        // Chasing upwards from the sources of a node w's backedges. If
        // there is a node y' that is not a descendant of w, w is marked
        // the header of an irreducible loop, there is another entry
        // into this loop that avoids w.
        //


        // The algorithm has degenerated. Break and
        // return in this case.
        //
        // NOTE(review): this return leaves findLoops() without updating
        // the timing statistics and without handing the per-node sets and
        // lists back to the free lists.
        //
        int nonBackSize = nonBackPreds.get(x.getDfsNumber()).size();
        if (nonBackSize > MAXNONBACKPREDS) {
          return;
        }


        // Index-based walk over the set's backing array. 'curr' can be the
        // very set that the loop body appends to below (when x is w's own
        // node); the bound re-reads curr.size on every iteration.
        IntegerSet curr = nonBackPreds.get(x.getDfsNumber());
        for (int i = 0; i < curr.size; i++) {
          int iter = curr.arr[i];
          UnionFindNode  y = nodes[iter];
          UnionFindNode  ydash = y.findSet();


          if (!isAncestor(w, ydash.getDfsNumber(), last)) {
            // Entry from outside w's DFS subtree: the loop is irreducible
            // and the outside source becomes a non-back predecessor of w.
            type[w] = BasicBlockClass.BB_IRREDUCIBLE;
            nonBackPreds.get(w).add(ydash.getDfsNumber());
          } else {
            if (ydash.getDfsNumber() != w) {
              // contains() on a LinkedList is a linear scan.
              if (!nodePool.contains(ydash)) {
                workList.add(ydash);
                nodePool.add(ydash);
              }
            }
          }
        }
      }


      // Collapse/Unionize nodes in a SCC to a single node
      // For every SCC found, create a loop descriptor and link it in.
      //
      if ((nodePool.size() > 0) || (type[w] == BasicBlockClass.BB_SELF)) {
        SimpleLoop loop = lsg.createNewLoop();


        loop.setHeader(nodeW);
        loop.setIsReducible(type[w] != BasicBlockClass.BB_IRREDUCIBLE);


        // At this point, one can set attributes to the loop, such as:
        //
        // the bottom node:
        //    iter  = backPreds[w].begin();
        //    loop bottom is: nodes[iter].node);
        //
        // the number of backedges:
        //    backPreds[w].size()
        //
        // whether this loop is reducible:
        //    type[w] != BasicBlockClass.BB_IRREDUCIBLE
        //
        nodes[w].setLoop(loop);


        for (UnionFindNode node : nodePool) {
          // Add nodes to loop descriptor.
          header[node.getDfsNumber()] = w;
          node.union(nodes[w]);


          // Nested loops are not added, but linked together.
          if (node.getLoop() != null) {
            node.getLoop().setParent(loop);
          } else {
            loop.addNode(node.getBb());
          }
        }


        lsg.addLoop(loop);
      }  // nodePool.size
    }  // Step c


    // Fold this run's wall-clock duration into the shared min/max statistics.
    long totalMillis = System.currentTimeMillis() - startMillis;


    if (totalMillis > maxMillis) {
      maxMillis = totalMillis;
    }
    if (totalMillis < minMillis) {
      minMillis = totalMillis;
    }
    // Hand the per-node sets and lists back to the free lists for the next
    // call and replace the used Union/Find nodes with blank ones.
    for (int i = 0; i < size; ++i) {
      freeListSet.add(nonBackPreds.get(i));
      freeListList.add(backPreds.get(i));
      nodes[i] = new UnionFindNode();
    }
  }  // findLoops


  // Per-instance inputs/outputs, set once by the constructor.
  private CFG cfg;      // Control Flow Graph
  private LSG lsg;      // Loop Structure Graph


  // Longest and shortest findLoops() run time in milliseconds. Both are
  // static, i.e. shared by all instances.
  // NOTE(review): minMillis is a long but starts at Integer.MAX_VALUE, not
  // Long.MAX_VALUE; getMinMillis() returns that value until a run is timed.
  private static long maxMillis = 0;
  private static long minMillis = Integer.MAX_VALUE;




}
// Source Code of havlakloopfinder.HavlakLoopFinder

// Related Classes of havlakloopfinder.HavlakLoopFinder