/*

   Derby - Class org.apache.derby.impl.sql.compile.GroupByNode

   Copyright 1998, 2004 The Apache Software Foundation or its licensors, as applicable.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

      http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

*/

package  org.apache.derby.impl.sql.compile;

import org.apache.derby.iapi.services.context.ContextManager;

import org.apache.derby.iapi.store.access.ColumnOrdering;

import org.apache.derby.iapi.sql.compile.AccessPath;
import org.apache.derby.iapi.sql.compile.Optimizable;
import org.apache.derby.iapi.sql.compile.OptimizableList;
import org.apache.derby.iapi.sql.compile.OptimizablePredicate;
import org.apache.derby.iapi.sql.compile.OptimizablePredicateList;
import org.apache.derby.iapi.sql.compile.Optimizer;
import org.apache.derby.iapi.sql.compile.CostEstimate;
import org.apache.derby.iapi.sql.compile.Visitable;
import org.apache.derby.iapi.sql.compile.Visitor;
import org.apache.derby.iapi.sql.compile.RequiredRowOrdering;
import org.apache.derby.iapi.sql.compile.RowOrdering;
import org.apache.derby.iapi.sql.compile.C_NodeTypes;

import org.apache.derby.iapi.sql.conn.LanguageConnectionContext;
import org.apache.derby.iapi.reference.ClassName;

import org.apache.derby.iapi.sql.dictionary.DataDictionary;
import org.apache.derby.iapi.sql.dictionary.DataDictionaryContext;
import org.apache.derby.iapi.sql.dictionary.ConglomerateDescriptor;
import org.apache.derby.catalog.IndexDescriptor;

import org.apache.derby.iapi.sql.execute.ExecutionContext;

import org.apache.derby.iapi.sql.Activation;
import org.apache.derby.iapi.sql.LanguageFactory;
import org.apache.derby.iapi.sql.ResultColumnDescriptor;
import org.apache.derby.iapi.sql.ResultSet;

import org.apache.derby.iapi.error.StandardException;

import org.apache.derby.impl.sql.compile.ActivationClassBuilder;
import org.apache.derby.impl.sql.execute.AggregatorInfo;
import org.apache.derby.impl.sql.execute.AggregatorInfoList;

import org.apache.derby.iapi.services.compiler.MethodBuilder;

import org.apache.derby.iapi.services.sanity.SanityManager;

import org.apache.derby.iapi.services.io.FormatableArrayHolder;
import org.apache.derby.iapi.util.JBitSet;

import org.apache.derby.impl.sql.compile.MaxMinAggregateDefinition;
import org.apache.derby.iapi.services.classfile.VMOpcode;

import java.util.Vector;
import java.util.Properties;


/**
* A GroupByNode represents a result set for a grouping operation
* on a select.  Note that this includes a SELECT with aggregates
* and no grouping columns (in which case the select list is null).
* It has the same description as its input result set.
* <p>
* For the most part, it simply delegates operations to its bottomPRSet,
* which is currently expected to be a ProjectRestrictResultSet generated
* for a SelectNode.
* <p>
* NOTE: A GroupByNode extends FromTable since it can exist in a FromList.
* <p>
* There is a lot of room for optimizations here: <UL>
* <LI> agg(distinct x) group by x => agg(x) group by x (for min and max) </LI>
* <LI> min()/max() use index scans if possible, no sort may
*    be needed. </LI>
* </UL>
*
* @author jerry, aggregates by jamie
*
*/
public class GroupByNode extends SingleChildResultSetNode
{
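  /*
  ** Illustrative sketch (not part of the original comments): for a query such as
  **
  **   SELECT dept, MAX(salary) FROM emp GROUP BY dept
  **
  ** init()/addAggregates() rearrange the tree roughly as
  **
  **   ProjectRestrictNode   (parent - carries the original select list)
  **        |
  **   GroupByNode           (this node - groups rows and drives the aggregators)
  **        |
  **   ProjectRestrictNode   (childResult - the PRN generated for the SelectNode)
  **
  ** The node roles are taken from the comments in this class; the query text
  ** and column names are only an example.
  */
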
  /**
   * The GROUP BY list
   */
  GroupByList groupingList;

  /**
   * The list of all aggregates in the query block
   * that contains this group by.
   */
  Vector  aggregateVector;

  /**
   * Information that is used at execution time to
   * process aggregates.
   */
  private AggregatorInfoList  aggInfo;

  /**
   * The parent to the GroupByNode.  If we need to
   * generate a ProjectRestrict over the group by
   * then this is set to that node.  Otherwise it
   * is null.
   */
  FromTable  parent;

  private boolean  addDistinctAggregate;
  private boolean singleInputRowOptimization;
  private int    addDistinctAggregateColumnNum;

  // Is the source in sorted order
  private boolean isInSortedOrder;

  /**
   * Initializer for a GroupByNode.
   *
   * @param bottomPR  The child FromTable
   * @param groupingList  The groupingList
   * @param aggregateVector  The vector of aggregates from
   *    the query block.  Since aggregation is done
   *    at the same time as grouping, we need them
   *    here.
   * @param tableProperties  Properties list associated with the table
   *
   * @exception StandardException    Thrown on error
   */
  public void init(
            Object  bottomPR,
            Object groupingList,
            Object  aggregateVector,
            Object tableProperties)
      throws StandardException
  {
    super.init(bottomPR, tableProperties);

    /* Group by without aggregates gets xformed into distinct */
    if (SanityManager.DEBUG)
    {
      SanityManager.ASSERT(((Vector) aggregateVector).size() > 0,
        "aggregateVector expected to be non-empty");
      if (!(childResult instanceof Optimizable))
      {
        SanityManager.THROWASSERT("childResult, " + childResult.getClass().getName() +
          ", expected to be instanceof Optimizable");
      }
      if (!(childResult instanceof FromTable))
      {
        SanityManager.THROWASSERT("childResult, " + childResult.getClass().getName() +
          ", expected to be instanceof FromTable");
      }
    }

    ResultColumnList newBottomRCL;
    this.groupingList = (GroupByList) groupingList;
    this.aggregateVector = (Vector) aggregateVector;
    this.parent = this;

    /*
    ** The first thing we do is put ourselves on
    ** top of the SELECT.  The select becomes the
    ** childResult.  So our RCL becomes its RCL (so
    ** nodes above it now point to us).  Map our
    ** RCL to its columns.
    */
    newBottomRCL = childResult.getResultColumns().copyListAndObjects();
    resultColumns = childResult.getResultColumns();
    childResult.setResultColumns(newBottomRCL);
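
    /* After this swap, nodes above us that referenced the SELECT's result
     * columns now reference this GroupByNode, while the copied list
     * (newBottomRCL) becomes the childResult's own column list underneath us.
     */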

    /*
    ** We have aggregates, so we need to add
    ** an extra PRNode and we also have to muck around
    ** with our trees a bit.
    */
    addAggregates();

    /* We say that the source is never in sorted order if there is a distinct aggregate.
     * (Not sure what happens if it is, so just skip it for now.)
     * Otherwise, we check to see if the source is in sorted order on any permutation
     * of the grouping columns.
     */
    if (! addDistinctAggregate && groupingList != null)
    {
      ColumnReference[] crs =
                new ColumnReference[this.groupingList.size()];

      // Now populate the CR array and see if ordered
      int glSize = this.groupingList.size();
      for (int index = 0; index < glSize; index++)
      {
        GroupByColumn gc =
            (GroupByColumn) this.groupingList.elementAt(index);
        crs[index] = gc.getColumnReference();
      }

      isInSortedOrder = childResult.isOrderedOn(crs, true, (Vector)null);
    }
  }

  /**
   * Get whether or not the source is in sorted order.
   *
   * @return Whether or not the source is in sorted order.
   */
  boolean getIsInSortedOrder()
  {
    return isInSortedOrder;
  }

  /**
   * Add the extra result columns required by the aggregates
   * to the result list.
   *
   * @exception StandardException    Thrown on error
   */
  private void addAggregates()
    throws StandardException
  {
    addNewPRNode();
    addNewColumnsForAggregation();
    addDistinctAggregatesToOrderBy();
  }

  /**
   * Add any distinct aggregates to the order by list.
   * Asserts that there is at most one distinct aggregate.
   */
  private void addDistinctAggregatesToOrderBy()
  {
    int numDistinct = numDistinctAggregates(aggregateVector);
    if (numDistinct != 0)
    {
      if (SanityManager.DEBUG)
      {
        SanityManager.ASSERT(numDistinct == 1,
          "Should not have more than 1 distinct aggregate per Group By node");
      }
     
      AggregatorInfo agg = null;
      int count = aggInfo.size();
      for (int i = 0; i < count; i++)
      {
        agg = (AggregatorInfo) aggInfo.elementAt(i);
        if (agg.isDistinct())
        {
          break;
        }
      }

      if (SanityManager.DEBUG)
      {
        SanityManager.ASSERT(agg != null && agg.isDistinct());
      }

      addDistinctAggregate = true;
      addDistinctAggregateColumnNum = agg.getInputColNum();
    }
  }
 
  /**
   * Add a new PR node for aggregation.  Put the
   * new PR above the GroupBy (the sort).
   *
   * @exception StandardException    Thrown on error
   */
  private void addNewPRNode()
    throws StandardException
  {
    /*
    ** Get the new PR, put above the GroupBy. 
    */
    parent = (FromTable) getNodeFactory().getNode(
                    C_NodeTypes.PROJECT_RESTRICT_NODE,
                    this,   // child
                    resultColumns,    // result column list
                    null,        // restriction
                    null,        // restriction list
                    null,        // project subqueries
                    null,        // restrict subqueries
                    tableProperties,
                    getContextManager());


    /*
    ** Reset the bottom RCL to be empty.
    */
    childResult.setResultColumns((ResultColumnList)
                      getNodeFactory().getNode(
                        C_NodeTypes.RESULT_COLUMN_LIST,
                        getContextManager()));

    /*
    ** Set the group by RCL to be empty
    */
    resultColumns = (ResultColumnList) getNodeFactory().getNode(
                      C_NodeTypes.RESULT_COLUMN_LIST,
                      getContextManager());

  }


  /**
   * Add a whole slew of columns needed for
   * aggregation. Basically, for each aggregate we add
   * three columns: the aggregate result, the aggregate
   * input expression, and the aggregator column.  The input expression is
   * taken directly from the aggregator node.  The aggregator
   * is the run time aggregator.  We add it to the RC list
   * as a new object coming into the sort node.
   * <P>
   * At the point this is invoked, we have the following
   * tree: <UL>
   *      PR - (PARENT): RCL is the original select list
   *       |
   *      PR - GROUP BY:  RCL is empty
   *       |
   *      PR - FROM TABLE: RCL is empty </UL> <P>
   *
   * For each ColumnReference in the PR RCL: <UL>
   * <LI> clone the ref </LI>
   * <LI> create a new RC in the bottom RCL and set it
   *      to the col ref </LI>
   * <LI> create a new RC in the GROUP BY RCL and set it to
   *      point to the bottom RC </LI>
   * <LI> reset the top PR ref to point to the new GROUP BY
   *      RC </LI> </UL>
   *
   * For each aggregate in aggregateVector: <UL>
   * <LI> create RC in FROM TABLE.  Fill it with
   *      the agg's Operator. </LI>
   * <LI> create RC in FROM TABLE for agg result </LI>
   * <LI> create RC in FROM TABLE for aggregator </LI>
   * <LI> create RC in GROUP BY for agg input, set it
   *      to point to the FROM TABLE RC </LI>
   * <LI> create RC in GROUP BY for agg result </LI>
   * <LI> create RC in GROUP BY for aggregator </LI>
   * <LI> replace the agg with a reference to the RC for the agg result </LI> </UL>
   *
   * @exception StandardException    Thrown on error
   */
  private void addNewColumnsForAggregation()
    throws StandardException
  {
    /*
    ** Now we have two new nodes, the sort and a new PR above
    ** it.  They all map to the child result set.  Now we must
    ** find every aggregate and massage the tree.  For now we
    ** will examine every result column of the original select
    ** list.
    */
    DataDictionary      dd;
    AggregateNode  aggregate = null;
    ColumnReference  newColumnRef;
    ResultColumn  rcBottom;
    ResultColumn  newRC;
    ResultColumn  gbRC;
    ResultColumn  tmpRC;
    ResultColumn  aggInputRC;
    ResultColumnList bottomRCL  = childResult.getResultColumns();
    ResultColumnList groupByRCL = resultColumns;
    ResultColumnList aggRCL;
    int        aggregatorVColId;
    int        aggInputVColId;
    int        aggResultVColId;

    LanguageFactory lf = getLanguageConnectionContext().getLanguageFactory();
    dd = getDataDictionary();
    aggInfo = new AggregatorInfoList();

    /*
    ** Get a list of all column references in the
    ** parent RCL, skipping (not going below) AggregateNodes
    */
    CollectNodesVisitor getUnaggVisitor = new CollectNodesVisitor(ColumnReference.class, AggregateNode.class);
    parent.getResultColumns().accept(getUnaggVisitor);
    Vector colRefVector = getUnaggVisitor.getList();

    /*
    ** Walk the list of unaggregated column references
    ** and push them down.
    */
    int crvSize = colRefVector.size();
    for (int index = 0; index < crvSize; index++)
    {
      ColumnReference origColumnRef = (ColumnReference) colRefVector.elementAt(index);
      newColumnRef = (ColumnReference)origColumnRef.getClone();

      /*
      ** Put the column reference in the bottom PR.
      */
      newRC = (ResultColumn) getNodeFactory().getNode(
                  C_NodeTypes.RESULT_COLUMN,
                  "##UnaggColumn",
                  newColumnRef,
                  getContextManager());
      newRC.setExpression(newColumnRef);
      bottomRCL.addElement(newRC);
      newRC.markGenerated();
      newRC.bindResultColumnToExpression();
      newRC.setVirtualColumnId(bottomRCL.size());

      /*
      ** Reset the group by column position
      */
      if (groupingList != null)
      {
        GroupByColumn  gbColumn;
        if ((gbColumn =
            groupingList.containsColumnReference(newColumnRef))
          != null)
        {
          gbColumn.setColumnPosition(bottomRCL.size());
        }
      }
   
      /*
      ** Add the column to the group by list
      */
      gbRC = getColumnReference(newRC, dd);
      groupByRCL.addElement(gbRC);
      gbRC.markGenerated();
      gbRC.bindResultColumnToExpression();
      gbRC.setVirtualColumnId(groupByRCL.size());
 
      /*
      ** Reset the original node to point to the
      ** Group By result set.
      */
      origColumnRef.setSource(gbRC);
    }
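
    /* Each unaggregated column reference now flows from the bottom PRN through
     * the group-by RCL up to the original reference in the parent's RCL.
     */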
    /*
    ** Now process all of the aggregates.  Replace
    ** every aggregate with an RC.  We toss out
    ** the list of RCs, we need to get each RC
    ** as we process its corresponding aggregate.
    */
    ReplaceAggregatesWithCRVisitor replaceAggsVisitor =
      new ReplaceAggregatesWithCRVisitor(
          (ResultColumnList) getNodeFactory().getNode(
                    C_NodeTypes.RESULT_COLUMN_LIST,
                    getContextManager()),
          ((FromTable) childResult).getTableNumber());
    parent.getResultColumns().accept(replaceAggsVisitor);

    /*
    ** For each aggregate
    */
    int alSize = aggregateVector.size();
    for (int index = 0; index < alSize; index++)
    {
      aggregate = (AggregateNode) aggregateVector.elementAt(index);

      /*
      ** AGG RESULT: Set the aggregate result to null in the
      ** bottom project restrict.
      */
      newRC = (ResultColumn) getNodeFactory().getNode(
                    C_NodeTypes.RESULT_COLUMN,
                    "##aggregate result",
                    aggregate.getNewNullResultExpression(),
                    getContextManager());
      newRC.markGenerated();
      newRC.bindResultColumnToExpression();
      bottomRCL.addElement(newRC);
      newRC.setVirtualColumnId(bottomRCL.size());
      aggResultVColId = newRC.getVirtualColumnId();

      /*
      ** Set the GB aggregate result column to
      ** point to this.  The GB aggregate result
      ** was created when we applied the
      ** ReplaceAggregatesWithCRVisitor above.
      */
      newColumnRef = (ColumnReference) getNodeFactory().getNode(
                        C_NodeTypes.COLUMN_REFERENCE,
                        newRC.getName(),
                        null,
                        getContextManager());
      newColumnRef.setSource(newRC);
      newColumnRef.setType(newRC.getExpressionType());
      newColumnRef.setNestingLevel(this.getLevel());
      newColumnRef.setSourceLevel(this.getLevel());
      tmpRC = (ResultColumn) getNodeFactory().getNode(
                C_NodeTypes.RESULT_COLUMN,
                newRC.getColumnName(),
                newColumnRef,
                getContextManager());
      tmpRC.markGenerated();
      tmpRC.bindResultColumnToExpression();
      groupByRCL.addElement(tmpRC);
      tmpRC.setVirtualColumnId(groupByRCL.size());

      /*
      ** Set the column reference to point to
      ** this.
      */
      newColumnRef = aggregate.getGeneratedRef();
      newColumnRef.setSource(tmpRC);

      /*
      ** AGG INPUT: Create a ResultColumn in the bottom
      ** project restrict that has the expression that is
      ** to be aggregated
      */
      newRC = aggregate.getNewExpressionResultColumn(dd);
      newRC.markGenerated();
      newRC.bindResultColumnToExpression();
      bottomRCL.addElement(newRC);
      newRC.setVirtualColumnId(bottomRCL.size());
      aggInputVColId = newRC.getVirtualColumnId();
      aggInputRC = newRC;
 
      /*
      ** Add a reference to this column into the
      ** group by columns.
      */
      tmpRC = getColumnReference(newRC, dd);
      groupByRCL.addElement(tmpRC);
      tmpRC.setVirtualColumnId(groupByRCL.size());

      /*
      ** AGGREGATOR: Add a getAggregator method call
      ** to the bottom result column list.
      */
      newRC = aggregate.getNewAggregatorResultColumn(dd);
      newRC.markGenerated();
      newRC.bindResultColumnToExpression();
      bottomRCL.addElement(newRC);
      newRC.setVirtualColumnId(bottomRCL.size());
      aggregatorVColId = newRC.getVirtualColumnId();

      /*
      ** Add a reference to this column in the Group By result
      ** set.
      */
      tmpRC = getColumnReference(newRC, dd);
      groupByRCL.addElement(tmpRC);
      tmpRC.setVirtualColumnId(groupByRCL.size());

      /*
      ** Piece together a fake one column rcl that we will use
      ** to generate a proper result description for input
      ** to this agg if it is a user agg.
      */
      aggRCL = (ResultColumnList) getNodeFactory().getNode(
                      C_NodeTypes.RESULT_COLUMN_LIST,
                      getContextManager());
      aggRCL.addElement(aggInputRC);

      /*
      ** Note that the column ids in the row are 0 based
      ** so we have to subtract 1.
      */
      aggInfo.addElement(new AggregatorInfo(
              aggregate.getAggregateName(),
              aggregate.getAggregatorClassName(),
              aggInputVColId - 1,      // aggregate input column
              aggResultVColId -1,      // the aggregate result column
              aggregatorVColId - 1,    // the aggregator column 
              aggregate.isDistinct(),
              lf.getResultDescription(aggRCL.makeResultDescriptors(), "SELECT")
            ));
    }
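
    /* At this point each aggregate has contributed three generated columns to
     * both the bottom PRN and the group-by RCL (aggregate result, aggregate
     * input, and aggregator), and aggInfo records their zero-based positions
     * for use at execution time.
     */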
  }

  /**
   * Return the parent node to this one, if there is
   * one.  It will return 'this' if there is no generated
   * node above this one.
   *
   * @return the parent node
   */
  public FromTable getParent()
  {
    return parent;
  }


  /*
   *  Optimizable interface
   */

  /**
   * @see Optimizable#optimizeIt
   *
   * @exception StandardException    Thrown on error
   */
  public CostEstimate optimizeIt(
              Optimizer optimizer,
              OptimizablePredicateList predList,
              CostEstimate outerCost,
              RowOrdering rowOrdering)
      throws StandardException
  {
    // RESOLVE: NEED TO FACTOR IN THE COST OF GROUPING (SORTING) HERE
    CostEstimate childCost = ((Optimizable) childResult).optimizeIt(
                          optimizer,
                          predList,
                          outerCost,
                          rowOrdering);

    CostEstimate retval = super.optimizeIt(
                        optimizer,
                        predList,
                        outerCost,
                        rowOrdering
                        );

    return retval;
  }

  /**
   * @see Optimizable#estimateCost
   *
   * @exception StandardException    Thrown on error
   */
  public CostEstimate estimateCost(OptimizablePredicateList predList,
                    ConglomerateDescriptor cd,
                    CostEstimate outerCost,
                    Optimizer optimizer,
                    RowOrdering rowOrdering
                    )
      throws StandardException
  {
    // RESOLVE: NEED TO FACTOR IN THE COST OF GROUPING (SORTING) HERE
    //
    CostEstimate childCost = ((Optimizable) childResult).estimateCost(
                          predList,
                          cd,
                          outerCost,
                          optimizer,
                          rowOrdering);

    CostEstimate costEstimate = getCostEstimate(optimizer);
    costEstimate.setCost(childCost.getEstimatedCost(),
              childCost.rowCount(),
              childCost.singleScanRowCount());

    return costEstimate;
  }

  /**
   * @see org.apache.derby.iapi.sql.compile.Optimizable#pushOptPredicate
   *
   * @exception StandardException    Thrown on error
   */

  public boolean pushOptPredicate(OptimizablePredicate optimizablePredicate)
      throws StandardException
  {
    return ((Optimizable) childResult).pushOptPredicate(optimizablePredicate);
  }

  /**
   * Convert this object to a String.  See comments in QueryTreeNode.java
   * for how this should be done for tree printing.
   *
   * @return  This object as a String
   */

  public String toString()
  {
    if (SanityManager.DEBUG)
    {
      return "singleInputRowOptimization: " + singleInputRowOptimization + "\n" +
        childResult.toString() + "\n" + super.toString();
    }
    else
    {
      return "";
    }
  }

  /**
   * Evaluate whether or not the subquery in a FromSubquery is flattenable.
   * Currently, a FSqry is flattenable if all of the following are true:
   *    o  Subquery is a SelectNode.
   *    o  It contains no top level subqueries.  (RESOLVE - we can relax this)
   *    o  It does not contain a group by or having clause
   *    o  It does not contain aggregates.
   *
   * @param fromList  The outer from list
   *
   * @return boolean  Whether or not the FromSubquery is flattenable.
   */
  public boolean flattenableInFromSubquery(FromList fromList)
  {
    /* Can't flatten a GroupByNode */
    return false;
  }

  /**
   * Optimize this GroupByNode.
   *
   * @param dataDictionary  The DataDictionary to use for optimization
   * @param predicates    The PredicateList to optimize.  This should
   *              be a join predicate.
   * @param outerRows      The number of outer joining rows
   *
   * @return  ResultSetNode  The top of the optimized subtree
   *
   * @exception StandardException    Thrown on error
   */

  public ResultSetNode optimize(DataDictionary dataDictionary,
                  PredicateList predicates,
                  double outerRows)
          throws StandardException
  {
    /* We need to implement this method since a PRN can appear above a
     * SelectNode in a query tree.
     */
    childResult = (FromTable) childResult.optimize(
                      dataDictionary,
                      predicates,
                      outerRows);
    Optimizer optimizer = getOptimizer(
            (FromList) getNodeFactory().getNode(
                  C_NodeTypes.FROM_LIST,
                  getNodeFactory().doJoinOrderOptimization(),
                  getContextManager()),
            predicates,
            dataDictionary,
            (RequiredRowOrdering) null);

    // RESOLVE: NEED TO FACTOR IN COST OF SORTING AND FIGURE OUT HOW
    // MANY ROWS HAVE BEEN ELIMINATED.
    costEstimate = optimizer.newCostEstimate();

    costEstimate.setCost(childResult.getCostEstimate().getEstimatedCost(),
              childResult.getCostEstimate().rowCount(),
              childResult.getCostEstimate().singleScanRowCount());

    return this;
  }

  ResultColumnDescriptor[] makeResultDescriptors(ExecutionContext ec)
  {
      return childResult.makeResultDescriptors(ec);
  }

  /**
   * Return whether or not the underlying ResultSet tree will return
   * a single row, at most.
   * This is important for join nodes where we can save the extra next
   * on the right side if we know that it will return at most 1 row.
   *
   * @return Whether or not the underlying ResultSet tree will return a single row.
   * @exception StandardException    Thrown on error
   */
  public boolean isOneRowResultSet()  throws StandardException
  {
    // Only consider scalar aggregates for now
    return ((groupingList == null) ||  (groupingList.size() == 0));
  }

  /**
   * Generate the sort result set operating over the source
   * result set.  Adds distinct aggregates to the sort if
   * necessary.
   *
   * @exception StandardException    Thrown on error
   */
  public void generate(ActivationClassBuilder acb,
                MethodBuilder mb)
              throws StandardException
  {
    int          orderingItem = 0;
    int          aggInfoItem = 0;
    FormatableArrayHolder  orderingHolder;

    /* Get the next ResultSet#, so we can number this ResultSetNode, its
     * ResultColumnList and ResultSet.
     */
    assignResultSetNumber();

    // Get the cost estimate from the child if we don't have one yet
    if (costEstimate == null)
    {
      costEstimate = childResult.getFinalCostEstimate();
    }

    /*
    ** Get the column ordering for the sort.  Note that
    ** for a scalar aggregate we may not have any ordering
    ** columns (if there are no distinct aggregates).
    ** WARNING: if a distinct aggregate is passed to
    ** SortResultSet it assumes that the last column
    ** is the distinct one.  If this assumption changes
    ** then SortResultSet will have to change.
    */
    orderingHolder = acb.getColumnOrdering(groupingList);
    if (addDistinctAggregate)
    {
      orderingHolder = acb.addColumnToOrdering(
                  orderingHolder,
                  addDistinctAggregateColumnNum);
    }

    if (SanityManager.DEBUG)
    {
      if (SanityManager.DEBUG_ON("AggregateTrace"))
      {
        StringBuffer s = new StringBuffer();
         
        s.append("Group by column ordering is (");
        ColumnOrdering[] ordering =
            (ColumnOrdering[])orderingHolder.getArray(ColumnOrdering.class);

        for (int i = 0; i < ordering.length; i++)
        {
          s.append(ordering[i].getColumnId());
          s.append(" ");
        }
        s.append(")");
        SanityManager.DEBUG("AggregateTrace", s.toString());
      }
    }

    orderingItem = acb.addItem(orderingHolder);

    /*
    ** We have aggregates, so save the aggInfo
    ** struct in the activation and store the number
    */
    if (SanityManager.DEBUG)
    {
      SanityManager.ASSERT(aggInfo != null,
          "aggInfo not set up as expected");
    }
    aggInfoItem = acb.addItem(aggInfo);

    acb.pushGetResultSetFactoryExpression(mb);

    // Generate the child ResultSet
    childResult.generate(acb, mb);
    mb.push(isInSortedOrder);
    mb.push(aggInfoItem);
    mb.push(orderingItem);
    acb.pushThisAsActivation(mb);

    resultColumns.generateHolder(acb, mb);

    mb.push(resultColumns.getTotalColumnSize());
    mb.push(resultSetNumber);

    /* Generate a (Distinct)ScalarAggregateResultSet if scalar aggregates */
    if ((groupingList == null) ||  (groupingList.size() == 0))
    {
      genScalarAggregateResultSet(acb, mb);
    }
    /* Generate a (Distinct)GroupedAggregateResultSet if grouped aggregates */
    else
    {
      genGroupedAggregateResultSet(acb, mb);
    }
  }

  /**
   * Generate the code to evaluate scalar aggregates.
   *
   */
  private  void genScalarAggregateResultSet(ActivationClassBuilder acb,
                           MethodBuilder mb)
  {
    /* Generate the (Distinct)ScalarAggregateResultSet:
     *  arg1: childExpress - Expression for childResult
     *  arg2: isInSortedOrder - true if source result set in sorted order
     *  arg3: aggregateItem - entry in saved objects for the aggregates,
     *  arg4: orderItem - entry in saved objects for the ordering
     *  arg5: Activation
     *  arg6: rowAllocator - method to construct rows for fetching
     *      from the sort
     *  arg7: row size
     *  arg8: resultSetNumber
     *  arg9: Whether or not to perform min optimization.
     *  arg10: estimated row count
     *  arg11: estimated cost
     *  arg12: closeCleanup
     */
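
    /* A rough sketch (not generated verbatim) of the runtime call assembled
     * here and in generate() above, with the arguments in the order pushed:
     *
     *   rsFactory.getScalarAggregateResultSet(
     *       childResultSet, isInSortedOrder, aggInfoItem, orderingItem,
     *       activation, rowAllocator, rowSize, resultSetNumber,
     *       singleInputRowOptimization, rowCount, estimatedCost,
     *       closeCleanup);
     *
     * When addDistinctAggregate is true the method name below switches to
     * getDistinctScalarAggregateResultSet with the same arguments.
     */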
    String resultSet = (addDistinctAggregate) ? "getDistinctScalarAggregateResultSet" : "getScalarAggregateResultSet";

    mb.push(singleInputRowOptimization);
    mb.push(costEstimate.rowCount());
    mb.push(costEstimate.getEstimatedCost());

    closeMethodArgument(acb, mb);

    mb.callMethod(VMOpcode.INVOKEINTERFACE, (String) null, resultSet, ClassName.NoPutResultSet, 12);
  }

  /**
   * Generate the code to evaluate grouped aggregates.
   *
   */
  private  void genGroupedAggregateResultSet(ActivationClassBuilder acb,
                           MethodBuilder mb)
        throws StandardException
  {
    /* Generate the (Distinct)GroupedAggregateResultSet:
     *  arg1: childExpress - Expression for childResult
     *  arg2: isInSortedOrder - true if source result set in sorted order
     *  arg3: aggregateItem - entry in saved objects for the aggregates,
     *  arg4: orderItem - entry in saved objects for the ordering
     *  arg5: Activation
     *  arg6: rowAllocator - method to construct rows for fetching
     *      from the sort
     *  arg7: row size
     *  arg8: resultSetNumber
     *  arg9: estimated row count
     *  arg10: estimated cost
     *  arg11: closeCleanup
     */
    String resultSet = (addDistinctAggregate) ? "getDistinctGroupedAggregateResultSet" : "getGroupedAggregateResultSet";
   
    mb.push(costEstimate.rowCount());
    mb.push(costEstimate.getEstimatedCost());

    closeMethodArgument(acb, mb);

    mb.callMethod(VMOpcode.INVOKEINTERFACE, (String) null, resultSet, ClassName.NoPutResultSet, 11);

  }

  ///////////////////////////////////////////////////////////////
  //
  // UTILITIES
  //
  ///////////////////////////////////////////////////////////////
  /**
   * Method for creating a new result column referencing
   * the one passed in.
   *
   * @param  targetRC  the source
   * @param  dd        the DataDictionary
   *
   * @return the new result column
   *
   * @exception StandardException  on error
   */
  private ResultColumn getColumnReference(ResultColumn targetRC,
                DataDictionary    dd)
    throws StandardException
  {
    ColumnReference  tmpColumnRef;
    ResultColumn  newRC;
 
    tmpColumnRef = (ColumnReference) getNodeFactory().getNode(
                      C_NodeTypes.COLUMN_REFERENCE,
                      targetRC.getName(),
                      null,
                      getContextManager());
    tmpColumnRef.setSource(targetRC);
    tmpColumnRef.setType(targetRC.getExpressionType());
    tmpColumnRef.setNestingLevel(this.getLevel());
    tmpColumnRef.setSourceLevel(this.getLevel());
    newRC = (ResultColumn) getNodeFactory().getNode(
                  C_NodeTypes.RESULT_COLUMN,
                  targetRC.getColumnName(),
                  tmpColumnRef,
                  getContextManager());
    newRC.markGenerated();
    newRC.bindResultColumnToExpression();
    return newRC;
  }

  /**
   * Consider any optimizations after the optimizer has chosen a plan.
   * Optimizations include:
   *  o  min optimization for scalar aggregates
   *  o  max optimization for scalar aggregates
   *
   * @param selectHasPredicates true if SELECT containing this
   *    vector/scalar aggregate has a restriction
   *
   * @exception StandardException  on error
   */
  void considerPostOptimizeOptimizations(boolean selectHasPredicates)
    throws StandardException
  {
    /* Consider the optimization for min with asc index on that column or
     * max with desc index on that column:
     *  o  No group by
     *  o  One of:
     *    o  min/max(ColumnReference) is only aggregate && source is
     *       ordered on the ColumnReference
     *    o  min/max(ConstantNode)
     * The optimization of the other way around (min with desc index or
     * max with asc index) has the same restrictions with the additional
     * temporary restriction of no qualifications at all (because
     * we don't have true backward scans).
     */
    if (groupingList == null)
    {
      if (aggregateVector.size() == 1)
      {
        AggregateNode an = (AggregateNode) aggregateVector.elementAt(0);
        AggregateDefinition ad = an.getAggregateDefinition();
        if (ad instanceof MaxMinAggregateDefinition)
        {
          if (an.getOperand() instanceof ColumnReference)
          {
            /* See if the underlying ResultSet tree
             * is ordered on the ColumnReference.
             */
            ColumnReference[] crs = new ColumnReference[1];
            crs[0] = (ColumnReference) an.getOperand();
           
            Vector tableVector = new Vector();
            boolean minMaxOptimizationPossible = isOrderedOn(crs, false, tableVector);
            if (SanityManager.DEBUG)
            {
              SanityManager.ASSERT(tableVector.size() <= 1, "bad number of FromBaseTables returned by isOrderedOn() -- "+tableVector.size());
            }

            if (minMaxOptimizationPossible)
            {
              boolean ascIndex = true;
              int colNum = crs[0].getColumnNumber();
             
              /* Check if we have an access path, this will be
               * null in a join case (See Beetle 4423)
               */
              AccessPath accessPath= getTrulyTheBestAccessPath();
              if (accessPath == null)
                return;
              IndexDescriptor id = accessPath.
                        getConglomerateDescriptor().
                        getIndexDescriptor();
              int[] keyColumns = id.baseColumnPositions();
              boolean[] isAscending = id.isAscending();
              for (int i = 0; i < keyColumns.length; i++)
              {
                /* in such a query: select min(c3) from
                 * tab1 where c1 = 2 and c2 = 5, if prefix keys
                 * have equality operator, then we can still use
                 * the index.  The checking of equality operator
                 * has been done in isStrictlyOrderedOn.
                 */
                if (colNum == keyColumns[i])
                {
                  if (! isAscending[i])
                    ascIndex = false;
                  break;
                }
              }
              FromBaseTable fbt = (FromBaseTable)tableVector.firstElement();
              MaxMinAggregateDefinition temp = (MaxMinAggregateDefinition)ad;

              /*  MAX    ASC      NULLABLE
               *  -----  -------  ----------
               *  TRUE   TRUE     TRUE/FALSE  =  Special Last Key Scan (ASC Index Last key with null skips)
               *  TRUE   FALSE    TRUE/FALSE  =  JustDisableBulk (DESC index 1st key with null skips)
               *  FALSE  TRUE     TRUE/FALSE  =  JustDisableBulk (ASC index 1st key)
               *  FALSE  FALSE    TRUE/FALSE  =  Special Last Key Scan (DESC Index Last key)
               */
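
              /* Example (assumed schema): for
               *   SELECT MAX(c1) FROM t
               * with an ascending index on t(c1) and no predicates at all, the
               * second branch below turns on the special last-key scan, so the
               * store fetches the last index row rather than scanning the index.
               */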

              if (((!temp.isMax()) && ascIndex) ||
                ((temp.isMax()) && !ascIndex))
              {
                fbt.disableBulkFetch();
                singleInputRowOptimization = true;
              }
              /*
              ** Max optimization with asc index or min with
              ** desc index is currently more
              ** restrictive than otherwise.
              ** We are getting the store to return the last
              ** row from an index (for the time being, the
              ** store cannot do real backward scans).  SO
              ** we cannot do this optimization if we have
              ** any predicates at all.
              */
              else if (!selectHasPredicates &&
                   ((temp.isMax() && ascIndex) ||
                    (!temp.isMax() && !ascIndex )))
              {
                fbt.disableBulkFetch();
                fbt.doSpecialMaxScan();
                singleInputRowOptimization = true;
              }
            }
          }
          else if (an.getOperand() instanceof ConstantNode)
          {
            singleInputRowOptimization = true;
          }
        }
      }
    }
  }
}