Package org.apache.drill.exec.planner.sql.logical

Source Code of org.apache.drill.exec.planner.sql.logical.HivePushPartitionFilterIntoScan

/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.drill.exec.planner.sql.logical;

import java.util.LinkedList;
import java.util.List;

import org.apache.drill.common.exceptions.DrillRuntimeException;
import org.apache.drill.common.exceptions.ExecutionSetupException;
import org.apache.drill.exec.physical.base.GroupScan;
import org.apache.drill.exec.planner.logical.DirPathBuilder;
import org.apache.drill.exec.planner.logical.DrillFilterRel;
import org.apache.drill.exec.planner.logical.DrillProjectRel;
import org.apache.drill.exec.planner.logical.DrillRel;
import org.apache.drill.exec.planner.logical.DrillScanRel;
import org.apache.drill.exec.planner.logical.PartitionPruningUtil;
import org.apache.drill.exec.planner.logical.RelOptHelper;
import org.apache.drill.exec.planner.sql.HivePartitionDescriptor;
import org.apache.drill.exec.store.StoragePluginOptimizerRule;
import org.apache.drill.exec.store.hive.HiveReadEntry;
import org.apache.drill.exec.store.hive.HiveScan;
import org.apache.drill.exec.store.hive.HiveTable;
import org.apache.drill.exec.store.hive.HiveTable.HivePartition;
import org.eigenbase.relopt.RelOptRuleCall;
import org.eigenbase.relopt.RelOptRuleOperand;

import com.google.common.collect.Lists;

public abstract class HivePushPartitionFilterIntoScan extends StoragePluginOptimizerRule {

  public static final StoragePluginOptimizerRule HIVE_FILTER_ON_PROJECT =
      new HivePushPartitionFilterIntoScan(
          RelOptHelper.some(DrillFilterRel.class, RelOptHelper.some(DrillProjectRel.class, RelOptHelper.any(DrillScanRel.class))),
          "HivePushPartitionFilterIntoScan:Filter_On_Project") {

        @Override
        public boolean matches(RelOptRuleCall call) {
          final DrillScanRel scan = (DrillScanRel) call.rel(2);
          GroupScan groupScan = scan.getGroupScan();
          return groupScan instanceof HiveScan &&  groupScan.supportsPartitionFilterPushdown();
        }

        @Override
        public void onMatch(RelOptRuleCall call) {
          final DrillFilterRel filterRel = (DrillFilterRel) call.rel(0);
          final DrillProjectRel projectRel = (DrillProjectRel) call.rel(1);
          final DrillScanRel scanRel = (DrillScanRel) call.rel(2);
          doOnMatch(call, filterRel, projectRel, scanRel);
        }
      };

  public static final StoragePluginOptimizerRule HIVE_FILTER_ON_SCAN =
      new HivePushPartitionFilterIntoScan(
          RelOptHelper.some(DrillFilterRel.class, RelOptHelper.any(DrillScanRel.class)),
          "HivePushPartitionFilterIntoScan:Filter_On_Scan") {

        @Override
        public boolean matches(RelOptRuleCall call) {
          final DrillScanRel scan = (DrillScanRel) call.rel(1);
          GroupScan groupScan = scan.getGroupScan();
          return groupScan instanceof HiveScan &&  groupScan.supportsPartitionFilterPushdown();
        }

        @Override
        public void onMatch(RelOptRuleCall call) {
          final DrillFilterRel filterRel = (DrillFilterRel) call.rel(0);
          final DrillScanRel scanRel = (DrillScanRel) call.rel(1);
          doOnMatch(call, filterRel, null, scanRel);
        }
      };

  private HivePushPartitionFilterIntoScan(
      RelOptRuleOperand operand,
      String id) {
    super(operand, id);
  }

  private HiveReadEntry splitFilter(HiveReadEntry origReadEntry, DirPathBuilder builder) {
    HiveTable table = origReadEntry.table;
    List<HivePartition> partitions = origReadEntry.partitions;
    List<HivePartition> newPartitions = new LinkedList<>();
    String pathPrefix = PartitionPruningUtil.truncatePrefixFromPath(table.getTable().getSd().getLocation());
    List<String> newFiles = Lists.newArrayList();
    List<String> dirPathList = builder.getDirPath();

    for (String dirPath : dirPathList) {
      String fullPath = pathPrefix + dirPath;
      // check containment of this path in the list of files
      for (HivePartition part: partitions) {
        String origFilePath = origReadEntry.getPartitionLocation(part);
        String origFileName = PartitionPruningUtil.truncatePrefixFromPath(origFilePath);

        if (origFileName.startsWith(fullPath)) {
          newFiles.add(origFileName);
          newPartitions.add(part);
        }
      }
    }

    if (newFiles.size() > 0) {
      HiveReadEntry newReadEntry = new HiveReadEntry(table, newPartitions, origReadEntry.hiveConfigOverride);
      return newReadEntry;
    }
    return origReadEntry;
  }

  protected void doOnMatch(RelOptRuleCall call, DrillFilterRel filterRel, DrillProjectRel projectRel, DrillScanRel scanRel) {
    DrillRel inputRel = projectRel != null ? projectRel : scanRel;
    HiveReadEntry origReadEntry = ((HiveScan)scanRel.getGroupScan()).hiveReadEntry;
    DirPathBuilder builder = new DirPathBuilder(filterRel, inputRel, filterRel.getCluster().getRexBuilder(), new HivePartitionDescriptor(origReadEntry.table.partitionKeys));
    HiveReadEntry newReadEntry = splitFilter(origReadEntry, builder);

    if (origReadEntry == newReadEntry) {
      return; // no directory filter was pushed down
    }

    try {
      HiveScan oldScan = (HiveScan) scanRel.getGroupScan();
      HiveScan hiveScan = new HiveScan(newReadEntry, oldScan.storagePlugin, oldScan.columns);
      PartitionPruningUtil.rewritePlan(call, filterRel, projectRel, scanRel, hiveScan, builder);
    } catch (ExecutionSetupException e) {
      throw new DrillRuntimeException(e);
    }

  }
}
TOP

Related Classes of org.apache.drill.exec.planner.sql.logical.HivePushPartitionFilterIntoScan

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.