Package org.apache.drill.exec.store.hive

Source Code of org.apache.drill.exec.store.hive.HiveScanBatchCreator

/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.store.hive;

import com.google.common.collect.Lists;
import org.apache.drill.common.exceptions.ExecutionSetupException;
import org.apache.drill.exec.ops.FragmentContext;
import org.apache.drill.exec.physical.impl.BatchCreator;
import org.apache.drill.exec.physical.impl.ScanBatch;
import org.apache.drill.exec.record.RecordBatch;
import org.apache.drill.exec.store.RecordReader;
import org.apache.hadoop.hive.metastore.api.Partition;
import org.apache.hadoop.hive.metastore.api.Table;
import org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe;
import org.apache.hadoop.mapred.InputSplit;
import org.apache.hadoop.mapred.TextInputFormat;

import java.util.List;

public class HiveScanBatchCreator implements BatchCreator<HiveSubScan> {

  @Override
  public RecordBatch getBatch(FragmentContext context, HiveSubScan config, List<RecordBatch> children) throws ExecutionSetupException {
    List<RecordReader> readers = Lists.newArrayList();
    Table table = config.getTable();
    List<InputSplit> splits = config.getInputSplits();
    List<Partition> partitions = config.getPartitions();
    boolean hasPartitions = (partitions != null && partitions.size() > 0);
    int i = 0;

    // Native hive text record reader doesn't handle all types currently. For now use HiveRecordReader which uses
    // Hive InputFormat and SerDe classes to read the data.
    //if (table.getSd().getInputFormat().equals(TextInputFormat.class.getCanonicalName()) &&
    //        table.getSd().getSerdeInfo().getSerializationLib().equals(LazySimpleSerDe.class.getCanonicalName()) &&
    //        config.getColumns() != null) {
    //  for (InputSplit split : splits) {
    //    readers.add(new HiveTextRecordReader(table,
    //        (hasPartitions ? partitions.get(i++) : null),
    //        split, config.getColumns(), context));
    //  }
    //} else {
      for (InputSplit split : splits) {
        readers.add(new HiveRecordReader(table,
            (hasPartitions ? partitions.get(i++) : null),
            split, config.getColumns(), context, config.getHiveReadEntry().hiveConfigOverride));
      }
    //}

    // If there are no readers created (which is possible when the table is empty), create an empty RecordReader to
    // output the schema
    if (readers.size() == 0) {
      readers.add(new HiveRecordReader(table, null, null, config.getColumns(), context,
          config.getHiveReadEntry().hiveConfigOverride));
    }

    return new ScanBatch(config, context, readers.iterator());
  }
}
TOP

Related Classes of org.apache.drill.exec.store.hive.HiveScanBatchCreator

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.