Package org.apache.blur.thrift.util

Source Code of org.apache.blur.thrift.util.LoadData

package org.apache.blur.thrift.util;

/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.PrintWriter;
import java.util.ArrayList;
import java.util.List;
import java.util.Random;
import java.util.concurrent.TimeUnit;

import org.apache.blur.thirdparty.thrift_0_9_0.TException;
import org.apache.blur.thrift.BlurClient;
import org.apache.blur.thrift.generated.Blur.Iface;
import org.apache.blur.thrift.generated.BlurException;
import org.apache.blur.thrift.generated.Column;
import org.apache.blur.thrift.generated.Record;
import org.apache.blur.thrift.generated.RecordMutation;
import org.apache.blur.thrift.generated.RecordMutationType;
import org.apache.blur.thrift.generated.RowMutation;
import org.apache.blur.thrift.generated.RowMutationType;

public class LoadData {

  private static final long _5_SECONDS = TimeUnit.SECONDS.toNanos(5);
  private static Random random = new Random();
  private static List<String> words = new ArrayList<String>();

  public static void main(String[] args) throws BlurException, TException, IOException {
    final int numberOfColumns = 3;
    int numberRows = 100000;
    final int numberRecordsPerRow = 3;
    final int numberOfFamilies = 3;
    final int numberOfWords = 30;
    int batch = 1;
    String connectionString = args[0];
    String table = args[1];
    Iface client = BlurClient.getClient(connectionString);
    runLoad(client, false, table, numberRows, numberRecordsPerRow, numberOfFamilies, numberOfColumns, numberOfWords,
        batch, new PrintWriter(System.out));
  }

  public static void runLoad(Iface client, boolean enqueue, String table, int numberRows, int numberRecordsPerRow,
      int numberOfFamilies, int numberOfColumns, int numberOfWords, int batch, PrintWriter out) throws IOException,
      BlurException, TException {
    loadWords();

    int countRow = 0;
    int countRecord = 0;
    final long start = System.currentTimeMillis();
    long s = start;

    List<RowMutation> mutations = new ArrayList<RowMutation>();

    long ts = System.nanoTime();
    for (int i = 0; i < numberRows; i++) {
      long now = System.nanoTime();
      if (ts + _5_SECONDS < now) {
        printPerformance(out, countRow, countRecord, start, s, i);
        countRow = 0;
        countRecord = 0;
        s = System.currentTimeMillis();
        ts = System.nanoTime();
      }

      RowMutation mutation = new RowMutation();
      mutation.setTable(table);
      String rowId = getRowId();
      mutation.setRowId(rowId);
      mutation.setRowMutationType(RowMutationType.REPLACE_ROW);
      for (int j = 0; j < numberRecordsPerRow; j++) {
        mutation.addToRecordMutations(getRecordMutation(numberOfColumns, numberOfFamilies, numberOfWords));
        countRecord++;
      }
      if (batch == 1) {
        if (enqueue) {
          client.enqueueMutate(mutation);
        } else {
          client.mutate(mutation);
        }
      } else {
        mutations.add(mutation);
        if (mutations.size() >= batch) {
          if (enqueue) {
            client.enqueueMutateBatch(mutations);
          } else {
            client.mutateBatch(mutations);
          }
          mutations.clear();
        }
      }
      countRow++;
    }
    if (!mutations.isEmpty()) {
      if (enqueue) {
        client.enqueueMutateBatch(mutations);
      } else {
        client.mutateBatch(mutations);
      }
    }
    printPerformance(out, countRow, countRecord, start, s, numberRows);
  }

  private static void printPerformance(PrintWriter out, int countRow, int countRecord, final long start, long s, int i) {
    double totalSeconds = (System.currentTimeMillis() - start) / 1000.0;
    double seconds = (System.currentTimeMillis() - s) / 1000.0;
    double recordRate = countRecord / seconds;
    double rowRate = countRow / seconds;
    double avgRowRate = i / totalSeconds;
    out.printf("Rows indexed [%d] at Avg Rows [%f/s] Rows [%f/s] Records [%f/s]%n", i, avgRowRate, rowRate, recordRate);
    out.flush();
  }

  private static void loadWords() throws IOException {
    InputStream inputStream = LoadData.class.getResourceAsStream("words.txt");
    BufferedReader reader = new BufferedReader(new InputStreamReader(inputStream));
    String word;
    while ((word = reader.readLine()) != null) {
      words.add(word.trim());
    }
    reader.close();
  }

  protected static RecordMutation getRecordMutation(int numberOfColumns, int numberOfFamilies, int numberOfWords) {
    RecordMutation recordMutation = new RecordMutation();
    recordMutation.setRecord(getRecord(numberOfColumns, numberOfFamilies, numberOfWords));
    recordMutation.setRecordMutationType(RecordMutationType.REPLACE_ENTIRE_RECORD);
    return recordMutation;
  }

  private static Record getRecord(int numberOfColumns, int numberOfFamilies, int numberOfWords) {
    Record record = new Record();
    record.setRecordId(getRowId());
    record.setFamily(getFamily(numberOfFamilies));
    for (int i = 0; i < numberOfColumns; i++) {
      record.addToColumns(new Column("col" + i, getWords(numberOfWords)));
    }
    return record;
  }

  private static String getWords(int numberOfWords) {
    StringBuilder builder = new StringBuilder();
    for (int i = 0; i < numberOfWords; i++) {
      if (i != 0) {
        builder.append(' ');
      }
      builder.append(getWord());
    }
    return builder.toString();
  }

  private static String getFamily(int numberOfFamilies) {
    return "fam" + random.nextInt(numberOfFamilies);
  }

  private static String getWord() {
    return makeUpperCaseRandomly(words.get(random.nextInt(words.size())), random);
  }

  private static String makeUpperCaseRandomly(String s, Random r) {
    if (r.nextBoolean()) {
      return s.substring(0, 1).toUpperCase() + s.substring(1);
    }
    return s;
  }

  protected static String getRowId() {
    return Long.toString(Math.abs(random.nextLong())) + "-" + Long.toString(Math.abs(random.nextLong()));
  }

}
TOP

Related Classes of org.apache.blur.thrift.util.LoadData

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.