Package com.cloudera.cdk.tools

Source Code of com.cloudera.cdk.tools.TestCombinedLogFormatConverter

/**
* Copyright 2013 Cloudera Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.cloudera.cdk.tools;

import com.cloudera.cdk.data.Dataset;
import com.cloudera.cdk.data.DatasetReader;
import com.cloudera.cdk.data.DatasetRepositories;
import com.cloudera.cdk.data.DatasetRepository;
import com.google.common.io.Resources;
import java.io.File;
import junit.framework.Assert;
import org.apache.avro.generic.GenericRecord;
import org.apache.hadoop.fs.FileUtil;
import org.junit.Before;
import org.junit.Test;

public class TestCombinedLogFormatConverter {

  private static final File TEST_DIR = new File("/tmp", TestCombinedLogFormatConverter
      .class.getName());

  @Before
  public void setUp() {
    FileUtil.fullyDelete(TEST_DIR);
  }

  @Test
  public void test() throws Exception {
    CombinedLogFormatConverter tool = new CombinedLogFormatConverter();

    String input = Resources.getResource("access_log.txt").toExternalForm();
    String datasetUri = "repo:" + TEST_DIR.toURI().toURL().toExternalForm();
    String datasetName = "logs";

    int exitCode = tool.run(input, datasetUri, datasetName);

    Assert.assertEquals(0, exitCode);

    DatasetRepository repo = DatasetRepositories.open(datasetUri);
    Dataset<GenericRecord> dataset = repo.load(datasetName);
    DatasetReader<GenericRecord> reader = dataset.newReader();
    try {
      reader.open();
      Assert.assertTrue(reader.hasNext());
      GenericRecord first = reader.next();

      Assert.assertEquals("ip1", first.get("host"));
      Assert.assertNull(first.get("rfc931_identity"));
      Assert.assertNull(first.get("username"));
      Assert.assertEquals("24/Apr/2011:04:06:01 -0400", first.get("datetime"));
      Assert.assertEquals("GET /~strabal/grease/photo9/927-3.jpg HTTP/1.1",
          first.get("request"));
      Assert.assertEquals(200, first.get("http_status_code"));
      Assert.assertEquals(40028, first.get("response_size"));
      Assert.assertNull(first.get("referrer"));
      Assert.assertEquals("Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex" +
          ".com/bots)", first.get("user_agent"));
    } finally {
      reader.close();
    }

  }
}
TOP

Related Classes of com.cloudera.cdk.tools.TestCombinedLogFormatConverter

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.