Package org.apache.pig.test

Source Code of org.apache.pig.test.TestCharArrayToNumeric

/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
* http://www.apache.org/licenses/LICENSE-2.0
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.pig.test;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNull;

import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Random;

import org.apache.pig.ExecType;
import org.apache.pig.PigServer;
import org.apache.pig.backend.executionengine.ExecException;
import org.apache.pig.backend.hadoop.executionengine.physicalLayer.PhysicalOperator;
import org.apache.pig.backend.hadoop.executionengine.physicalLayer.expressionOperators.POCast;
import org.apache.pig.backend.hadoop.executionengine.physicalLayer.expressionOperators.POProject;
import org.apache.pig.data.DataType;
import org.apache.pig.data.Tuple;
import org.apache.pig.data.TupleFactory;
import org.apache.pig.impl.plan.NodeIdGenerator;
import org.apache.pig.impl.plan.OperatorKey;
import org.junit.AfterClass;
import org.junit.Before;
import org.junit.Test;

public class TestCharArrayToNumeric {
    private Double dummyDouble = null;
    private Float dummyFloat = null;
    private Long dummyLong = null;
    private Integer dummyInteger = null;
    private Double MaxDouble = Double.MIN_VALUE;
    private Double MinDouble = Double.MIN_VALUE;
    private Float MaxFloat = Float.MAX_VALUE;
    private Float MinFloat = Float.MIN_VALUE;
    private Long MaxLong = Long.MAX_VALUE;
    private Long MinLong = Long.MIN_VALUE;
    private Integer MaxInteger = Integer.MAX_VALUE;
    private Integer MinInteger = Integer.MIN_VALUE;

    static MiniCluster cluster = MiniCluster.buildCluster();
    PigServer pig;

    @Before
    public void setUp() throws Exception {
        pig = new PigServer(ExecType.MAPREDUCE, cluster.getProperties());
    }

    @AfterClass
    public static void oneTimeTearDown() throws Exception {
        cluster.shutDown();
    }

    public static OperatorKey newOperatorKey() {
        long newId = NodeIdGenerator.getGenerator().getNextNodeId("scope");
        return new OperatorKey("scope", newId);
    }

    @Test
    public void testCast() throws ExecException {
        POCast cast = new POCast(newOperatorKey(), -1);
        POProject proj = new POProject(newOperatorKey(), -1, 0);
        proj.setResultType(DataType.CHARARRAY);
        List<PhysicalOperator> inputs = new ArrayList<PhysicalOperator>();
        inputs.add(proj);
        cast.setInputs(inputs);

        // cast to double
        String[] items = { "12.0", "-13.2", "0.1f", "1.3e2", "zjf",
                        MaxDouble.toString(), MinDouble.toString() };
        Double[] doubleExpected = { 12.0, -13.2, 0.1, 1.3e2, null, MaxDouble,
                        MinDouble };
        for (int i = 0; i < items.length; ++i) {
            Tuple tuple = TupleFactory.getInstance().newTuple(1);
            tuple.set(0, items[i]);
            proj.attachInput(tuple);
            Double actual = (Double)cast.getNextDouble().result;
            if (doubleExpected[i] != null) {
                assertEquals(doubleExpected[i], actual, 1e-6);
            } else {
                assertNull(actual);
            }
        }

        // cast to float
        items = new String[] { "12.0", "-13.2", "0.1f", "1.3e2",
                        MaxFloat.toString(), MinFloat.toString(), "zjf" };
        Float[] floatExpected = { 12.0f, -13.2f, 0.1f, 1.3e2f, MaxFloat,
                        MinFloat, null };
        for (int i = 0; i < items.length; ++i) {
            Tuple tuple = TupleFactory.getInstance().newTuple(1);
            tuple.set(0, items[i]);
            proj.attachInput(tuple);
            Float actual = (Float)cast.getNextFloat().result;
            if (floatExpected[i] != null) {
                assertEquals(floatExpected[i], actual, 1e-6);
            } else {
                assertNull(actual);
            }
        }

        // cast to long
        items = new String[] { "1", "-1", "12.2", "12.8", MaxLong.toString(),
                        MinLong.toString(), "df1.2" };
        Long[] longExpected = { 1L, -1L, 12L, 12L, MaxLong, MinLong, null };
        for (int i = 0; i < items.length; ++i) {
            Tuple tuple = TupleFactory.getInstance().newTuple(1);
            tuple.set(0, items[i]);
            proj.attachInput(tuple);
            Long actual = (Long)cast.getNextLong().result;
            if (longExpected[i] != null) {
                assertEquals(longExpected[i], actual);
            } else {
                assertNull(actual);
            }
        }

        // cast to int
        items = new String[] { "1", "-1", "12.2", "12.8",
                        MaxInteger.toString(), MinInteger.toString(), "ff4332" };
        Integer[] intExpected = { 1, -1, 12, 12, MaxInteger, MinInteger, null };
        for (int i = 0; i < items.length; ++i) {
            Tuple tuple = TupleFactory.getInstance().newTuple(1);
            tuple.set(0, items[i]);
            proj.attachInput(tuple);
            Integer actual = (Integer)cast.getNextInteger().result;
            if (intExpected[i] != null) {
                assertEquals(intExpected[i], actual);
            } else {
                assertNull(actual);
            }
        }
    }

    @Test
    public void testCharArray2FloatAndDoubleScript() throws IOException {
        // create a input file with format (key,value)
        int size = 100;
        String[] numbers = new String[size + 1];
        Random rand = new Random();
        Map<Integer, Double> map = new HashMap<Integer, Double>();

        try {
            for (int i = 0; i < numbers.length; ++i) {
                int key = i;
                double value = rand.nextDouble() * 100;
                numbers[i] = (key + "\t" + value);
                map.put(key, value);
            }
            // append a null at the last line, to test string which can not been
            // cast
            numbers[numbers.length - 1] = (numbers.length + "\t" + "null");
            map.put(numbers.length, null);
            Util.createInputFile(cluster, "pig_jira_893-input1.txt", numbers);
            byte[] numericTypes = new byte[] { DataType.DOUBLE, DataType.FLOAT, };
            for (byte type : numericTypes) {
                pig.registerQuery("A = Load 'pig_jira_893-input1.txt' AS " +
                        "(key:int,value:chararray);");
                pig.registerQuery("B = FOREACH A GENERATE key,("
                        + DataType.findTypeName(type) + ")value;");
                Iterator<Tuple> iter = pig.openIterator("B");
                while (iter.hasNext()) {
                    Tuple tuple = iter.next();
                    Integer key = (Integer)tuple.get(0);
                    String value = null;
                    if (tuple.get(1) != null) {
                        value = tuple.get(1).toString();
                    }

                    if (type == DataType.DOUBLE) {
                        Double expected = map.get(key);
                        if (value != null) {
                            assertEquals(expected, (Double)Double.parseDouble(value));
                        } else {
                            assertNull(expected);
                        }

                    }
                    if (type == DataType.FLOAT) {
                        Float expected = null;
                        if (map.get(key) != null) {
                            expected = map.get(key).floatValue();
                        }
                        if (value != null) {
                            assertEquals(expected, (Float)Float.parseFloat(value));
                        } else {
                            assertNull(expected);
                        }
                    }
                }
            }
        } finally {
            Util.deleteFile(cluster, "pig_jira_893-input1.txt");
        }
    }

    @Test
    public void testCharArrayToIntAndLongScript() throws IOException {
        // create a input file with format (key,value)
        int size = 100;
        String[] numbers = new String[size + 1];
        Random rand = new Random();
        Map<Integer, Long> map = new HashMap<Integer, Long>();

        try {
            for (int i = 0; i < numbers.length; ++i) {
                int key = i;
                long value = rand.nextInt(100);
                numbers[i] = (key + "\t" + value);
                map.put(key, value);
            }
            // append a null at the last line, to test string which can not been
            // cast
            numbers[numbers.length - 1] = (numbers.length + "\t" + "null");
            map.put(numbers.length, null);
            Util.createInputFile(cluster, "pig_jira_893-input2.txt", numbers);
            byte[] numericTypes = new byte[] { DataType.INTEGER, DataType.LONG, };
            for (byte type : numericTypes) {
                pig.registerQuery("A = Load 'pig_jira_893-input2.txt' AS " +
                        "(key:int,value:chararray);");
                pig.registerQuery("B = FOREACH A GENERATE key,("
                        + DataType.findTypeName(type) + ")value;");
                Iterator<Tuple> iter = pig.openIterator("B");
                while (iter.hasNext()) {
                    Tuple tuple = iter.next();
                    Integer key = (Integer)tuple.get(0);
                    String value = null;
                    if (tuple.get(1) != null) {
                        value = tuple.get(1).toString();
                    }

                    if (type == DataType.LONG) {
                        Long expected = map.get(key);
                        if (value != null) {
                            Long actual = Long.parseLong(value);
                            assertEquals(expected, actual);
                        } else {
                            assertEquals(expected, null);
                        }
                    }
                    if (type == DataType.INTEGER) {
                        Integer expected = null;
                        if (map.get(key) != null) {
                            expected = map.get(key).intValue();
                        }
                        if (value != null) {
                            Integer actual = Integer.parseInt(value);
                            assertEquals(expected, actual);
                        } else {
                            assertNull(expected);
                        }
                    }
                }
            }
        } finally {
            Util.deleteFile(cluster, "pig_jira_893-input2.txt");
        }
    }
}
TOP

Related Classes of org.apache.pig.test.TestCharArrayToNumeric

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.