Package org.dmg.pmml31.UnivariateStatsDocument

Examples of org.dmg.pmml31.UnivariateStatsDocument.UnivariateStats


        return getPmml();
    }           
   
    public PMMLDocument toPMMLDocument()
    {
        PMMLDocument result = PMMLDocument.Factory.newInstance();
        PMML pmmlObject = result.addNewPMML();
        pmmlObject.setVersion("3.0");
        // head of PMML document
        Header header = pmmlObject.addNewHeader();
        header.setCopyright("www.gridminer.org");
        Application application = header.addNewApplication();
View Full Code Here


        throws ActivityProcessingException,
               ActivityTerminatedException,
               ActivityUserException
    {
        TupleListIterator tuples = (TupleListIterator)iterationData[0];
        PMMLDocument pmmlInput = (PMMLDocument) iterationData[1];
       
        ModelStatsInterval modelStats =
            new ModelStatsInterval(tuples, pmmlInput);
        modelStats.countStatistics();
        try
View Full Code Here

    protected void processIteration(Object[] iterationData)
        throws ActivityProcessingException,
               ActivityTerminatedException,
               ActivityUserException
    {
        PMMLDocument pmml = (PMMLDocument)iterationData[0];
        try
        {
            mOutput.write(pmml.toString().toCharArray());
        }
        catch (PipeClosedException e)
        {
            iterativeStageComplete();
        }
View Full Code Here

        TupleListIterator tupleList = (TupleListIterator) iterationData[0];
        ListIterator columnList = (ListIterator) iterationData[1];
        ListIterator methodsList = (ListIterator) iterationData[2];
        ListIterator causeList = (ListIterator) iterationData[3];
        ListIterator parameterList = (ListIterator) iterationData[4];
        PMMLDocument pmml = (PMMLDocument) iterationData[5];

        Integer column;
        while ((column = (Integer) columnList.nextValue()) != null)
        {
            String method = (String) methodsList.nextValue();
            String cause = (String) causeList.nextValue();
            Object[] parameters = (Object[]) parameterList.nextValue();

            if (method == null || cause == null || parameters == null)
            {
                throw new ActivityUserException(
                        new UnmatchedInputException(
                                new String[] {
                                        INPUT_COLUMNS,
                                        INPUT_METHODS,
                                        INPUT_CAUSE,
                                        INPUT_PARAMETERS },
                                new Object[] {
                                        column, method, cause, parameters }));
            }

            DPPMethodForColumn methodForColumn = loadMethod(
                    column.intValue(),
                    method,
                    cause,
                    parameters,
                    pmml.getPMML());
            mColumnMethods.put(column, methodForColumn);
        }

        if (methodsList.nextValue() != null
                || causeList.nextValue() != null
                || parameterList.nextValue() != null)
        {
            throw new ActivityUserException(
                    new UnmatchedInputException(
                            new String[] {
                                    INPUT_COLUMNS,
                                    INPUT_METHODS,
                                    INPUT_CAUSE,
                                    INPUT_PARAMETERS }));
        }

        TupleMetadata metadata =
            (TupleMetadata) tupleList.getMetadataWrapper().getMetadata();

        // load all intervals
        mInterval = DPPHelper.loadIntervals(metadata, pmml.getPMML());

        // write metadata to output
        writeBlock(tupleList.getMetadataWrapper());
        // now apply DPP methods to input tuples and write the results
        Tuple tuple;
View Full Code Here

    }
   
    public PMMLDocument toObject()
    {
        PMMLDocument result = PMMLDocument.Factory.newInstance();
        PMML pmmlObject = result.addNewPMML();
        pmmlObject.setVersion("3.0");
        //head of PMML document
        pmmlObject.setHeader(mPMML.getHeader());
        //data dictionary
        DataField[] dataFields = mPMML.getDataDictionary().getDataFieldArray();
        for(int i=0; i<columnCount; i++)
        {
            OPTYPE.Enum optype = dataFields[i].getOptype();
            if (optype == OPTYPE.CATEGORICAL)
            {
                int countValue = histogram_values[i].size();
                Value value = dataFields[i].addNewValue();
                for(int j=0; j<countValue; j++)
                {
                    value.setValue(histogram_values[i].get(j).toString());
                    Extension ext = value.addNewExtension();
                    ext.setName("count");
                    ext.setValue(String.valueOf(histogram_frequency[i][j]));
                }
            }
        }       
        pmmlObject.setDataDictionary(mPMML.getDataDictionary());
        pmmlObject.getDataDictionary().setDataFieldArray(dataFields);
               
        //ModelStat
        MiningModel miningModel = pmmlObject.addNewMiningModel();
        miningModel.setModelName("Statistica");
        org.dmg.pmml31.ModelStatsDocument.ModelStats modelStats =
            miningModel.addNewModelStats();
       
        for(int i=0; i<columnCount; i++)
View Full Code Here

    }           
   
    public PMMLDocument toPMMLDocument()
    {
        PMMLDocument result = PMMLDocument.Factory.newInstance();
        PMML pmmlObject = result.addNewPMML();
        pmmlObject.setVersion("3.0");
        // head of PMML document
        Header header = pmmlObject.addNewHeader();
        header.setCopyright("www.gridminer.org");
        Application application = header.addNewApplication();
        application.setName("GridMiner");
        application.setVersion("1.0");
        //data dictionary
        DataDictionary dataDictionary = pmmlObject.addNewDataDictionary();
        BigInteger pom = new BigInteger(String.valueOf(columnCount));
        dataDictionary.setNumberOfFields(pom);
       
        for (int i = 0; i < columnCount; i++)
        {
            DataField dataField = dataDictionary.addNewDataField();
            dataField.setName(colInfo[i].getName());
            dataField.setDisplayName(colInfo[i].getDisplayName());          
            //dataField[i].setDataType(DATATYPE.fromString(colInfo[i].getDataType()));
            dataField.setDataType(
                    DATATYPE.Enum.forString(colInfo[i].getDataType()));
            // all attribute are continuous in this phase
            dataField.setOptype(OPTYPE.CONTINUOUS);        
        }
       
        //ModelStat
        MiningModel miningModel = pmmlObject.addNewMiningModel();
        miningModel.setModelName("Statistica");
        org.dmg.pmml31.ModelStatsDocument.ModelStats modelStats =
            miningModel.addNewModelStats();
       
        for (int i=0; i<columnCount; i++)
View Full Code Here

        org.dmg.pmml31.ModelStatsDocument.ModelStats modelStats =
            miningModel.addNewModelStats();
       
        for (int i=0; i<columnCount; i++)
        {
            UnivariateStats statfield = modelStats.addNewUnivariateStats();
            statfield.setField(colInfo[i].getName());
            // counts
            Counts counts = statfield.addNewCounts();
            pom = new BigInteger(String.valueOf(totalFreq[i]));
            counts.setTotalFreq(pom);
            pom = new BigInteger(String.valueOf(missingData[i]));
            counts.setMissingFreq(pom);
           
            Extension ext = counts.addNewExtension();
            ext.setName("distinctValues");
            ext.setValue(String.valueOf(hashSet[i].size()));
           
            String colType = colInfo[i].getDataType();
            if (colType.equalsIgnoreCase("integer")||
                colType.equalsIgnoreCase("float")||
                colType.equalsIgnoreCase("double"))
            {
               // numeric info
                NumericInfo numInfo = statfield.addNewNumericInfo();
                numInfo.setMinimum(minimum[i]);
                numInfo.setMaximum(maximum[i]);
                numInfo.setMean(mean[i]);
                numInfo.setStandardDeviation(stddev[i]);
            }
View Full Code Here

        org.dmg.pmml31.ModelStatsDocument.ModelStats modelStats =
            miningModel.addNewModelStats();
       
        for(int i=0; i<columnCount; i++)
        {
            UnivariateStats statfield = modelStats.addNewUnivariateStats();
            statfield.setField(colInfo[i].getName());
            // Counts
            Counts counts = statfield.addNewCounts();
            BigInteger pom = new BigInteger(String.valueOf(totalFreq[i]));
            counts.setTotalFreq(pom);
            pom = new BigInteger(String.valueOf(missingData[i]));
            counts.setMissingFreq(pom);
            pom = new BigInteger(String.valueOf(invalidFreq[i]));
            counts.setInvalidFreq(pom);           
            Extension ext = counts.addNewExtension();
            ext.setName("distinctValues");
            ext.setValue(String.valueOf(distinctValue[i]));
           
            //DiscrStats
            OPTYPE.Enum optype = mPMML.getDataDictionary().getDataFieldArray(i).getOptype();
            if(optype == OPTYPE.CATEGORICAL)
            {
                DiscrStats discrStats = statfield.addNewDiscrStats();
                int index = histogram_maxfrequency[i];
                discrStats.setModalValue(histogram_values[i].get(index).toString());
            }
            else
           
                if (interval[i]!=null)
                {
                    NumericInfo numInfo = statfield.addNewNumericInfo();
                    numInfo.setMinimum(minimum[i]);
                    numInfo.setMaximum(maximum[i]);
                    numInfo.setMean(mean[i]);
                    numInfo.setStandardDeviation(stddev[i]);               
                   
                    // ContStats                                                               
                    ContStats contsStats = statfield.addNewContStats();
                    contsStats.setTotalValuesSum(sum[i]);
                    contsStats.setTotalSquaresSum(sum2[i]);  
                                       
                    int intervalCount = interval[i].length;
                    for(int index=0; index<intervalCount; index++)
                    {
                        org.dmg.pmml31.IntervalDocument.Interval interv =
                            contsStats.addNewInterval();
                        interv.setLeftMargin(interval[i][index].getLeftMargin());
                        interv.setRightMargin(interval[i][index].getRightMargin());
                       
                        interv.setClosure(
                                Closure.Enum.forString(
                                        interval[i][index].getClosureName()));
                       
                        Extension extension = interv.addNewExtension();
                        extension.setName("Frequencies");
                        extension.setValue(String.valueOf(interval_frequency[i][index]));
                        extension = interv.addNewExtension();
                        extension.setName("SumOfValues");
                        extension.setValue(String.valueOf(interval_sumofvalues[i][index]));
                        extension = interv.addNewExtension();
                        extension.setName("SumOfSquaredValues");
                        extension.setValue(String.valueOf(interval_squaresum[i][index]));
                    }
                }
                else
                {
                    statfield.setNumericInfo(
                        mPMML.getMiningModelArray(0).getModelStats()
                            .getUnivariateStatsArray(i).getNumericInfo());
                }                   
            }           
        }
View Full Code Here

        {
            OPTYPE.Enum optype = dataFields[i].getOptype();
            if (optype == OPTYPE.CATEGORICAL)
            {
                int countValue = histogram_values[i].size();
                Value value = dataFields[i].addNewValue();
                for(int j=0; j<countValue; j++)
                {
                    value.setValue(histogram_values[i].get(j).toString());
                    Extension ext = value.addNewExtension();
                    ext.setName("count");
                    ext.setValue(String.valueOf(histogram_frequency[i][j]));
                }
            }
        }       
View Full Code Here

TOP

Related Classes of org.dmg.pmml31.UnivariateStatsDocument.UnivariateStats

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.