Package com.jgaap.distances

Source Code of com.jgaap.distances.KullbackLeiblerDivergenceTest

/*
* JGAAP -- a graphical program for stylometric authorship attribution
* Copyright (C) 2009,2011 by Patrick Juola
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as
* published by the Free Software Foundation, either version 3 of the
* License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/
/**
*
*/
package com.jgaap.distances;

import static org.junit.Assert.*;

import java.util.Vector;

import org.junit.Test;

import com.jgaap.generics.DistanceCalculationException;
import com.jgaap.util.Event;
import com.jgaap.util.EventMap;
import com.jgaap.util.EventSet;

/**
* @author Patrick Juola
*
*/
public class KullbackLeiblerDivergenceTest {

  /**
   * Test method for
   * {@link com.jgaap.distances.KullbackLeiblerDivergence#distance(com.jgaap.util.EventSet, com.jgaap.util.EventSet)}
   * .
   * @throws DistanceCalculationException
   */
  @Test
  public void testDistance() throws DistanceCalculationException {
    /*
     * n.b. The KL function uses logarithms, for which we use Java's
     * built-in Math.log() function. Math.log() returns the _natural_ (base
     * e) log of a number, not the more usual/intuitive base 2. Formally, we
     * are using units of 'nats' instead of the more normal 'bits.' Not a
     * problem as long as we can remember to do the unit conversions and
     * don't mind working in furlongs per fortnight.
     */

    /* test 1 -- the same histogram should yield distance 0.0 */
    EventSet es1 = new EventSet();
    EventSet es2 = new EventSet();
    Vector<Event> test1 = new Vector<Event>();
    test1.add(new Event("The", null));
    test1.add(new Event("quick", null));
    test1.add(new Event("brown", null));
    test1.add(new Event("fox", null));
    test1.add(new Event("jumps", null));
    test1.add(new Event("over", null));
    test1.add(new Event("the", null));
    test1.add(new Event("lazy", null));
    test1.add(new Event("dog", null));
    test1.add(new Event(".", null));
    es1.addEvents(test1);
    es2.addEvents(test1);

    assertTrue(new KullbackLeiblerDivergence().distance(new EventMap(es1), new EventMap(es2)) == 0.00);

    /* test 2 -- different hist, same distribution (still 0.0) */
    /* use prior data and add another copy */
    es2.addEvents(test1);
    assertTrue(new KullbackLeiblerDivergence().distance(new EventMap(es1), new EventMap(es2)) == 0.00);

    /* test 3 -- different distributions */

    test1 = new Vector<Event>(); // no need to re-create test1
    Vector<Event> test2 = new Vector<Event>();

    /* es1 gets a 50/50 split between alpha and beta */
    test1.add(new Event("alpha", null));
    test1.add(new Event("beta", null));
    es1 = new EventSet();
    es1.addEvents(test1);

    /* es2 gets a 75/25 split between alpha and beta */
    test2.add(new Event("alpha", null));
    test2.add(new Event("alpha", null));
    test2.add(new Event("alpha", null));
    test2.add(new Event("beta", null));
    es2 = new EventSet();
    es2.addEvents(test2);
    double result = new KullbackLeiblerDivergence().distance(new EventMap(es1), new EventMap(es2));
    System.out.println(result);
    assertTrue(DistanceTestHelper.inRange(result, 0.1438410, 0.00001));

    /* test 4 -- reversed distributions */
    result = new KullbackLeiblerDivergence().distance(new EventMap(es2), new EventMap(es1));
    assertTrue(DistanceTestHelper.inRange(result, 0.13081203594, 0.00001));
    /* test 5 -- distributions with 0 (need rounding) */
    /* use same 50/50 es1 */
    /*
     * value of nonce-term gamma should be 0.25 (half of 0.5, because each
     * element appears once
     */

    /* es2 gets a 50/25/25 split between alpha, beta,gamma */
    test2 = new Vector<Event>();
    test2.add(new Event("alpha", null));
    test2.add(new Event("alpha", null));
    test2.add(new Event("beta", null));
    test2.add(new Event("gamma", null));

    es2 = new EventSet();
    es2.addEvents(test2);
    System.out.println("Start here");
    result = new KullbackLeiblerDivergence().distance(new EventMap(es1), new EventMap(es2));
    System.out.println(result);
    assertTrue(DistanceTestHelper.inRange(result, 0.346574, 0.00001));

  }

}
TOP

Related Classes of com.jgaap.distances.KullbackLeiblerDivergenceTest

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.