Package com.jgaap.util

Examples of com.jgaap.util.Document


    probs[0] = 0.02874005; //Mary
    //R code : pnorm(80,30,sqrt(200),lower.tail=FALSE)*pnorm(20,70,sqrt(200))*.5
    probs[1] = 2.070124e-08; //Peter
    weka.core.Utils.normalize(probs);
   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);
   
    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    Document knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    Document knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    WEKANaiveBayes classifier = new WEKANaiveBayes();
    classifier.train(knowns);
    List<Pair<String, Double>> t = classifier.analyze(unknownDocument);
View Full Code Here


    test1.add(new Event(".", null));
    known1.addEvents(test1);
    unknown.addEvents(test1);
   
    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    //knownDocument1.setAuthor(known1.getAuthor());
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);

   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);
    NullHistAnalysis nullHistAnalysis = new NullHistAnalysis();
    nullHistAnalysis.train(knowns);
    List<Pair<String, Double>> t = nullHistAnalysis.analyze(unknownDocument);
    String r = t.get(0).getFirst();
    String s = "No analysis performed.\n";
View Full Code Here

    known4.addEvent(new Event("a", null));
    known4.addEvent(new Event("peck", null));
    //known4.setAuthor("Peter");

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    Document knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    Document knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    //Create unknown text
    EventSet unknown1 = new EventSet();

    unknown1.addEvent(new Event("mary", null));
    unknown1.addEvent(new Event("had", null));
    unknown1.addEvent(new Event("a", null));
    unknown1.addEvent(new Event("little", null));
    unknown1.addEvent(new Event("beta", null));

    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown1);

    //Classify unknown based on the knowns
    WEKALeastMedSq classifier = new WEKALeastMedSq();
    List<List<Pair<String, Double>>> t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument));
    System.out.println(t.toString());

    //Assert that the authors match
    assertTrue(t.get(0).get(0).getFirst().equals("Mary"));
   
   
    // Test 1b - Test equal likelihood
   
    EventSet unknown2 = new EventSet();
   
    unknown2.addEvent(new Event("mary", null));
    unknown2.addEvent(new Event("had", null));
    unknown2.addEvent(new Event("a", null));
    unknown2.addEvent(new Event("peter", null));
    unknown2.addEvent(new Event("piper", null));
   
    Document unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);
   
    t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument2));
    System.out.println(t.toString());
    assertTrue(Math.abs(t.get(0).get(0).getSecond()-0.5)<.0001);
    assertTrue(Math.abs(t.get(0).get(1).getSecond()-0.5)<.0001);

    classifier = new WEKALeastMedSq();
    t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument));
    System.out.println(t.toString());
    assertTrue(t.get(0).get(0).getFirst().equals("Mary"));
   

    //Test 3 - Add in another unknown

    EventSet unknown3 = new EventSet();

    unknown3.addEvent(new Event("peter", null));
    unknown3.addEvent(new Event("piper", null));
    unknown3.addEvent(new Event("picked", null));
    unknown3.addEvent(new Event("a", null));
    unknown3.addEvent(new Event("shells", null));

    Document unknownDocument3 = new Document();

    classifier = new WEKALeastMedSq();
    t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument));
View Full Code Here

    test3.add(new Event("as", null));
    test3.add(new Event("snow.", null));
    unknown.addEvents(test3);

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);

    System.out.println("There once was a lass from Nantucket");
    nearest.train(knowns);
    List<Pair<String, Double>> t = nearest.analyze(unknownDocument);
    String r = t.get(0).getFirst();
View Full Code Here

    for(int i=0; i<sample3.length(); i++){
      unknown.addEvent(new Event(sample3.charAt(i), null));
    }
   
    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Frodo");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Sam");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);
   
    MarkovChainAnalysis gandolf = new MarkovChainAnalysis();
    gandolf.train(knowns);
    List<Pair<String, Double>> t = gandolf.analyze(unknownDocument);
    for(int i=0; i<t.size(); i++){
View Full Code Here

    known4.addEvent(new Event("a", null));
    known4.addEvent(new Event("peck", null));
    //known4.setAuthor("Peter");

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    Document knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    Document knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    //Create unknown text
    EventSet unknown1 = new EventSet();

    unknown1.addEvent(new Event("mary", null));
    unknown1.addEvent(new Event("had", null));
    unknown1.addEvent(new Event("a", null));
    unknown1.addEvent(new Event("little", null));
    unknown1.addEvent(new Event("beta", null));

    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown1);

    //Classify unknown based on the knowns
    WEKALinearRegression classifier = new WEKALinearRegression();
    List<List<Pair<String, Double>>> t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument));
    System.out.println(t.toString());

    //Assert that the authors match
    assertTrue(t.get(0).get(0).getFirst().equals("Mary"));
   
    // Test 2 - Test equal likelihood
   
    EventSet unknown2 = new EventSet();
   
    unknown2.addEvent(new Event("piper", null));
    unknown2.addEvent(new Event("mary", null));
    unknown2.addEvent(new Event("a", null));
    unknown2.addEvent(new Event("peter", null));
    unknown2.addEvent(new Event("had", null));
   
    Document unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);
   
    t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument2));
    System.out.println(t.toString());
    assertTrue(Math.abs(t.get(0).get(0).getSecond()-0.5)<.1 && Math.abs(t.get(0).get(1).getSecond()-0.5)<.1);

    // Test 3 - more training documents
   
    EventSet known5 = new EventSet();
    EventSet known6 = new EventSet();
   
    known5.addEvent(new Event("she", null));
    known5.addEvent(new Event("sells", null));
    known5.addEvent(new Event("seashells", null));
    known5.addEvent(new Event("by", null));
    known5.addEvent(new Event("seashore", null));
    //known5.setAuthor("Susie");

    known6.addEvent(new Event("susie", null));
    known6.addEvent(new Event("sells", null));
    known6.addEvent(new Event("shells", null));
    known6.addEvent(new Event("by", null));
    known6.addEvent(new Event("seashore", null));
    //known6.setAuthor("Susie");

    Document knownDocument5 = new Document();
    knownDocument5.setAuthor("Susie");
    knownDocument5.addEventSet(null, known5);
    knowns.add(knownDocument5);
    Document knownDocument6 = new Document();
    knownDocument6.setAuthor("Susie");
    knownDocument6.addEventSet(null, known6);
    knowns.add(knownDocument6);
   
    t = new ArrayList<List<Pair<String,Double>>>();
    classifier.train(knowns);
    t.add(classifier.analyze(unknownDocument));
View Full Code Here

    unknown.addEvent(new Event("white", null));
    unknown.addEvent(new Event("as", null));
    unknown.addEvent(new Event("snow.", null));

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);
    LDA classifier = new LDA();
    classifier.train(knowns);
    List<Pair<String, Double>> t = classifier.analyze(unknownDocument);
    String author1 = t.get(0).getFirst();
    String author2 = t.get(1).getFirst();
    Double val1 = t.get(0).getSecond();
    Double val2 = t.get(1).getSecond();
    /*System.out.println("Test 1 Classified");
    System.out.println("First : "+author1+" "+t.get(0).getSecond());
    System.out.println("Second: "+author2+" "+t.get(1).getSecond());
    System.out.println("Expected");
    System.out.println("First : Mary");
    System.out.println("Second: Peter");*/
    assertTrue(author1.equals("Mary"));

    //Test 2 - Same classifier
    //Testing for persistence
    t = classifier.analyze(unknownDocument);
    /*System.out.println("Test 2 Classified");
    System.out.println("First : "+t.get(0).getFirst()+" "+t.get(0).getSecond());
    System.out.println("Second: "+t.get(1).getFirst()+" "+t.get(1).getSecond());
    System.out.println("Expected");
    System.out.println("First : Mary");
    System.out.println("Second: Peter");*/
    assertTrue(author1.equals(t.get(0).getFirst()) && Math.abs(val1 - t.get(0).getSecond()) < .000001
        && author2.equals(t.get(1).getFirst()) && Math.abs(val2 - t.get(1).getSecond()) < .000001);
   
    //Test 3 - Different instance of classifier
    //Again testing for persistence
    LDA lda = new LDA();
    lda.train(knowns);
    t = lda.analyze(unknownDocument);
    //String r = t.get(0).getFirst();
    /*System.out.println("Test 3 Classified");
    System.out.println("First : "+r+" "+t.get(0).getSecond());
    System.out.println("Second: "+t.get(1).getFirst()+" "+t.get(1).getSecond());
    System.out.println("Expected");
    System.out.println("First : Mary");
    System.out.println("Second: Peter");*/
    assertTrue(author1.equals(t.get(0).getFirst()) && Math.abs(val1 - t.get(0).getSecond()) < .000001
        && author2.equals(t.get(1).getFirst()) && Math.abs(val2 - t.get(1).getSecond()) < .000001);
   
    //Test 4 - two unknowns
    EventSet unknown2 = new EventSet();
    unknown2.addEvent(new Event("Peter", null));
    unknown2.addEvent(new Event("pumpkin", null));
    unknown2.addEvent(new Event("picked", null));
    unknown2.addEvent(new Event("a", null));
    unknown2.addEvent(new Event("pack", null));
    unknown2.addEvent(new Event("of", null));
    unknown2.addEvent(new Event("pickled", null));
    unknown2.addEvent(new Event("potatoes.", null));
   
    Document unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);
   
    List<List<Pair<String, Double>>> t2 = new ArrayList<List<Pair<String,Double>>>();
    t2.add(lda.analyze(unknownDocument));
    t2.add(lda.analyze(unknownDocument2));
    /*for(int i = 0; i < t2.size(); i++){
View Full Code Here

    test1.add(new Event(".", null));
    known1.addEvents(test1);
    unknown.addEvents(test1);
   
    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    //knownDocument1.setAuthor(known1.getAuthor());
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
   
    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown);
    NullAnalysis nullAnalysis = new NullAnalysis();
    nullAnalysis.train(knowns);
    List<Pair<String,Double>> t = nullAnalysis.analyze(unknownDocument);
    String r = t.get(0).getFirst();
    String s = "No analysis performed.\n";
View Full Code Here

    known4.addEvent(new Event("a", null));
    known4.addEvent(new Event("peck", null));
    //known4.setAuthor("Peter");

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    Document knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    Document knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    //Create unknown texts
    EventSet unknown1 = new EventSet();
    EventSet unknown2 = new EventSet();

    unknown1.addEvent(new Event("mary", null));
    unknown1.addEvent(new Event("had", null));
    unknown1.addEvent(new Event("a", null));
    unknown1.addEvent(new Event("little", null));
    unknown1.addEvent(new Event("beta", null));
   
    unknown2.addEvent(new Event("peter", null));
    unknown2.addEvent(new Event("piper", null));
    unknown2.addEvent(new Event("picked", null));
    unknown2.addEvent(new Event("a", null));
    unknown2.addEvent(new Event("shells", null));

    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown1);
    Document unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);

    //Classify unknown based on the knowns
    WEKADecisionStump classifier = new WEKADecisionStump();
    classifier.train(knowns);
    List<List<Pair<String, Double>>> t = new ArrayList<List<Pair<String,Double>>>();
    t.add(classifier.analyze(unknownDocument));
    t.add(classifier.analyze(unknownDocument2));
    System.out.println(knowns);
    System.out.println(unknownDocument.getEventSet(null));
    System.out.println(unknownDocument2.getEventSet(null));
    System.out.println(t.toString());
    //[[[Mary:1.0], [Peter:0.0]], [[Peter:1.0], [Mary:0.0]]]

      //System.out.println(t.toString());
      //[[[Mary:1.0], [Peter:0.0]], [[Peter:1.0], [Mary:0.0]]]

      //Assert that the authors match
      assertTrue(t.get(0).get(0).getFirst().equals("Mary") && t.get(1).get(0).getFirst().equals("Peter"));

    //Test 2 - Different documents
   
    //Redefine known documents
    known1 = new EventSet();
    known2 = new EventSet();
    known3 = new EventSet();
    known4 = new EventSet();
   
    known1.addEvent(new Event("alpha", null));
    known1.addEvent(new Event("alpha", null));
    known1.addEvent(new Event("alpha", null));
    known1.addEvent(new Event("alpha", null));
    known1.addEvent(new Event("beta", null));
    //known1.setAuthor("Mary");
   
    known3.addEvent(new Event("alpha", null));
    known3.addEvent(new Event("alpha", null));
    known3.addEvent(new Event("alpha", null));
    known3.addEvent(new Event("beta", null));
    known3.addEvent(new Event("beta", null));
    //known3.setAuthor("Mary");

    known2.addEvent(new Event("alpha", null));
    known2.addEvent(new Event("beta", null));
    known2.addEvent(new Event("beta", null));
    known2.addEvent(new Event("beta", null));
    known2.addEvent(new Event("beta", null));
    //known2.setAuthor("Peter");
   
    known4.addEvent(new Event("alpha", null));
    known4.addEvent(new Event("alpha", null));
    known4.addEvent(new Event("beta", null));
    known4.addEvent(new Event("beta", null));
    known4.addEvent(new Event("beta", null));
    //known4.setAuthor("Peter");
   
    knowns = new ArrayList<Document>();
    knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    //Create unknown texts
    unknown1 = new EventSet();
    unknown2 = new EventSet();

    unknown1.addEvent(new Event("alpha", null));
    unknown1.addEvent(new Event("alpha", null));
    unknown1.addEvent(new Event("alpha", null));
    unknown1.addEvent(new Event("alpha", null));
    unknown1.addEvent(new Event("alpha", null));
   
    unknown2.addEvent(new Event("beta", null));
    unknown2.addEvent(new Event("beta", null));
    unknown2.addEvent(new Event("beta", null));
    unknown2.addEvent(new Event("beta", null));
    unknown2.addEvent(new Event("beta", null));

    unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown1);
    unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);
   
    //Classify unknown based on the knowns
    classifier = new WEKADecisionStump();
    classifier.train(knowns);
    t = new ArrayList<List<Pair<String,Double>>>();
View Full Code Here

    known4.addEvent(new Event("a", null));
    known4.addEvent(new Event("peck", null));
    //known4.setAuthor("Peter");

    List<Document> knowns = new ArrayList<Document>();
    Document knownDocument1 = new Document();
    knownDocument1.setAuthor("Mary");
    knownDocument1.addEventSet(null, known1);
    knowns.add(knownDocument1);
    Document knownDocument2 = new Document();
    knownDocument2.setAuthor("Peter");
    knownDocument2.addEventSet(null, known2);
    knowns.add(knownDocument2);
    Document knownDocument3 = new Document();
    knownDocument3.setAuthor("Mary");
    knownDocument3.addEventSet(null, known3);
    knowns.add(knownDocument3);
    Document knownDocument4 = new Document();
    knownDocument4.setAuthor("Peter");
    knownDocument4.addEventSet(null, known4);
    knowns.add(knownDocument4);

    //Create unknown text
    EventSet unknown1 = new EventSet();

    unknown1.addEvent(new Event("mary", null));
    unknown1.addEvent(new Event("had", null));
    unknown1.addEvent(new Event("a", null));
    unknown1.addEvent(new Event("little", null));
    unknown1.addEvent(new Event("beta", null));

    Document unknownDocument = new Document();
    unknownDocument.addEventSet(null, unknown1);

    //Classify unknown based on the knowns
    WEKAJ48DecisionTree tree = new WEKAJ48DecisionTree();
    List<List<Pair<String, Double>>> t = new ArrayList<List<Pair<String,Double>>>();
    tree.train(knowns);
    t.add(tree.analyze(unknownDocument));
    System.out.println(t.toString());


      //Assert that the authors match
      assertTrue(t.get(0).get(0).getFirst().equals("Mary"));
   
   
    //Test 2 - Add in third known author

    EventSet known5 = new EventSet();
    EventSet known6 = new EventSet();
   
    known5.addEvent(new Event("she", null));
    known5.addEvent(new Event("sells", null));
    known5.addEvent(new Event("seashells", null));
    known5.addEvent(new Event("by", null));
    known5.addEvent(new Event("seashore", null));
    //known5.setAuthor("Susie");

    known6.addEvent(new Event("susie", null));
    known6.addEvent(new Event("sells", null));
    known6.addEvent(new Event("shells", null));
    known6.addEvent(new Event("by", null));
    known6.addEvent(new Event("seashore", null));
    //known6.setAuthor("Susie");

    Document knownDocument5 = new Document();
    knownDocument5.setAuthor("Susie");
    knownDocument5.addEventSet(null, known5);
    knowns.add(knownDocument5);
    Document knownDocument6 = new Document();
    knownDocument6.setAuthor("Susie");
    knownDocument6.addEventSet(null, known6);
    knowns.add(knownDocument6);

    t = new ArrayList<List<Pair<String,Double>>>();
    tree.train(knowns);
    t.add(tree.analyze(unknownDocument));
    System.out.println(t.toString());
    assertTrue(t.get(0).get(0).getFirst().equals("Mary"));



    //Test 3 - Add in another unknown

    EventSet unknown2 = new EventSet();

    unknown2.addEvent(new Event("peter", null));
    unknown2.addEvent(new Event("piper", null));
    unknown2.addEvent(new Event("picked", null));
    unknown2.addEvent(new Event("a", null));
    unknown2.addEvent(new Event("shells", null));

    Document unknownDocument2 = new Document();
    unknownDocument2.addEventSet(null, unknown2);

    t = new ArrayList<List<Pair<String,Double>>>();
    tree.train(knowns);
    t.add(tree.analyze(unknownDocument));
    t.add(tree.analyze(unknownDocument2));
View Full Code Here

TOP

Related Classes of com.jgaap.util.Document

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.