Package opennlp.tools.namefind

Source Code of opennlp.tools.namefind.DictionaryNameFinderTest

/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/


package opennlp.tools.namefind;

import static org.junit.Assert.assertTrue;
import opennlp.tools.dictionary.Dictionary;
import opennlp.tools.tokenize.SimpleTokenizer;
import opennlp.tools.util.Span;
import opennlp.tools.util.StringList;

import org.junit.Before;
import org.junit.Test;

/**
  *Tests for the {@link DictionaryNameFinder} class.
  */
public class DictionaryNameFinderTest{

  private Dictionary mDictionary = new Dictionary();
  private TokenNameFinder mNameFinder;

  public DictionaryNameFinderTest() {

    StringList vanessa = new StringList(new String[]{"Vanessa"});
    mDictionary.put(vanessa);

    StringList vanessaWilliams = new
        StringList(new String[]{"Vanessa",
        "Williams"});
    mDictionary.put(vanessaWilliams);

    StringList max = new StringList(new String[]{"Max"});
    mDictionary.put(max);

    StringList michaelJordan = new
        StringList(new String[]{"Michael", "Jordan"});
    mDictionary.put(michaelJordan);
  }

  @Before
  public void setUp() throws Exception {
    mNameFinder = new DictionaryNameFinder(mDictionary);
  }

  @Test
  public void testSingleTokeNameAtSentenceStart() {

    String sentence = "Max a b c d";

    SimpleTokenizer tokenizer = SimpleTokenizer.INSTANCE;
    String tokens[] = tokenizer.tokenize(sentence);

    Span names[] = mNameFinder.find(tokens);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 0 && names[0].getEnd() == 1);
  }

  @Test
  public void testSingleTokeNameInsideSentence() {
    String sentence = "a b  Max c d";

    SimpleTokenizer tokenizer = SimpleTokenizer.INSTANCE;
    String tokens[] = tokenizer.tokenize(sentence);

    Span names[] = mNameFinder.find(tokens);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 2 && names[0].getEnd() == 3);
  }

  @Test
  public void testSingleTokeNameAtSentenceEnd() {
    String sentence = "a b c Max";

    SimpleTokenizer tokenizer = SimpleTokenizer.INSTANCE;
    String tokens[] = tokenizer.tokenize(sentence);

    Span names[] = mNameFinder.find(tokens);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 3 && names[0].getEnd() == 4);
  }

  @Test
  public void testLastMatchingTokenNameIsChoosen() {
    String sentence[] = {"a", "b", "c", "Vanessa"};

    Span names[] = mNameFinder.find(sentence);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 3 && names[0].getEnd() == 4);
  }

  @Test
  public void testLongerTokenNameIsPreferred() {
    String sentence[] = {"a", "b", "c", "Vanessa", "Williams"};

    Span names[] = mNameFinder.find(sentence);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 3 && names[0].getEnd() == 5);
  }

  @Test
  public void testCaseSensitivity() {
    String sentence[] = {"a", "b", "c", "vanessa", "williams"};

    Span names[] = mNameFinder.find(sentence);

    assertTrue(names.length == 1);
    assertTrue(names[0].getStart() == 3 && names[0].getEnd() == 5);
  }

  @Test
  public void testCaseLongerEntry() {
    String sentence[] = {"a", "b", "michael", "jordan"};

    Span names[] = mNameFinder.find(sentence);

    assertTrue(names.length == 1);
    assertTrue(names[0].length() == 2);
  }
}
TOP

Related Classes of opennlp.tools.namefind.DictionaryNameFinderTest

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.