Package org.apache.nutch.net

Examples of org.apache.nutch.net.RegexUrlNormalizer.normalize()


  private void normalizeTest(String weird, String normal) throws Exception {
    String testSrcDir = System.getProperty("test.src.dir");
    String path = testSrcDir + "/org/apache/nutch/net/test-regex-normalize.xml";
    RegexUrlNormalizer normalizer = new RegexUrlNormalizer(path);
    assertEquals(normal, normalizer.normalize(weird));
  }
 
  public static void main(String[] args) throws Exception {
    new TestRegexUrlNormalizer("test").testNormalizer();
    new TestBasicUrlNormalizer("test").testNormalizer(); // need to make sure it passes this test too
View Full Code Here


  private void normalizeTest(String weird, String normal) throws Exception {
    String testSrcDir = System.getProperty("test.src.dir");
    String path = testSrcDir + "/org/apache/nutch/net/test-regex-normalize.xml";
    RegexUrlNormalizer normalizer = new RegexUrlNormalizer(path);
    assertEquals(normal, normalizer.normalize(weird));
  }
 
  public static void main(String[] args) throws Exception {
    new TestRegexUrlNormalizer("test").testNormalizer();
    new TestBasicUrlNormalizer("test").testNormalizer(); // need to make sure it passes this test too
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc., and is owned by Oracle Inc. Contact coftware#gmail.com.