Examples of EnwikiDocMaker


Examples of org.apache.lucene.benchmark.byTask.feeds.EnwikiDocMaker

      } else if (arg.equals("--discardImageOnlyDocs") || arg.equals("-d")) {
        keepImageOnlyDocs = false;
      }

    }
    DocMaker docMaker = new EnwikiDocMaker();
    Properties properties = new Properties();

    properties.setProperty("docs.file", wikipedia.getAbsolutePath());
    properties.setProperty("doc.maker.forever", "false");
    properties.setProperty("keep.image.only.docs", String.valueOf(keepImageOnlyDocs));
    docMaker.setConfig(new Config(properties));
    docMaker.resetInputs();
    if (wikipedia != null && wikipedia.exists()) {
      System.out.println("Extracting Wikipedia to: " + outputDir + " using EnwikiDocMaker");
      outputDir.mkdirs();
      ExtractWikipedia extractor = new ExtractWikipedia(docMaker, outputDir);
      extractor.extract();
View Full Code Here

Examples of org.apache.lucene.benchmark.byTask.feeds.EnwikiDocMaker

      } else if (arg.equals("--discardImageOnlyDocs") || arg.equals("-d")) {
        keepImageOnlyDocs = false;
      }

    }
    DocMaker docMaker = new EnwikiDocMaker();
    Properties properties = new Properties();

    properties.setProperty("docs.file", wikipedia.getAbsolutePath());
    properties.setProperty("content.source.forever", "false");
    properties.setProperty("keep.image.only.docs", String.valueOf(keepImageOnlyDocs));
    docMaker.setConfig(new Config(properties));
    docMaker.resetInputs();
    if (wikipedia != null && wikipedia.exists()) {
      System.out.println("Extracting Wikipedia to: " + outputDir + " using EnwikiDocMaker");
      outputDir.mkdirs();
      ExtractWikipedia extractor = new ExtractWikipedia(docMaker, outputDir);
      extractor.extract();
View Full Code Here
TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.