Package opennlp.tools.tokenize

Examples of opennlp.tools.tokenize.TokenizerModel


    return model;
  }

  @Override
  protected TokenizerModel loadModel(InputStream in) throws IOException {
    return new TokenizerModel(in);
  }
View Full Code Here


    EvaluatorParams params = ArgumentParser.parse(args,
        EvaluatorParams.class);

    Charset encoding = params.getEncoding();

    TokenizerModel model = new TokenizerModelLoader().load(params.getModel());

    TokenizerEvaluationMonitor missclassifiedListener = null;
    if (params.getMisclassified()) {
      missclassifiedListener = new TokenEvaluationErrorListener();
    }
View Full Code Here

    if (args.length != 1) {
      System.out.println(getHelp());
      throw new TerminateToolException(1);
    }
   
    TokenizerModel model = new TokenizerModelLoader().load(new File(args[0]));
   
    CommandLineTokenizer tokenizer =
      new CommandLineTokenizer(new opennlp.tools.tokenize.TokenizerME(model));
   
    tokenizer.process();
View Full Code Here

 
  /**
   * @return tokenizer model
   */
  public TokenizerModel tokModel() {
    TokenizerModel model = null;
    try {
      /* Load the tokenization model from file */
      InputStream modelIn = this.getClass().getClassLoader().getResourceAsStream("en-token.bin");
      model = new TokenizerModel(modelIn);
      return model;
    }
    catch (Exception e) {
      e.printStackTrace();
    }
View Full Code Here

  public ObjectStream<NameSample> create(String[] args) {

    Parameters params = ArgumentParser.parse(args, Parameters.class);

    TokenizerModel tokenizerModel = new TokenizerModelLoader().load(params.getTokenizerModel());
    Tokenizer tokenizer = new TokenizerME(tokenizerModel);

    ObjectStream<String> mucDocStream = new FileToStringSampleStream(
        new DirectorySampleStream(params.getData(), new FileFilter() {
View Full Code Here

    }

    File modelOutFile = params.getModel();
    CmdLineUtil.checkOutputFile("tokenizer model", modelOutFile);

    TokenizerModel model;
    try {
      Dictionary dict = loadDict(params.getAbbDict());

      TokenizerFactory tokFactory = TokenizerFactory.create(
          params.getFactory(), params.getLang(), dict,
View Full Code Here

    super("Tokenizer");
  }
 
  @Override
  protected TokenizerModel loadModel(InputStream modelIn) throws IOException {
    return new TokenizerModel(modelIn);
  }
View Full Code Here

  }
 
  public void run(String format, String[] args) {
    super.run(format, args);

    TokenizerModel model = new TokenizerModelLoader().load(params.getModel());

    TokenizerEvaluationMonitor misclassifiedListener = null;
    if (params.getMisclassified()) {
      misclassifiedListener = new TokenEvaluationErrorListener();
    }
View Full Code Here

  public void run(String[] args) {
    if (args.length != 1) {
      System.out.println(getHelp());
    } else {
   
      TokenizerModel model = new TokenizerModelLoader().load(new File(args[0]));

      CommandLineTokenizer tokenizer =
        new CommandLineTokenizer(new opennlp.tools.tokenize.TokenizerME(model));

      tokenizer.process();
View Full Code Here

    Parameters params = ArgumentParser.parse(args, Parameters.class);
   
    ParserModel parserModel = new ParserModelLoader().load(params.getParserModel());
    Parser parser =  ParserFactory.create(parserModel);
   
    TokenizerModel tokenizerModel = new TokenizerModelLoader().load(params.getTokenizerModel());
    Tokenizer tokenizer = new TokenizerME(tokenizerModel);
   
    ObjectStream<String> mucDocStream = new FileToStringSampleStream(
        new DirectorySampleStream(params.getData(), new FileFilter() {
         
View Full Code Here

TOP

Related Classes of opennlp.tools.tokenize.TokenizerModel

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.