Package org.apache.ctakes.typesystem.type.syntax

Examples of org.apache.ctakes.typesystem.type.syntax.WordToken


//        }
       
        String oldSystemTokenClass = oldSystemToken.getClass().getName();
        if (oldSystemTokenClass.equals(WordToken.class.getName()))
        {
          newGoldToken = new WordToken(goldView, oldSystemToken.getBegin(), oldSystemToken.getEnd());
        } else if (oldSystemTokenClass.equals(ContractionToken.class.getName()))
        {
          newGoldToken = new ContractionToken(goldView, oldSystemToken.getBegin(), oldSystemToken.getEnd());
        } else if (oldSystemTokenClass.equals(NewlineToken.class.getName()))
        {
View Full Code Here


   * @return
   */
 
  private boolean isAdjacentWithStopWords(JCas jcas, Annotation prevAnn, Annotation currAnn)
  {
    WordToken prevWta = getLastToken(prevAnn);
    WordToken currWta = getFirstToken(currAnn);
   
    if(prevWta == null || currWta == null)
      return false;
   
    if(prevWta.getTokenNumber() == (currWta.getTokenNumber() - 1))
      return true;
   
    List<WordToken> containedWTAs = getContainedWordTokens(jcas, prevWta, currWta);
    for(int i=0; i<containedWTAs.size(); i++)
    {
      WordToken tempWta = containedWTAs.get(i);
      if(stopWords.contains(tempWta.getCoveredText()))
          continue;
      else
        return false;
    }
   
View Full Code Here

    JFSIndexRepository indexes = jcas.getJFSIndexRepository();
    Iterator<?> annotItr = indexes.getAnnotationIndex(WordToken.type).iterator();

    while (annotItr.hasNext())
    {
      WordToken wta = (WordToken)annotItr.next();
      if(wta.getBegin() >= prevWta.getEnd() && wta.getEnd() <= currWta.getBegin())
        list.add(wta);
    }
   
    return list;
  }
View Full Code Here

    return l;
  }
 
  private WordToken getFirstToken(Annotation ann)
  {
    WordToken wta = null;
   
    if(ann instanceof PADLocation)
    {
      FSArray fsa = (((PADLocation)ann).getRelatedTokens());
     
View Full Code Here

    return wta;
  }

  private WordToken getLastToken(Annotation ann)
  {
    WordToken wta = null;

    if(ann instanceof PADLocation)
    {
      FSArray fsa = (((PADLocation)ann).getRelatedTokens());
     
View Full Code Here

        .iterator();
    List<String> unigrams = new ArrayList<String>();
    List bigrams = new ArrayList();

    while (wordTokenItr.hasNext()) {
      WordToken token = (WordToken) wordTokenItr.next();
      String tok = token.getCoveredText();

      if (tok == null)
        continue;
      if (!caseSensitive)
        tok = tok.toLowerCase();
View Full Code Here

   * @param obj
   * @return
   */
  private BaseToken adaptToBaseToken(org.apache.ctakes.typesystem.type.syntax.BaseToken obj) throws Exception {
    if (obj instanceof WordToken) {
      WordToken wta = (WordToken) obj;
      return new WordTokenAdapter(wta);
    } else if (obj instanceof NumToken) {
      NumToken nta = (NumToken) obj;
      if (nta.getNumType() == TokenizerAnnotator.TOKEN_NUM_TYPE_INTEGER) {
        return new IntegerTokenAdapter(nta);
View Full Code Here

          sent.setSentenceNumber(sentNum);
        }
        sentNum++;
        sent.addToIndexes();
        for (int j=0; j < tokenArrays[i].length; j++) {
          WordToken tok = new WordToken(jcas);
          LineAndTokenPosition word = new LineAndTokenPosition();
          word.setLine(i+1);
          word.setTokenOffset(j);
          LineTokenToCharacterOffsetConverter.BeginAndEndCharacterOffsetPair tPos = converter.convert(word);
          if (tPos == null) {
            tok.setBegin(0);
            tok.setEnd(1);
          } else {
            tok.setBegin(tPos.getBegin());
            tok.setEnd(tPos.getEnd() + 1);
          }
          tok.setTokenNumber(tokNum);
          tokNum++; 
          tok.addToIndexes();
        }
      }
      logger.info("before assertions");
      for (Annotation a : assertions) {
        logger.info("  begin assertion");
View Full Code Here

      throws AnalysisEngineProcessException {
    JFSIndexRepository indexes = jcas.getJFSIndexRepository();
    Iterator wordItr = indexes.getAnnotationIndex(WordToken.type)
        .iterator();
    while (wordItr.hasNext()) {
      WordToken wordAnnotation = (WordToken) wordItr.next();
      if (wordAnnotation.getBegin() >= rangeBegin
          && wordAnnotation.getEnd() <= rangeEnd) {
        String word = text.substring(wordAnnotation.getBegin(),
            wordAnnotation.getEnd());

        // if the original word was misspelled, use the spell correction
        String suggestion = wordAnnotation.getSuggestion();

        if ((suggestion != null) && (suggestion.length() > 0)) {
          word = suggestion;
        }
View Full Code Here

  }

  private BaseToken adaptToBaseToken(org.apache.ctakes.typesystem.type.syntax.BaseToken bta)
      throws Exception {
    if (bta instanceof WordToken) {
      WordToken wta = (WordToken) bta;
      return new WordTokenAdapter(wta);
    } else if (bta instanceof NumToken) {
      NumToken nta = (NumToken) bta;
      if (nta.getNumType() == TokenizerAnnotator.TOKEN_NUM_TYPE_INTEGER) {
        return new IntegerTokenAdapter(nta);
View Full Code Here

TOP

Related Classes of org.apache.ctakes.typesystem.type.syntax.WordToken

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.