Package org.apache.ctakes.dictionary.lookup.vo

Examples of org.apache.ctakes.dictionary.lookup.vo.LookupToken


        Map ltEndOffsetMap = getEndOffsetMap(ltList, true);

        List lhList = new ArrayList();
        for (int ltIdx = 0; ltIdx < ltList.size(); ltIdx++)
        {
            LookupToken lt = (LookupToken) ltList.get(ltIdx);

            Boolean useForLookup = Boolean.valueOf(lt.getStringAttribute(LT_KEY_USE_FOR_LOOKUP));

            if ((useForLookup == null) || (useForLookup.booleanValue()))
            {
                Collection mdhCol = getFirstTokenHits(lt);

                if ((mdhCol != null) && (mdhCol.size() > 0))
                {
                    int wEndOffset = -1;
                    if (useWindowAnnots)
                    {
                        // get the largest overlapping window annotation
                        LookupAnnotation wAnnot = getLargestWindowAnnotation(
                                ltIdx,
                                lt,
                                ltStartOffsetMap,
                                ltEndOffsetMap,
                                ltListIndexMap,
                                wStartOffsetMap,
                                wEndOffsetMap);
                        if (wAnnot != null)
                        {
                            wEndOffset = wAnnot.getEndOffset();
                        }
                    }
                    if (wEndOffset == -1)
                    {
                        iv_logger.debug("Window size set to max perm level.");
                        wEndOffset = getFixedWindowEndOffset(ltIdx, lt, ltList);
                    }

                    List endLookupTokenList = getLookupTokenList(
                            wEndOffset,
                            ltEndOffsetMap,
                            false);
                    LookupToken endLookupToken = (LookupToken) endLookupTokenList.get(endLookupTokenList.size() - 1);

                    int startTokenIdx = ltIdx;
                    int endTokenIdx = ((Integer) ltListIndexMap.get(endLookupToken)).intValue();

                    // list of LookupToken objects bound by the window
View Full Code Here


                    }
                }
            }
        }

        LookupToken firstWordLookupToken = (LookupToken) wLookupTokenList.get(firstTokenIndex.intValue());

        Iterator permItr = permCol.iterator();
        while (permItr.hasNext())
        {
            // convert permutation idx back into LookupTokens
            List tempList = new ArrayList();
            List permutation = (List) permItr.next();
            Iterator idxItr = permutation.iterator();
            while (idxItr.hasNext())
            {
                int idx = ((Integer) idxItr.next()).intValue();
                if (idx <= firstTokenIndex.intValue())
                {
                    idx--;
                }
                LookupToken lt = (LookupToken) wLookupTokenList.get(idx);
                tempList.add(lt);
            }

            List singleTokenList = new ArrayList();
            singleTokenList.add(firstWordLookupToken);
            String[] fwPerms = iv_phrBuilder.getPhrases(singleTokenList);

            String[] phrArr = iv_phrBuilder.getPhrases(tempList);
            for (int i = 0; i < phrArr.length; i++)
            {
                for (int fwPermIdx = 0; fwPermIdx < fwPerms.length; fwPermIdx++)
                {
                    StringBuffer phraseSB = new StringBuffer();
                    phraseSB.append(fwPerms[fwPermIdx]);
                    phraseSB.append(' ');
                    phraseSB.append(phrArr[i]);
                    String phrase = phraseSB.toString().trim().toLowerCase();
                    Set mdhSet = (Set) mdhMap.get(phrase);
                    if (mdhSet != null)
                    {
                        Iterator mdhIterator = mdhSet.iterator();
                        while (mdhIterator.hasNext())
                        {
                            MetaDataHit mdh = (MetaDataHit) mdhIterator.next();
                            // figure out start and end offsets
                            Collections.sort(permutation);

                            int startOffset;
                            if (permutation.size() > 0)
                            {
                                int firstIdx = ((Integer) permutation.get(0)).intValue();
                                if (firstIdx <= firstTokenIndex.intValue())
                                {
                                    firstIdx--;
                                }
                                LookupToken lt = (LookupToken) wLookupTokenList.get(firstIdx);
                                if (lt.getStartOffset() < firstWordLookupToken.getStartOffset())
                                {
                                    startOffset = lt.getStartOffset();
                                }
                                else
                                {
                                    startOffset = firstWordLookupToken.getStartOffset();
                                }
                            }
                            else
                            {
                                startOffset = firstWordLookupToken.getStartOffset();
                            }

                            int endOffset;
                            if (permutation.size() > 0)
                            {
                                int lastIdx = ((Integer) permutation.get(permutation.size() - 1)).intValue();
                                if (lastIdx <= firstTokenIndex.intValue())
                                {
                                    lastIdx--;
                                }
                                LookupToken lt = (LookupToken) wLookupTokenList.get(lastIdx);
                                if (lt.getEndOffset() > firstWordLookupToken.getEndOffset())
                                {
                                    endOffset = lt.getEndOffset();
                                }
                                else
                                {
                                    endOffset = firstWordLookupToken.getEndOffset();
                                }
View Full Code Here

        if ((startLookupTokenList == null) || (endLookupTokenList == null))
        {
            iv_logger.debug("Invalid window:" + startOffset + "," + endOffset);
            return -1;
        }
        LookupToken startLookupToken = (LookupToken) startLookupTokenList.get(0);
        Integer startIdx = (Integer) ltListIndexMap.get(startLookupToken);

        LookupToken endLookupToken = (LookupToken) endLookupTokenList.get(endLookupTokenList.size() - 1);
        Integer endIdx = (Integer) ltListIndexMap.get(endLookupToken);

        return endIdx.intValue() - startIdx.intValue() + 1;
    }
View Full Code Here

        int fixedEndOffset = 0;

        for (int i = tokenIdx; (i < tokenIdx + iv_maxPermutationLevel)
                && (i < ltList.size()); i++)
        {
            LookupToken tempLookupToken = (LookupToken) ltList.get(i);
            if (tempLookupToken != null)
            {
                fixedEndOffset = tempLookupToken.getEndOffset();
            }
        }
        return fixedEndOffset;
    }
View Full Code Here

    public Collection lookup(List ltList, Map ctxMap) throws Exception
    {
        List lhList = new ArrayList();
        for (int tokenIdx = 0; tokenIdx < ltList.size(); tokenIdx++)
        {
            LookupToken lt = (LookupToken) ltList.get(tokenIdx);

            List singleLtList = new ArrayList();
            singleLtList.add(lt);

            String[] strArr = iv_phrBuilder.getPhrases(singleLtList);
            Collection mdhCol = getHits(strArr);

            if ((mdhCol != null) && (mdhCol.size() > 0))
            {
                Iterator mdhMatchItr = mdhCol.iterator();
                while (mdhMatchItr.hasNext())
                {
                    MetaDataHit mdh = (MetaDataHit) mdhMatchItr.next();
                    LookupHit lh = new LookupHit(mdh, lt.getStartOffset(), lt
                            .getEndOffset());
                    lhList.add(lh);
                }
            }
        }
View Full Code Here

      if (!((bta instanceof NewlineToken)
          || (bta instanceof PunctuationToken)
          || (bta instanceof ContractionToken)
          || (bta instanceof SymbolToken)))
      {
        LookupToken lt = new LookupAnnotationToJCasAdapter(bta);

        if (bta instanceof WordToken)
        {
          WordToken wta = (WordToken) bta;
          String canonicalForm = wta.getCanonicalForm();
          if (canonicalForm != null)
          {
            lt.addStringAttribute(
                CANONICAL_VARIANT_ATTR,
                canonicalForm);
          }
        }
View Full Code Here

        while (teItr.hasNext())
        {
            TextExtractor te = (TextExtractor) teItr.next();

            StringBuffer sb = new StringBuffer();
            LookupToken previousLt = null;
            Iterator ltItr = lookupTokenList.iterator();
            while (ltItr.hasNext())
            {
                LookupToken lt = (LookupToken) ltItr.next();
                String variant = te.getText(lt);

                if (variant == null)
                {
                    variant = lt.getText();
                }

                if (previousLt != null)
                {
                    // check delta between previous token and current token
                    // this delta represents whitespace between tokens
                    if (previousLt.getEndOffset() != lt.getStartOffset())
                    {
                        // insert whitespace
                        sb.append(' ');
                    }
                }
View Full Code Here

      if (!((bta instanceof NewlineToken)
          || (bta instanceof PunctuationToken)
          || (bta instanceof ContractionToken)
          || (bta instanceof SymbolToken)))
      {
        LookupToken lt = new LookupAnnotationToJCasAdapter(bta);

        // POS exclusion logic for first word lookup
        if (isTagExcluded(bta.getPartOfSpeech()))
        {
          lt.addStringAttribute(
              FirstTokenPermutationImpl.LT_KEY_USE_FOR_LOOKUP,
              "false");
        }
        else
        {
          lt.addStringAttribute(
              FirstTokenPermutationImpl.LT_KEY_USE_FOR_LOOKUP,
              "true");
        }

        if (bta instanceof WordToken)
        {
          WordToken wta = (WordToken) bta;
          String canonicalForm = wta.getCanonicalForm();
          if (canonicalForm != null)
          {
            lt.addStringAttribute(CANONICAL_VARIANT_ATTR, canonicalForm);
          }
        }

        ltList.add(lt);
      }
View Full Code Here

  {
    List ltObjectList = new ArrayList();

    while (lookupTokenItr.hasNext())
    {
      LookupToken lt = (LookupToken) lookupTokenItr.next();

      // only consider if it's within the window
      if ((lt.getStartOffset() >= window.getBegin())
          && (lt.getEndOffset() <= window.getEnd()))
      {
        ltObjectList.add(lt);
      }
    }
    return ltObjectList;
View Full Code Here

  {
    List<LookupToken> ltObjectList = new ArrayList<>();

    while (lookupTokenItr.hasNext())
    {
      LookupToken lt = lookupTokenItr.next();

      // only consider if it's within the window
      if ((lt.getStartOffset() >= window.getBegin())
          && (lt.getEndOffset() <= window.getEnd()))
      {
        ltObjectList.add(lt);
      }
    }
    return ltObjectList;
View Full Code Here

TOP

Related Classes of org.apache.ctakes.dictionary.lookup.vo.LookupToken

Copyright © 2018 www.massapicom. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.