Examples of org.apache.lucene.analysis.CharArraySet$UnmodifiableCharArraySet

org.apache.lucene.analysis.CharArraySet
Efficient unmodifiable {@link CharArraySet}. This implementation does not delegate calls to a given {@link CharArraySet} like {@link Collections#unmodifiableSet(java.util.Set)} does. Instead, it passes the internal representation of a {@link CharArraySet} to a super constructor and overrides all mutators.

    private TermAttribute termAtt;
    
    public ChineseFilter(TokenStream in) {
        super(in);


        stopTable = new CharArraySet(Arrays.asList(STOP_WORDS), false);
        termAtt = addAttribute(TermAttribute.class);
    }

View Full Code Here


  public void setArticles(Set<?> articles) {
    if (articles instanceof CharArraySet)
      this.articles = (CharArraySet) articles;
    else
      this.articles = new CharArraySet(articles, true);
  }

View Full Code Here

  /**
   * Constructs an elision filter with standard stop words
   */
  protected ElisionFilter(TokenStream input) {
    super(input);
    this.articles = new CharArraySet(Arrays.asList(
        "l", "m", "t", "qu", "n", "s", "j"), true);
    termAtt = addAttribute(TermAttribute.class);
  }

View Full Code Here

  /**
   * Constructs an elision filter with an array of stop words
   */
  public ElisionFilter(TokenStream input, String[] articles) {
    super(input);
    this.articles = new CharArraySet(Arrays.asList(articles), true);
    termAtt = addAttribute(TermAttribute.class);
  }

View Full Code Here

    this.onlyLongestMatch=onlyLongestMatch;
    
    if (dictionary instanceof CharArraySet) {
      this.dictionary = (CharArraySet) dictionary;
    } else {
      this.dictionary = new CharArraySet(dictionary.size(), false);
      addAllLowerCase(this.dictionary, dictionary);
    }
    
    termAtt = addAttribute(TermAttribute.class);
    offsetAtt = addAttribute(OffsetAttribute.class);

View Full Code Here

   * @param dictionary 
   * @return {@link Set} of lowercased terms 
   */
  public static final Set makeDictionary(final String[] dictionary) {
    // is the below really case insensitive? 
    CharArraySet dict = new CharArraySet(dictionary.length, false);
    addAllLowerCase(dict, Arrays.asList(dictionary));
    return dict;
  }

View Full Code Here

        stopWords = getWordSet(loader, stopWordFiles, ignoreCase);
      } catch (IOException e) {
        throw new RuntimeException(e);
      }
    } else {
      stopWords = new CharArraySet(luceneMatchVersion, StopAnalyzer.ENGLISH_STOP_WORDS_SET, ignoreCase);
    }
  }

View Full Code Here

        stopWords = getWordSet(loader, stopWordFiles, ignoreCase);
      } catch (IOException e) {
        throw new RuntimeException(e);
      }
    } else {
      stopWords = new CharArraySet(luceneMatchVersion, StopAnalyzer.ENGLISH_STOP_WORDS_SET, ignoreCase);
    }
  }

View Full Code Here

  /**
   * Set the keep word list.
   * NOTE: if ignoreCase==true, the words are expected to be lowercase
   */
  public void setWords(Set<String> words) {
    this.words = new CharArraySet(luceneMatchVersion, words, ignoreCase);
  }

View Full Code Here

    this.words = new CharArraySet(luceneMatchVersion, words, ignoreCase);
  }


  public void setIgnoreCase(boolean ignoreCase) {    
    if (words != null && this.ignoreCase != ignoreCase) {
      words = new CharArraySet(luceneMatchVersion, words, ignoreCase);
    }
    this.ignoreCase = ignoreCase;
  }

View Full Code Here

0 1 2 3 4 5 6 7 8 9

TOP

Related Classes of org.apache.lucene.analysis.CharArraySet$UnmodifiableCharArraySet

com.github.le11.nls.lucene.TypeAwareStopFilter

com.github.le11.nls.solr.TypeAwareStopFilterFactory

de.jetwick.solrplugin.TWordDelimiterFilterFactory

edu.wiki.index.WikipediaAnalyzer

org.apache.lucene.analysis.ar.TestArabicAnalyzer

org.apache.lucene.analysis.ar.TestArabicStemFilter

org.apache.lucene.analysis.bg.TestBulgarianAnalyzer

org.apache.lucene.analysis.bg.TestBulgarianStemmer

org.apache.lucene.analysis.br.TestBrazilianStemmer

org.apache.lucene.analysis.ca.TestCatalanAnalyzer

All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle, Inc. Contact coftware#gmail.com.