Package org.apache.lucene.index

Examples of org.apache.lucene.index.IndexReader.maxDoc()


                int numUpdates = 0;
                int numRemovals = 0;
                int numNew = 0;
                try {
                    IndexReader ir = IndexReader.open(di.getIndexPath());
                    int numDocs = ir.maxDoc();
                    ds.setStatus("There are " + numDocs + " docs in index " + di.getDescription() + "(" + di.getPath() + ")");
                    addHeader(di.getDescription());
                    //ArrayList<String> allDocsInIndexx = new ArrayList<String>(); // indexed files
                    // ArrayList allDocsInFolder = new ArrayList(); // current files
                    // ArrayList newDocsToAdd = new ArrayList(); // files to be added that are new
View Full Code Here


        int totalDocumentsFound = 0;
        int minDocsFound = documents / (2 * numIndexers);
        for (String tmpDir: tmpDirs) {
            String sep = java.io.File.separator;
            IndexReader reader = IndexReader.open(tmpDir + sep + "indexer" + sep + "indexes" + sep + "index");
            int docsFound = reader.maxDoc();
            reader.close();
            assertTrue("too few documents indexed. Found " + docsFound + ", expected at least" +minDocsFound , docsFound > minDocsFound);
            totalDocumentsFound += docsFound;
        }

View Full Code Here

      
        // check that every index is empty
        for (String tmpDir: tmpDirs) {
            String sep = java.io.File.separator;
            IndexReader reader = IndexReader.open(tmpDir + sep + "indexer" + sep + "indexes" + sep + "index");
            assertEquals("indexed " + reader.maxDoc() + " documents on mixed indexer. Mixed indexers should not index anything.",0,reader.maxDoc());
            reader.close();
        }
    }

    @TestInfo(testType = TestInfo.TestType.UNIT
View Full Code Here

      
        // check that every index is empty
        for (String tmpDir: tmpDirs) {
            String sep = java.io.File.separator;
            IndexReader reader = IndexReader.open(tmpDir + sep + "indexer" + sep + "indexes" + sep + "index");
            assertEquals("indexed " + reader.maxDoc() + " documents on mixed indexer. Mixed indexers should not index anything.",0,reader.maxDoc());
            reader.close();
        }
    }

    @TestInfo(testType = TestInfo.TestType.UNIT
View Full Code Here

      do {
        Term term = te.term();
        if (term == null || !term.field().equals(contentField)) {
          break;
        }
        OpenBitSet termBitset = new OpenBitSet(reader.maxDoc());

        // Generate bitset for the term
        TermDocs termDocs = reader.termDocs(term);

        while (termDocs.next()) {
View Full Code Here

      FetcherOutput fo = new FetcherOutput();
      Content co = new Content();
      ParseText pt = new ParseText();
      ParseData pd = new ParseData();
      int outputCnt = 0;
      for (int n = 0; n < ir.maxDoc(); n++) {
        if (ir.isDeleted(n)) {
          //System.out.println("-del");
          continue;
        }
        Document doc = ir.document(n);
View Full Code Here

  /** Delete pages without CC licenses. */
  public int deleteUnlicensed() throws IOException {
    int deleteCount = 0;
    for (int index = 0; index < readers.length; index++) {
      IndexReader reader = readers[index];
      int readerMax = reader.maxDoc();
      for (int doc = 0; doc < readerMax; doc++) {
        if (!reader.isDeleted(doc)) {
          Document document = reader.document(doc);
          if (document.get(CCIndexingFilter.FIELD)==null){ // no CC fields
            reader.delete(doc);                   // delete it
View Full Code Here

    for (int i = 0; i < directories.length; i++) {
      File indexDone = new File(directories[i], IndexSegment.DONE_NAME);
      if (indexDone.exists() && indexDone.isFile()){
        File indexDir = new File(directories[i], "index");
        IndexReader reader = IndexReader.open(indexDir);
        maxDoc += reader.maxDoc();
        vReaders.add(reader);
      }
    }

    IndexReader[] readers=new IndexReader[vReaders.size()];
View Full Code Here

    SequenceFile.Writer writer =
      new SequenceFile.Writer(new LocalFileSystem(), tempFile.getPath(), IndexedDoc.class, NullWritable.class);
    try {
      for (int index = 0; index < readers.length; index++) {
        IndexReader reader = readers[index];
        int readerMax = reader.maxDoc();
        indexedDoc.index = index;
        for (int doc = 0; doc < readerMax; doc++) {
          if (!reader.isDeleted(doc)) {
            Document document = reader.document(doc);
            hasher.updateHash(indexedDoc.hash, document);
View Full Code Here

                IndexReader reader = IndexReader.open(localIndexDir);
                if (reader.hasDeletions()) {
                    LOG.info("Clearing old deletions in " + indexDir + "(" + localIndexDir + ")");
                    reader.undeleteAll();
                }
                maxDoc += reader.maxDoc();
                vReaders.add(reader);
            }
        }

        //
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.