Package org.apache.tika.parser

Examples of org.apache.tika.parser.CompositeParser


        }
        if (parsers.isEmpty()) {
            return getDefaultParser(mimeTypes, loader);
        } else {
            MediaTypeRegistry registry = mimeTypes.getMediaTypeRegistry();
            return new CompositeParser(registry, parsers);
        }
    }
View Full Code Here


public class TextExtractionService implements InitializingBean {

    private static Logger logger = org.slf4j.LoggerFactory.getLogger(TextExtractionService.class);

    private static CompositeParser configureParser(Resource config, boolean autoDetectType) {
        CompositeParser parser = null;
        InputStream stream = null;
        try {
            stream = config.getInputStream();
            if (autoDetectType) {
                parser = new AutoDetectParser(new TikaConfig(stream));
View Full Code Here

                throw new TikaException(
                        "Unable to instantiate a parser class: " + name, e);
            }
        }
        this.parser =
            new CompositeParser(mimeTypes.getMediaTypeRegistry(), parsers);
    }
View Full Code Here

            } catch (InstantiationException e) {
                throw new TikaException(
                        "Unable to instantiate a parser class: " + name, e);
            }
        }
        return new CompositeParser(mimeTypes.getMediaTypeRegistry(), parsers);
    }
View Full Code Here

        }
        if (parsers.isEmpty()) {
            return getDefaultParser(mimeTypes, loader);
        } else {
            MediaTypeRegistry registry = mimeTypes.getMediaTypeRegistry();
            return new CompositeParser(registry, parsers);
        }
    }
View Full Code Here

            } catch (InstantiationException e) {
                throw new TikaException(
                        "Unable to instantiate a parser class: " + name, e);
            }
        }
        return new CompositeParser(mimeTypes.getMediaTypeRegistry(), parsers);
    }
View Full Code Here

   }
  
   public static void attachExternalParsers(List<ExternalParser> parsers, TikaConfig config) {
      Parser parser = config.getParser();
      if (parser instanceof CompositeParser) {
         CompositeParser cParser = (CompositeParser)parser;
         Map<MediaType,Parser> parserMap = cParser.getParsers();
      }
      // TODO
   }
View Full Code Here

        }
        if (parsers.isEmpty()) {
            return getDefaultParser(mimeTypes, loader);
        } else {
            MediaTypeRegistry registry = mimeTypes.getMediaTypeRegistry();
            return new CompositeParser(registry, parsers);
        }
    }
View Full Code Here

            TikaConfig c = new TikaConfig(configFile);
            assertEquals(CompositeParser.class, c.getParser().getClass());
            assertEquals(CompositeDetector.class, c.getDetector().getClass());

            CompositeParser p = (CompositeParser) c.getParser();
            assertTrue("enough parsers?", p.getParsers().size() > 130);

            CompositeDetector d = (CompositeDetector) c.getDetector();
            assertTrue("enough detectors?", d.getDetectors().size() > 3);
            //just try to load it into autodetect to make sure no errors are thrown
            Parser auto = new AutoDetectParser(c);
View Full Code Here

TOP

Related Classes of org.apache.tika.parser.CompositeParser

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc., now owned by Oracle Inc. Contact coftware#gmail.com.