Package org.apache.uima.collection

Examples of org.apache.uima.collection.CollectionReader


  {
    AggregateBuilder builder = new AggregateBuilder();
   
    TypeSystemDescription typeSystemDescription = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath();
   
    CollectionReader reader =
        CollectionReaderFactory.createCollectionReader(
          XMIReader.class,
          typeSystemDescription,
          XMIReader.PARAM_FILES,
          inputFiles);
View Full Code Here


  public static void main(String[] args) throws UIMAException, IOException {
   
    Options options = new Options();
    options.parseOptions(args);

    CollectionReader collectionReader = CollectionReaderFactory.createCollectionReaderFromPath(
        "../ctakes-core/desc/collection_reader/FilesInDirectoryCollectionReader.xml",
        FilesInDirectoryCollectionReader.PARAM_INPUTDIR,
        options.inputDirectory);

    // make sure the model parameters match those used for training
View Full Code Here

   
    Options options = new Options();
    options.parseOptions(args);

    List<File> trainFiles = Arrays.asList(options.inputDirectory.listFiles());
    CollectionReader collectionReader = getCollectionReader(trainFiles);
   
    AnalysisEngine relationExtractorPrinter = AnalysisEngineFactory.createPrimitive(
        RelationExtractorPrinter.class);
       
    SimplePipeline.runPipeline(collectionReader, relationExtractorPrinter);
View Full Code Here

  public static CollectionReader getCR(File collectionReaderDescriptorFile) throws ResourceInitializationException {
    try {
      XMLInputSource xmlInputSource = new XMLInputSource(collectionReaderDescriptorFile);
      XMLParser xmlParser = UIMAFramework.getXMLParser();
      ResourceSpecifier resourceSpecifier = xmlParser.parseResourceSpecifier(xmlInputSource);
      CollectionReader collectionReader = UIMAFramework.produceCollectionReader(resourceSpecifier);
      return collectionReader;
    } catch (IOException ioe) {
      throw new ResourceInitializationException(ioe);
    } catch (InvalidXMLException ixe) {
      throw new ResourceInitializationException(ixe);
View Full Code Here

//      TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath("../common-type-system/desc/common_type_system.xml",
//                                       "../assertion/desc/medfactsTypeSystem.xml");

    AnalysisEngine ae = AnalysisEngineFactory.createAnalysisEngineFromPath("desc/analysis_engine/ODIESvmVectorCreator.xml");

    CollectionReader reader = CollectionReaderFactory.createCollectionReaderFromPath(
        "../ctakes-core/desc/collection_reader/FilesInDirectoryCollectionReader.xml",
        FilesInDirectoryCollectionReader.PARAM_INPUTDIR,
        inputRoot);

    AnalysisEngine serializer = AnalysisEngineFactory.createPrimitive(
View Full Code Here

//      TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath("../ctakes-type-system/desc/common_type_system.xml",
//                                       "desc/type-system/CorefTypes.xml",
//                                       "../assertion/desc/medfactsTypeSystem.xml");
//    TypeSystemDescription corefTypeSystem = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath();
    try {
      CollectionReader xmiReader = CollectionReaderFactory.createCollectionReader(XMIReader.class,
//          typeSystem,
          XMIReader.PARAM_FILES,
          paths);
     
      AnalysisEngine consumer = AnalysisEngineFactory.createPrimitive(ODIEVectorFileWriter.class,
View Full Code Here

  public static void main(String[] args) throws Exception {
    Options options = new Options();
    options.parseOptions(args);

    CollectionReader reader = CollectionReaderFactory.createCollectionReader(
        XReader.class,
        FilesCollectionReader.PARAM_ROOT_FILE,
        options.trainDirectory.getPath());

    Multiset<Integer> mentionsBetweenCounts = HashMultiset.create();
    JCas jCas = JCasFactory.createJCasFromPath("../ctakes-type-system/desc/common_type_system.xml");
    while (reader.hasNext()) {
      reader.getNext(jCas.getCas());
      JCas goldView = jCas.getView(GOLD_VIEW_NAME);
      for (BinaryTextRelation relation : JCasUtil.select(goldView, BinaryTextRelation.class)) {
        Annotation arg1 = relation.getArg1().getArgument();
        Annotation arg2 = relation.getArg2().getArgument();
        int mentionsBetween;
View Full Code Here

      String decodingInputDirectory,
      String decodingOutputDirectory,
      String... trainingArgs) throws Exception
  {
   
    CollectionReader trainingCollectionReader = CollectionReaderFactory.createCollectionReader(
        XReader.class,
        XReader.PARAM_ROOT_FILE,
        trainingDataInputDirectory,
        XReader.PARAM_XML_SCHEME,
        XReader.XMI);
    CollectionReader evaluationCollectionReader = CollectionReaderFactory.createCollectionReader(
        XReader.class,
        XReader.PARAM_ROOT_FILE,
        decodingInputDirectory,
        XReader.PARAM_XML_SCHEME,
        XReader.XMI);
View Full Code Here

  public void execute() throws ResourceInitializationException
  {
    String filename = "/work/medfacts/sharp/data/2012-10-16_full_data_set_updated/Seed_Corpus/clean_dirs/splits/official/train";
   
      CollectionReader reader = CollectionReaderFactory.createCollectionReader(
            XReader.class,
            XReader.PARAM_ROOT_FILE,
            filename,
            XReader.PARAM_XML_SCHEME,
            XReader.XMI);
View Full Code Here

      // create a collection reader that loads URIs for all Knowtator text files
      List<File> files = Lists.newArrayList();
      files.addAll(getTrainTextFiles(options.getBatchesDirectory()));
      files.addAll(getDevTextFiles(options.getBatchesDirectory()));
      files.addAll(getTestTextFiles(options.getBatchesDirectory()));
      CollectionReader reader = UriCollectionReader.getCollectionReaderFromFiles(files);

      // load the text from the URI, run the preprocessor, then run the
      // Knowtator XML reader
      AggregateBuilder builder = new AggregateBuilder();
      builder.add(UriToDocumentTextAnnotator.getDescription());
View Full Code Here

TOP

Related Classes of org.apache.uima.collection.CollectionReader

Copyright © 2018 www.massapicom. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.