Package org.uimafit.factory

Examples of org.uimafit.factory.AggregateBuilder


 
  public void execute() throws UIMAException, IOException
  {
    logger.info("starting");

    AggregateBuilder builder = new AggregateBuilder();
   
    TypeSystemDescription typeSystemDescription = TypeSystemDescriptionFactory.createTypeSystemDescription();
    String filename = "/work/medfacts/sharp/data/2013-01-11_cue_phrase_feature_test/ON03FP00037D00207__merged.txt.xmi";
   
    JCas jcas = JCasFactory.createJCas(filename, typeSystemDescription);
View Full Code Here


      tok.addToIndexes();
      LookupWindowAnnotation lwa = new LookupWindowAnnotation(jCas);
      lwa.setBegin(0);
      lwa.setEnd(text.length());
      lwa.addToIndexes();
    AggregateBuilder builder = new AggregateBuilder();
    addDescriptor(builder,
        "desc/analysis_engine/DictionaryLookupAnnotator.xml");
    AnalysisEngine engine = builder.createAggregate();
    engine.process(jCas);
    Assert.assertTrue(printAnnos(jCas, IdentifiedAnnotation.type) > 0);
  }
View Full Code Here

  @Test
  public void testDictionaryLookupIntegrated() throws UIMAException, IOException {
    // JCas jCas =
    // JCasFactory.createJCasFromPath("src/main/resources/org/apache/ctakes/ytex/types/TypeSystem.xml");
    String text = "Dr. Doolitle asked patient\nto take a deep breath\nand exhale slowly.  Patient coughed and complained of abdominal pain.  Patient was administered acetaminophen.";
    AggregateBuilder builder = new AggregateBuilder();
    addDescriptor(builder,
        "desc/analysis_engine/AggregatePlaintextUMLSProcessorMinimal.xml");
    // addDescriptor(builder,
    // "desc/analysis_engine/SentenceDetectorAnnotator.xml");
    // addDescriptor(builder,
    // "../ctakes-core/desc/analysis_engine/TokenizerAnnotator.xml");
    // addDescriptor(builder,
    // "../ctakes-context-tokenizer/desc/analysis_engine/ContextDependentTokenizerAnnotator.xml");
    // addDescriptor(builder,
    // "../ctakes-pos-tagger/desc/POSTagger.xml");
    // addDescriptor(builder,
    // "../ctakes-chunker/desc/Chunker.xml");
    // addDescriptor(builder,
    // "../ctakes-chunker/desc/AdjustNounPhraseToIncludeFollowingNP.xml");
    // addDescriptor(builder,
    // "../ctakes-chunker/desc/AdjustNounPhraseToIncludeFollowingPPNP.xml");
    // addDescriptor(builder,
    // "../ctakes-clinical-pipeline/desc/analysis_engine/LookupWindowAnnotator.xml");
    // addDescriptor(builder,
    // "desc/analysis_engine/DictionaryLookupAnnotator.xml");
    AnalysisEngine engine = builder.createAggregate();
    JCas jCas = engine.newJCas();
    jCas.setDocumentText(text);
//    Segment s = new Segment(jCas);
//    s.setBegin(0);
//    s.setEnd(text.length());
View Full Code Here

      files.addAll(Arrays.asList(subDir.listFiles()));
    }

    // construct reader and Knowtator XML parser
    CollectionReader reader = UriCollectionReader.getCollectionReaderFromFiles(files);
    AggregateBuilder aggregateBuilder = new AggregateBuilder();
    aggregateBuilder.add(UriToDocumentTextAnnotator.getDescription());
    aggregateBuilder.add(THYMEKnowtatorXMLReader.getDescription(knowtatorXMLDirectory));

    // walk through each document in the collection
    for (JCas jCas : new JCasIterable(reader, aggregateBuilder.createAggregate())) {
      System.err.println(ViewURIUtil.getURI(jCas));

      // collect all relations and sort them by the order they appear in the text
      Collection<BinaryTextRelation> relations = JCasUtil.select(jCas, BinaryTextRelation.class);
      List<BinaryTextRelation> relationList = new ArrayList<BinaryTextRelation>(relations);
View Full Code Here

  }

  public static AnalysisEngineDescription getDataWriterDescription(
      Class<? extends SequenceDataWriter<String>> dataWriterClass,
      File directory) throws ResourceInitializationException {
    AggregateBuilder builder = new AggregateBuilder();
   
    for(Class<?> component : components){
      builder.add(AnalysisEngineFactory.createPrimitiveDescription(ViewCreatorAnnotator.class, ViewCreatorAnnotator.PARAM_VIEW_NAME, component.getSimpleName()));
    }
   
    builder.add(TimeAnnotator.createEnsembleDescription(
                      new File(directory, TimeAnnotator.class.getSimpleName()),
                      TimeAnnotator.class.getSimpleName()));
    builder.add(BackwardsTimeAnnotator.createEnsembleDescription(
                      new File(directory, BackwardsTimeAnnotator.class.getSimpleName()),
                      BackwardsTimeAnnotator.class.getSimpleName()));
    builder.add(ConstituencyBasedTimeAnnotator.createEnsembleDescription(
        new File(directory, ConstituencyBasedTimeAnnotator.class.getSimpleName()),
        ConstituencyBasedTimeAnnotator.class.getSimpleName()));
    builder.add(CRFTimeAnnotator.createEnsembleDescription(
        new File(directory, CRFTimeAnnotator.class.getSimpleName()),
        CRFTimeAnnotator.class.getSimpleName()));
   
    builder.add(AnalysisEngineFactory.createPrimitiveDescription(MetaTimeAnnotator.class,
          CleartkSequenceAnnotator.PARAM_IS_TRAINING,
          true,
          DefaultSequenceDataWriterFactory.PARAM_DATA_WRITER_CLASS_NAME,
          dataWriterClass,
          DirectoryDataWriterFactory.PARAM_OUTPUT_DIRECTORY,
          new File(directory, MetaTimeAnnotator.class.getSimpleName())));
    return builder.createAggregateDescription();
  }
View Full Code Here

          new File(directory, MetaTimeAnnotator.class.getSimpleName())));
    return builder.createAggregateDescription();
  }

  public static AnalysisEngineDescription getAnnotatorDescription(File directory) throws ResourceInitializationException{
    AggregateBuilder builder = new AggregateBuilder();
   
    for(Class<?> component : components){
      builder.add(AnalysisEngineFactory.createPrimitiveDescription(ViewCreatorAnnotator.class, ViewCreatorAnnotator.PARAM_VIEW_NAME, component.getSimpleName()));
    }
    builder.add(TimeAnnotator.createEnsembleDescription(
                      new File(directory, TimeAnnotator.class.getSimpleName()),
                      TimeAnnotator.class.getSimpleName()));
    builder.add(BackwardsTimeAnnotator.createEnsembleDescription(
                      new File(directory, BackwardsTimeAnnotator.class.getSimpleName()),
                      BackwardsTimeAnnotator.class.getSimpleName()));
    builder.add(ConstituencyBasedTimeAnnotator.createEnsembleDescription(
                      new File(directory, ConstituencyBasedTimeAnnotator.class.getSimpleName()),
                      ConstituencyBasedTimeAnnotator.class.getSimpleName()));
    builder.add(CRFTimeAnnotator.createEnsembleDescription(
                      new File(directory, CRFTimeAnnotator.class.getSimpleName()),
                      CRFTimeAnnotator.class.getSimpleName()));
    builder.add(AnalysisEngineFactory.createPrimitiveDescription(
        MetaTimeAnnotator.class,
        CleartkSequenceAnnotator.PARAM_IS_TRAINING,
        false,
        GenericJarClassifierFactory.PARAM_CLASSIFIER_JAR_PATH,
        new File(directory, MetaTimeAnnotator.class.getSimpleName() + File.separator + "model.jar")));
    return builder.createAggregateDescription();
  }
View Full Code Here

  @Override
  protected void train(CollectionReader collectionReader, File directory) throws Exception {
    //    if(this.baseline) return;
    if(this.skipTrain) return;
    AggregateBuilder aggregateBuilder = this.getPreprocessorAggregateBuilder();
    aggregateBuilder.add(CopyFromGold.getDescription(EventMention.class, TimeMention.class, BinaryTextRelation.class));
    //    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveCrossSentenceRelations.class));
    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveNullArgumentRelations.class));
    if(!this.useGoldAttributes){
      aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveGoldAttributes.class));
    }
    if (this.useClosure) {
      aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(AddClosure.class));//aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(AddTransitiveContainsRelations.class));
      //      aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(AddContain2Overlap.class));
      //      aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(AddTransitiveBeforeAndOnRelations.class));
    }
    //    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveNonContainsRelations.class));
    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(AddFlippedOverlap.class));//add flipped overlap instances to training data

    //    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveEventEventRelations.class));
    aggregateBuilder.add(EventTimeRelationAnnotator.createDataWriterDescription(
        //                LIBSVMStringOutcomeDataWriter.class,
        TKSVMlightStringOutcomeDataWriter.class,
        //        TKLIBSVMStringOutcomeDataWriter.class,
        //        SVMlightStringOutcomeDataWriter.class,       
        new File(directory,EVENT_TIME),
        params.probabilityOfKeepingANegativeExample));
    aggregateBuilder.add(EventEventRelationAnnotator.createDataWriterDescription(
        LIBSVMStringOutcomeDataWriter.class,
        new File(directory,EVENT_EVENT),
        params.probabilityOfKeepingANegativeExample));
    aggregateBuilder.add(EventDischargeTimeAnnotator.createDataWriterDescription(
        LIBSVMStringOutcomeDataWriter.class,
        new File(directory,EVENT_DISCHARGE)));
    aggregateBuilder.add(EventAdmissionTimeAnnotator.createDataWriterDescription(
        LIBSVMStringOutcomeDataWriter.class,
        new File(directory,EVENT_ADMISSION)));
    SimplePipeline.runPipeline(collectionReader, aggregateBuilder.createAggregate());
    String[] optArray;

    if(this.kernelParams == null){
      ArrayList<String> svmOptions = new ArrayList<>();
      svmOptions.add("-c"); svmOptions.add(""+params.svmCost);        // svm cost
View Full Code Here

  }

  @Override
  protected AnnotationStatistics<String> test(CollectionReader collectionReader, File directory)
      throws Exception {
    AggregateBuilder aggregateBuilder = this.getPreprocessorAggregateBuilder();
    aggregateBuilder.add(CopyFromGold.getDescription(EventMention.class, TimeMention.class));

    //    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(
    //        RemoveCrossSentenceRelations.class,
    //        RemoveCrossSentenceRelations.PARAM_SENTENCE_VIEW,
    //        CAS.NAME_DEFAULT_SOFA,
    //        RemoveCrossSentenceRelations.PARAM_RELATION_VIEW,
    //        GOLD_VIEW_NAME));
    if (this.useClosure) {
      aggregateBuilder.add(
          AnalysisEngineFactory.createPrimitiveDescription(AddClosure.class),//AnalysisEngineFactory.createPrimitiveDescription(AddTransitiveContainsRelations.class),
          CAS.NAME_DEFAULT_SOFA,
          GOLD_VIEW_NAME);

      //      aggregateBuilder.add(
      //          AnalysisEngineFactory.createPrimitiveDescription(AddContain2Overlap.class),
      //          CAS.NAME_DEFAULT_SOFA,
      //          GOLD_VIEW_NAME);
      //      aggregateBuilder.add(
      //          AnalysisEngineFactory.createPrimitiveDescription(AddTransitiveBeforeAndOnRelations.class),
      //          CAS.NAME_DEFAULT_SOFA,
      //          GOLD_VIEW_NAME);
    }

    //    aggregateBuilder.add(
    //        AnalysisEngineFactory.createPrimitiveDescription(RemoveNonContainsRelations.class,
    //            RemoveNonContainsRelations.PARAM_RELATION_VIEW,
    //            GOLD_VIEW_NAME));
    //    aggregateBuilder.add(
    //        AnalysisEngineFactory.createPrimitiveDescription(RemoveEventEventRelations.class),
    //        CAS.NAME_DEFAULT_SOFA,
    //        GOLD_VIEW_NAME);

    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveRelations.class));
    aggregateBuilder.add(this.baseline ? RecallBaselineEventTimeRelationAnnotator.createAnnotatorDescription(directory) :
      EventTimeRelationAnnotator.createAnnotatorDescription(new File(directory,EVENT_TIME)));
    aggregateBuilder.add(EventEventRelationAnnotator.createAnnotatorDescription(new File(directory,EVENT_EVENT)));
    aggregateBuilder.add(EventDischargeTimeAnnotator.createAnnotatorDescription(new File(directory,EVENT_DISCHARGE)));
    aggregateBuilder.add(EventAdmissionTimeAnnotator.createAnnotatorDescription(new File(directory,EVENT_ADMISSION)));
   
    if (this.useClosure) {//add closure for system output
      aggregateBuilder.add(
          AnalysisEngineFactory.createPrimitiveDescription(AddClosure.class),//AnalysisEngineFactory.createPrimitiveDescription(AddTransitiveContainsRelations.class),
          GOLD_VIEW_NAME,
          CAS.NAME_DEFAULT_SOFA
          );
    }
       
    if(this.i2b2Output != null){
      aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(WriteI2B2XML.class, WriteI2B2XML.PARAM_OUTPUT_DIR, this.i2b2Output), "TimexView", CAS.NAME_DEFAULT_SOFA);
    }
   
    //remove the null argument from relations
    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(RemoveNullArgumentRelations.class));
   
    Function<BinaryTextRelation, ?> getSpan = new Function<BinaryTextRelation, HashableArguments>() {
      public HashableArguments apply(BinaryTextRelation relation) {
        return new HashableArguments(relation);
      }
    };
    Function<BinaryTextRelation, String> getOutcome = AnnotationStatistics.annotationToFeatureValue("category");

    AnnotationStatistics<String> stats = new AnnotationStatistics<>();
    JCasIterable jcasIter =new JCasIterable(collectionReader, aggregateBuilder.createAggregate());
    JCas jCas = null;
    while(jcasIter.hasNext()) {
      jCas = jcasIter.next();
      JCas goldView = jCas.getView(GOLD_VIEW_NAME);
      JCas systemView = jCas.getView(CAS.NAME_DEFAULT_SOFA);
View Full Code Here

    CollectionReader collectionReader = CollectionReaderFactory.createCollectionReaderFromPath(
        "../ctakes-core/desc/collection_reader/FilesInDirectoryCollectionReader.xml",
        FilesInDirectoryCollectionReader.PARAM_INPUTDIR,
        options.getInputDirectory());

    AggregateBuilder aggregateBuilder = getLightweightPreprocessorAggregateBuilder();
    aggregateBuilder.add(EventAnnotator.createAnnotatorDescription(new File(options.getEventModelDirectory())));
    aggregateBuilder.add(BackwardsTimeAnnotator.createAnnotatorDescription(options.getTimeModelDirectory() + File.pathSeparator + "model.jar"));
    aggregateBuilder.add(EventTimeRelationAnnotator.createAnnotatorDescription(options.getEventTimeRelationModelDirectory() + File.separator + "model.jar"));
    if(options.getEventEventRelationModelDirectory()!=null){
      aggregateBuilder.add(EventEventRelationAnnotator.createAnnotatorDescription(options.getEventEventRelationModelDirectory() + File.separator + "model.jar"));
    }
   
    //aggregateBuilder.createAggregateDescription().toXML(new FileWriter("desc/analysis_engine/TemporalAggregateUMLSPipeline.xml"));
    AnalysisEngine xWriter = getXMIWriter(options.getOutputDirectory());
   
    SimplePipeline.runPipeline(
        collectionReader,
        aggregateBuilder.createAggregate(),
        xWriter);
  }
View Full Code Here

  /**
   * Preprocessing needed for relation extraction.
   */
  protected static AggregateBuilder getPreprocessorAggregateBuilder()
      throws Exception {
    AggregateBuilder aggregateBuilder = new AggregateBuilder();
    aggregateBuilder.add(ClinicalPipelineFactory.getDefaultPipeline());
    // add semantic role labeler
    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(ClearNLPSemanticRoleLabelerAE.class));
    aggregateBuilder.add(AnalysisEngineFactory.createPrimitiveDescription(ConstituencyParser.class));
    return aggregateBuilder;
  }
View Full Code Here

TOP

Related Classes of org.uimafit.factory.AggregateBuilder

Copyright © 2018 www.massapicom. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.