Package com.clearnlp.constituent

Examples of com.clearnlp.constituent.CTReader


    for (PrintStream f : foutf.close();
  }
 
  void printTreesForCKY(String[] args)
  {
    CTReader reader = new CTReader(UTInput.createBufferedFileReader(args[0]));
    PrintStream fout = UTOutput.createPrintBufferedFileStream(args[1]);
    CTTree tree;
    CTNode root;
    int count;
   
    while ((tree = reader.nextTree()) != null)
    {
      root = tree.getRoot();
     
      if (root.getChildrenSize() == 1)
      {
        count = stripPunct(tree);
       
        if (root.getChildrenSize() > 0 && tree.getTokens().size()-count >= 4 && !containsEmptyCategories(tree) && isCKYTree(root.getChild(0)))
          fout.println(tree+"\n");
      }
    }
   
    reader.close();
    fout.close();
  }
View Full Code Here


    return true;
  }
 
  void traverse(String inputFile)
  {
    CTReader reader = new CTReader(UTInput.createBufferedFileReader(inputFile));
    CTTree tree;
   
    while ((tree = reader.nextTree()) != null)
      traverseAux(tree.getRoot());
  }
View Full Code Here

  {
    String treeDir = args[0];
    String treeFile = args[1];
    int treeId = Integer.parseInt(args[2]);
   
    CTReader reader = new CTReader(UTInput.createBufferedFileReader(treeDir+File.separator+treeFile));
    CTTree tree = null;
    int i;
   
    for (i=0; i<=treeId; i++)
      tree = reader.nextTree();
   
    System.out.println(tree.toString(true,true));
  }
View Full Code Here

        mName   = getNames      (UTFile.replaceExtension(inputPath, nameExt));
      }
      catch (Exception e) {e.printStackTrace();}
     
      PrintStream fout = UTOutput.createPrintBufferedFileStream(UTFile.replaceExtension(inputPath, outputExt));
      CTReader reader = new CTReader(UTInput.createBufferedFileReader(inputPath));
      CTTree cTree; DEPTree dTree; int n;
      List<PBInstance> instances = null;
     
      for (n=0; (cTree = reader.nextTree()) != null; n++)
      {
        if (language.equals(AbstractReader.LANG_EN))
          CTLibEn.preprocessTree(cTree);
       
        if (mProp != null)
        {
          instances = mProp.get(n);
          addPBInstances(cTree, instances);
        }
       
        dTree = c2d.toDEPTree(cTree);
       
        if (dTree == null)
        {
        //  fout.println(getNullTree()+"\n");
        }
        else
        {
          if (morph   != nullmorph.process(dTree);
          if (mSense  != nulladdWordSenses(cTree, dTree, mSense.get(n), DEPLibEn.FEAT_WS);
          if (mVclass != nulladdWordSenses(cTree, dTree, mVclass.get(n), DEPLibEn.FEAT_VN);
          if (mName   != nulladdNames(cTree, dTree, mName.get(n));
         
          if (mProp != null)
          {
            addRolesets(cTree, dTree, instances);
            if (b_verbs_only) relabelLightVerb(dTree);
            DEPLibEn.postLabel(dTree);
          }
       
          dTree = getDEPTreeWithoutEdited(cTree, dTree);
          fout.println(dTree+"\n");         
        }
      }
     
      fout.close();
      reader.close();
    }
  }
View Full Code Here

    }
  }
 
  protected int convert(AbstractC2DConverter c2d, AbstractComponent morph, String language, String inputFile, String outputFile, boolean normalize)
  {
    CTReader  reader = new CTReader(UTInput.createBufferedFileReader(inputFile));
    PrintStream fout = UTOutput.createPrintBufferedFileStream(outputFile);
    CTTree  cTree;
    DEPTree dTree;
    int n;
   
    for (n=0; (cTree = reader.nextTree()) != null; n++)
    {
      if (normalizeCTLib.normalizeIndices(cTree);
     
      if (language.equals(AbstractReader.LANG_EN))
        CTLibEn.preprocessTree(cTree);
     
      dTree = c2d.toDEPTree(cTree);
     
      if (dTree == null)
      {
        fout.println(getNullTree()+"\n");
      }
      else
      {
        morph.process(dTree);
        fout.println(dTree.toStringDAG()+"\n");
      }
    }
   
    reader.close();
    fout.close();
   
    return n;
  }
View Full Code Here

        remove(inputPath+File.separator+filePath, parseExt, outputExt);
    }
    else if (inputPath.endsWith(parseExt))
    {
      PrintStream fout = UTOutput.createPrintBufferedFileStream(UTFile.replaceExtension(inputPath, outputExt));
      CTReader reader = new CTReader(UTInput.createBufferedFileReader(inputPath));
      CTTree tree;
     
      while ((tree = reader.nextTree()) != null)
      {
        remove(inputPath, tree.getRoot());
        fout.println(tree.toString()+"\n");
      }
     
      fout.close();
      reader.close();
    }
  }
View Full Code Here

    }
  }
 
  private void printTree(PrintStream fout, String inputFile)
  {
    CTReader reader = new CTReader();
    StringBuilder build;
    CTTree tree;
   
    reader.open(UTInput.createBufferedFileReader(inputFile));
   
    while ((tree = reader.nextTree()) != null)
    {
      build = new StringBuilder();
     
      for (CTNode node : tree.getTerminals())
      {
        build.append(node.form);
        build.append("\t");
        build.append(node.pTag);
        build.append("\n");
      }
     
      fout.println(build.toString());
    }
   
    reader.close();
  }
View Full Code Here

    fout.close();
  }
 
  private List<CTTree> getTrees(String parseFile)
  {
    CTReader reader = new CTReader(UTInput.createBufferedFileReader(parseFile));
    List<CTTree> trees = new ArrayList<CTTree>();
    CTTree tree;
   
    while ((tree = reader.nextTree()) != null)
      trees.add(tree);
   
    return trees;
  }
View Full Code Here

  }
 
  Map<String,String> getSemlinkMap(String ontoDir, String semDir, String semVNFile) throws Exception
  {
    BufferedReader fin = UTInput.createBufferedFileReader(semVNFile);
    CTReader reader1 = new CTReader(), reader2 = new CTReader();
    Map<String,String> map = new HashMap<String,String>();
    Set<String> skipPaths = new HashSet<String>();
    String line, ontoPath = "", semPath = "";
    int i, treeId, predId, prevId = -1;
    CTTree tree1 = null, tree2 = null;
    IntArrayList[] lists;
    IntArrayList list;
    String[] tmp;
   
    while ((line = fin.readLine()) != null)
    {
      tmp = line.split(" ");
      if (skipPaths.contains(tmp[0]))  continue;
     
      if (!semPath.equals(tmp[0]))
      {
        ontoPath = UTFile.replaceExtension("nw"+File.separator+tmp[0], "parse");
       
        if (!new File(ontoDir+File.separator+ontoPath).exists())
        {
          skipPaths.add(tmp[0]);
          continue;
        }
       
        semPath = tmp[0];
        prevId  = -1;
       
        reader1.close();
        reader2.close();
       
        reader1.open(UTInput.createBufferedFileReader(ontoDir+File.separator+ontoPath));
        reader2.open(UTInput.createBufferedFileReader(semDir +File.separator+semPath));
      }
     
      treeId = Integer.parseInt(tmp[1]);
      predId = Integer.parseInt(tmp[2]);
     
      for (i=0; i<treeId-prevId; i++)
      {
        tree1 = reader1.nextTree();
        tree2 = reader2.nextTree();
      }
     
      prevId = treeId;
      lists  = CTLib.getTokenMapList(tree2, tree1);
     
View Full Code Here

   * @return the sorted list of PropBank instances from the specific file.
   */
  static public List<PBInstance> getPBInstanceList(String propFile, String treeDir, boolean norm)
  {
    List<PBInstance> list = PBLib.getPBInstanceList(propFile);
    CTReader reader = new CTReader();
    CTTree   tree   = null;
    String treeFile = "";
    int    treeId   = -1;
   
    for (PBInstance instance : list)
    {
      if (!treeFile.equals(instance.treePath))
      {
        treeFile = instance.treePath;
        treeId   = -1;
        reader.close();
        reader.open(UTInput.createBufferedFileReader(treeDir+File.separator+treeFile));
      }
     
      for (; treeId < instance.treeId; treeId++)
        tree = reader.nextTree();
     
      if (normCTLib.normalizeIndices(tree);
      tree.setPBLocs();
      instance.setTree(tree);
    }
View Full Code Here

TOP

Related Classes of com.clearnlp.constituent.CTReader

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc., now owned by Oracle Corporation. Contact coftware#gmail.com.