当前位置: 首页>>代码示例>>Java>>正文


Java TreePrint类代码示例

本文整理汇总了Java中edu.stanford.nlp.trees.TreePrint的典型用法代码示例。如果您正苦于以下问题:Java TreePrint类的具体用法?Java TreePrint怎么用?Java TreePrint使用的例子?那么, 这里精选的类代码示例或许可以为您提供帮助。


TreePrint类属于edu.stanford.nlp.trees包,在下文中一共展示了TreePrint类的15个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Java代码示例。

示例1: demoAPI

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * demoAPI demonstrates other ways of calling the parser with already
 * tokenized text, or in some cases, raw text that needs to be tokenized as
 * a single sentence. Output is handled with a TreePrint object. Note that
 * the options used when creating the TreePrint can determine what results
 * to print out. Once again, one can capture the output by passing a
 * PrintWriter to TreePrint.printTree.
 * 
 * difference: already tokenized text
 * 
 * 
 */
public static void demoAPI(LexicalizedParser lp) {
	// This option shows parsing a list of correctly tokenized words
	String[] sent = { "This", "is", "an", "easy", "sentence", "." };
	List<CoreLabel> rawWords = Sentence.toCoreLabelList(sent);
	Tree parse = lp.apply(rawWords);
	parse.pennPrint();
	System.out.println();

	// This option shows loading and using an explicit tokenizer
	String sent2 = "Hey @Apple, pretty much all your products are amazing. You blow minds every time you launch a new gizmo."
			+ " that said, your hold music is crap";
	TokenizerFactory<CoreLabel> tokenizerFactory = PTBTokenizer.factory(
			new CoreLabelTokenFactory(), "");
	Tokenizer<CoreLabel> tok = tokenizerFactory
			.getTokenizer(new StringReader(sent2));
	List<CoreLabel> rawWords2 = tok.tokenize();
	parse = lp.apply(rawWords2);

	TreebankLanguagePack tlp = new PennTreebankLanguagePack();
	GrammaticalStructureFactory gsf = tlp.grammaticalStructureFactory();
	GrammaticalStructure gs = gsf.newGrammaticalStructure(parse);
	List<TypedDependency> tdl = gs.typedDependenciesCCprocessed();
	System.out.println(tdl);
	System.out.println();

	// You can also use a TreePrint object to print trees and dependencies
	TreePrint tp = new TreePrint("penn,typedDependenciesCollapsed");
	tp.printTree(parse);
}
 
开发者ID:opinion-extraction-propagation,项目名称:TASC-Tuples,代码行数:42,代码来源:ParserDemo.java

示例2: getPenn

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
public String getPenn()
{
	if(bufferTree==null) return "";
	TreePrint tp = new TreePrint("penn");
	
	Writer parse_string = new StringWriter();
	PrintWriter printWriter = new PrintWriter(parse_string);
	
	tp.printTree(bufferTree, printWriter); // print tree
	
	return parse_string.toString();
}
 
开发者ID:ehsane,项目名称:rainbownlp,代码行数:13,代码来源:StanfordParser.java

示例3: getDependencies

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
public String getDependencies()
{
	TreePrint tp = new TreePrint("typedDependenciesCollapsed");
	Writer parse_string = new StringWriter();
	PrintWriter printWriter = new PrintWriter(parse_string);
	
	tp.printTree(bufferTree, printWriter); // print tree
	
	return parse_string.toString();
}
 
开发者ID:ehsane,项目名称:rainbownlp,代码行数:11,代码来源:StanfordParser.java

示例4: parse

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * Parse a (speech) lattice with the PCFG parser.
 *
 * @param lr a lattice to parse
 * @return Whether the lattice could be parsed by the grammar
 */
boolean parse(HTKLatticeReader lr) {
  TreePrint treePrint = getTreePrint();
  PrintWriter pwOut = op.tlpParams.pw();
  parseSucceeded = false;
  parseNoMemory = false;
  parseUnparsable = false;
  parseSkipped = false;
  parseFallback = false;
  whatFailed = null;
  originalSentence = null;
  if (lr.getNumStates() > op.testOptions.maxLength + 1) {  // + 1 for boundary symbol
    parseSkipped = true;
    throw new UnsupportedOperationException("Lattice too big: " + lr.getNumStates());
  }
  if (op.doPCFG) {
    if (!pparser.parse(lr)) {
      return parseSucceeded;
    }
    if (op.testOptions.verbose) {
      pwOut.println("PParser output");
      treePrint.printTree(getBestPCFGParse(false), pwOut);
    }
  }
  parseSucceeded = true;
  return true;
}
 
开发者ID:benblamey,项目名称:stanford-nlp,代码行数:33,代码来源:LexicalizedParserQuery.java

示例5: addConstituentTreeInfo

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * Generates the XML content for a constituent tree
 */
private static void addConstituentTreeInfo(Element treeInfo, Tree tree, TreePrint constituentTreePrinter) {
  StringWriter treeStrWriter = new StringWriter();
  constituentTreePrinter.printTree(tree, new PrintWriter(treeStrWriter, true));
  String temp = treeStrWriter.toString();
  //System.err.println(temp);
  treeInfo.appendChild(temp);
}
 
开发者ID:benblamey,项目名称:stanford-nlp,代码行数:11,代码来源:XMLOutputter.java

示例6: parseTaggedWords

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
public ParseTree parseTaggedWords(List<TaggedWord> taggedWords, List<String> outputFormat) throws Exception
{
	TreePrint treePrinter = ParserUtil.setOptions(outputFormat, tlp);
	Tree parseTree = model.apply(taggedWords);
	// TODO: Do these parse trees have scores, like the lexicalized ones do?
	return new ParseTree(ParserUtil.TreeObjectToString(parseTree, treePrinter), parseTree.score());
}
 
开发者ID:dmnapolitano,项目名称:stanford-thrift,代码行数:8,代码来源:StanfordSRParserThrift.java

示例7: TreeObjectToString

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
public static String TreeObjectToString(Tree tree, TreePrint tp)
{
	StringWriter sw = new StringWriter();
	PrintWriter pw = new PrintWriter(sw);
	tp.printTree(tree, pw);
	return sw.getBuffer().toString().trim();
}
 
开发者ID:dmnapolitano,项目名称:stanford-thrift,代码行数:8,代码来源:ParserUtil.java

示例8: setOptions

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
public static TreePrint setOptions(List<String> outputOptions, TreebankLanguagePack tlp) throws Exception
{
	String outputFormatStr = "oneline";  // default
	String outputFormatOptionsStr = "";

	// for output formatting
	if (outputOptions != null && outputOptions.size() > 0)
	{
		int ofIndex = outputOptions.indexOf("-outputFormat");
		int ofoIndex = outputOptions.indexOf("-outputFormatOptions");

		if (ofIndex >= 0)
		{
			outputFormatStr = outputOptions.get(ofIndex+1);
		}
		if (ofoIndex >= 0)
		{
			outputFormatOptionsStr = outputOptions.get(ofoIndex+1);
		}
		if (ofIndex < 0 && ofoIndex < 0)
		{
			throw new Exception("Invalid option(s): " + outputOptions.toString());
		}
	}

	return new TreePrint(outputFormatStr, outputFormatOptionsStr, tlp);

	// for everything else; disabled for now
	//        if (!options.isEmpty())
	//        {
	//        	String[] remainingOptions = new String[options.size()];
	//        	options.toArray(remainingOptions);
	//        	org.ets.research.nlp.stanford_thrift.parser.setOptionFlags(remainingOptions);
	//        	customParserOptionsSet = true;
	//        }
}
 
开发者ID:dmnapolitano,项目名称:stanford-thrift,代码行数:37,代码来源:ParserUtil.java

示例9: analyzeSentences

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
   * @desc Parses input sentences and prints the parses to the given doc.
   * @param paragraphs Vector of strings of sentences
   * @param doc The current document we're printing to.
   * @param depdoc The document of dependencies that we're printing to.
   */
  private void analyzeSentences( Vector<String> paragraphs, GigaDoc doc, 
      GigaDoc depdoc) {
    int sid = 0;

    // Paragraphs may be multiple sentences
    for( String fragment : paragraphs ) {
      // Replace underscores (gigaword has underscores in many places commas should be)
      if( fragment.contains(" _ ") ) fragment = fragment.replaceAll(" _ ", " , ");
      // Split sentences
      List<List<HasWord>> list = Ling.getSentencesFromText(fragment);

//      System.out.println("From fragment: " + fragment);
//      for( List sent : list )
//        System.out.println("  -> " + sent);
      
      // Loop over each sentence
      for( List<HasWord> sentence : list ) {
        Tree ansTree;
        
        //        System.out.println(sentence.size() + ": " + sentence);
        if( sentence.size() > MAX_SENTENCE_LENGTH )
          System.out.println("Sentence far too long: " + sentence.size());
        else if( (ansTree = parser.parseTree(sentence)) == null )
          System.out.println("Failed to parse: " + sentence);
        else {
          // Build a StringWriter, print the tree to it, then save the string
          StringWriter treeStrWriter = new StringWriter();
          TreePrint tp = new TreePrint("penn");
          tp.printTree(ansTree, new PrintWriter(treeStrWriter,true));
          doc.addParse(treeStrWriter.toString());
          
          // Create the dependency tree - CAUTION: DESTRUCTIVE to parse tree
          try {
            GrammaticalStructure gs = gsf.newGrammaticalStructure(ansTree);
            //	    Collection<TypedDependency> deps = gs.typedDependenciesCollapsed();
            Collection<TypedDependency> deps = gs.typedDependenciesCCprocessed(true);
            depdoc.addDependencies(deps, sid);
          } catch( Exception ex ) { 
            ex.printStackTrace();
            System.out.println("WARNING: dependency tree creation failed...adding null deps");
            depdoc.addDependencies(null, sid);
          }
          sid++;
        }

      }
    }
  }
 
开发者ID:nchambers,项目名称:schemas,代码行数:55,代码来源:GigawordParser.java

示例10: analyzeSentences

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
   * @desc Parses input sentences and prints the parses to the given doc.
   * @param paragraphs Vector of strings of sentences
   * @param doc The current document we're printing to.
   * @param depdoc The document of dependencies that we're printing to.
   */
  private void analyzeSentences( Vector<String> paragraphs, GigaDoc doc, GigaDoc depdoc) {
    int sid = 0;

    // Paragraphs may be multiple sentences
    for( String fragment : paragraphs ) {
//      System.out.println("* " + fragment);
      // Replace underscores (gigaword has underscores in many places commas should be)
      if( fragment.contains(" _ ") ) fragment = fragment.replaceAll(" _ ", " , ");

      // Loop over each sentence
      for( List<HasWord> sentence : Ling.getSentencesFromText(fragment) ) {
        Tree ansTree;
        
//        System.out.println("Calling parse on: " + sentence);

        //	System.out.println(sentence.size() + ": **" + sentence + "**");
        if( sentence.size() > MAX_SENTENCE_LENGTH )
          System.out.println("Sentence far too long: " + sentence.size());
        else if( (ansTree = parser.parseTree(sentence)) == null )
          System.out.println("Failed to parse: " + sentence);
        else {
          // Build a StringWriter, print the tree to it, then save the string
          StringWriter treeStrWriter = new StringWriter();
          TreePrint tp = new TreePrint("penn");
          tp.printTree(ansTree, new PrintWriter(treeStrWriter,true));
          doc.addParse(treeStrWriter.toString());

          // Create the dependency tree - CAUTION: DESTRUCTIVE to parse tree
          try {
            GrammaticalStructure gs = gsf.newGrammaticalStructure(ansTree);
            //	    Collection<TypedDependency> deps = gs.typedDependenciesCollapsed();
            Collection<TypedDependency> deps = gs.typedDependenciesCCprocessed(true);
            depdoc.addDependencies(deps, sid);
          } catch( Exception ex ) { 
            ex.printStackTrace();
            System.out.println("WARNING: dependency tree creation failed...adding null deps");
            depdoc.addDependencies(null, sid);
          }
          sid++;
        }
      }
    }
  }
 
开发者ID:nchambers,项目名称:schemas,代码行数:50,代码来源:DirectoryParser.java

示例11: analyzeSentences

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * @desc Parses input sentences and prints the parses to the given doc.
 * @param paragraphs Vector of strings of sentences
 * @param doc The current document we're printing to.
 * @param depdoc The document of dependencies that we're printing to.
 */
private void analyzeSentences( List<List<HasWord>> sentences, GigaDoc doc, 
    GigaDoc depdoc) {
  int sid = 0;

  // Loop over each sentence
  for( List<HasWord> sentence : sentences ) {
    Tree ansTree;

    if( sid % 5 == 0 ) { System.out.print("."); }
    if( sid % 50 == 0 ) { System.out.println("\n" + sentence); }

    //      System.out.println(sentence.size() + ": " + sentence);
    if( sentence.size() > MAX_SENTENCE_LENGTH )
      System.out.println("Sentence far too long: " + sentence.size());
    else if( (ansTree = parser.parseTree(sentence)) == null )
      System.out.println("Failed to parse: " + sentence);
    else {
      // Save to InfoFile
      // Build a StringWriter, print the tree to it, then save the string
      StringWriter treeStrWriter = new StringWriter();
      TreePrint tp = new TreePrint("penn");
      tp.printTree(ansTree, new PrintWriter(treeStrWriter,true));

      //	  System.out.println(sentence);
      //	  System.out.println(treeStrWriter);
      doc.addParse(treeStrWriter.toString());

      // Create the dependency tree - CAUTION: DESTRUCTIVE to parse tree
      try {
        GrammaticalStructure gs = gsf.newGrammaticalStructure(ansTree);
        //	    Collection<TypedDependency> deps = gs.typedDependenciesCollapsed();
        Collection<TypedDependency> deps = gs.typedDependenciesCCprocessed(true);
        depdoc.addDependencies(deps, sid);
      } catch( Exception ex ) { 
        ex.printStackTrace();
        System.out.println("WARNING: dependency tree creation failed...adding null deps");
        depdoc.addDependencies(null, sid);
      }
      sid++;
    }

  }
}
 
开发者ID:nchambers,项目名称:schemas,代码行数:50,代码来源:LOTRParser.java

示例12: getTreePrint

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/** Return a TreePrint for formatting parsed output trees.
 *  @return A TreePrint for formatting parsed output trees.
 */
public TreePrint getTreePrint() {
  return op.testOptions.treePrint(op.tlpParams);
}
 
开发者ID:benblamey,项目名称:stanford-nlp,代码行数:7,代码来源:LexicalizedParserQuery.java

示例13: construct

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
private void construct(Properties props, boolean enforceRequirements) {
  this.numWords = 0;
  this.constituentTreePrinter = new TreePrint("penn");
  this.dependencyTreePrinter = new TreePrint("typedDependenciesCollapsed");
  this.gsf = new PennTreebankLanguagePack().grammaticalStructureFactory();

  if (props == null) {
    // if undefined, find the properties file in the classpath
    props = loadPropertiesFromClasspath();
  } else if (props.getProperty("annotators") == null) {
    // this happens when some command line options are specified (e.g just "-filelist") but no properties file is.
    // we use the options that are given and let them override the default properties from the class path properties.
    Properties fromClassPath = loadPropertiesFromClasspath();
    fromClassPath.putAll(props);
    props = fromClassPath;
  }
  this.properties = props;
  AnnotatorPool pool = getDefaultAnnotatorPool(props);

  // now construct the annotators from the given properties in the given order
  List<String> annoNames = Arrays.asList(getRequiredProperty(props, "annotators").split("[, \t]+"));
  Set<String> alreadyAddedAnnoNames = Generics.newHashSet();
  Set<Requirement> requirementsSatisfied = Generics.newHashSet();
  for (String name : annoNames) {
    name = name.trim();
    if (name.isEmpty()) { continue; }
    System.err.println("Adding annotator " + name);

    Annotator an = pool.get(name);
    this.addAnnotator(an);

    if (enforceRequirements) {
      Set<Requirement> allRequirements = an.requires();
      for (Requirement requirement : allRequirements) {
        if (!requirementsSatisfied.contains(requirement)) {
          String fmt = "annotator \"%s\" requires annotator \"%s\"";
          throw new IllegalArgumentException(String.format(fmt, name, requirement));
        }
      }
      requirementsSatisfied.addAll(an.requirementsSatisfied());
    }

    // the NFL domain requires several post-processing rules after
    // tokenization.  add these transparently if the NFL annotator
    // is required
    if (name.equals(STANFORD_TOKENIZE) &&
        annoNames.contains(STANFORD_NFL) &&
        !annoNames.contains(STANFORD_NFL_TOKENIZE)) {
      Annotator pp = pool.get(STANFORD_NFL_TOKENIZE);
      this.addAnnotator(pp);
    }

    alreadyAddedAnnoNames.add(name);
  }

  // Sanity check
  if (! alreadyAddedAnnoNames.contains(STANFORD_SSPLIT)) {
    System.setProperty(NEWLINE_SPLITTER_PROPERTY, "false");
  }
}
 
开发者ID:benblamey,项目名称:stanford-nlp,代码行数:61,代码来源:StanfordCoreNLP.java

示例14: toTreeString

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * Transform a parse tree into a format
 * 
 * @param tree
 * @param format
 * @return
 */
public static String toTreeString(Tree tree, String format) {
	StringWriter sw = new StringWriter();
	new TreePrint(format).printTree(tree, new PrintWriter(sw));
	return sw.toString().trim();
}
 
开发者ID:hakchul77,项目名称:irnlp_toolkit,代码行数:13,代码来源:StanfordNlpWrapper.java

示例15: treePrint

import edu.stanford.nlp.trees.TreePrint; //导入依赖的package包/类
/**
 * Determines method for print trees on output.
 *
 * @param tlpParams The treebank parser params
 * @return A suitable tree printing object
 */
public static TreePrint treePrint(TreebankLangParserParams tlpParams) {
  TreebankLanguagePack tlp = tlpParams.treebankLanguagePack();
  return new TreePrint(outputFormat, outputFormatOptions, tlp, tlpParams.headFinder());
}
 
开发者ID:FabianFriedrich,项目名称:Text2Process,代码行数:11,代码来源:Test.java


注:本文中的edu.stanford.nlp.trees.TreePrint类示例由纯净天空整理自Github/MSDocs等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。