Java Code Examples for edu.stanford.nlp.tagger.maxent.MaxentTagger#tagSentence()
The following examples show how to use
edu.stanford.nlp.tagger.maxent.MaxentTagger#tagSentence() .
You can vote up the ones you like or vote down the ones you don't like,
and go to the original project or source file by following the links above each example. You may check out the related API usage on the sidebar.
Example 1
Source File: StanfordPosTagger.java From OpenEphyra with GNU General Public License v2.0 | 6 votes |
/** * Tags the tokens with part of speech * * @param tokens Array of token strings * @return Part of speech tags */ public static String[] tagPos(String[] tokens) { Sentence untagged = createSentence(tokens); Sentence tagged = MaxentTagger.tagSentence(untagged); String[] pos = new String[tagged.size()]; for (int i = 0; i < tagged.size(); i++) { HasWord w = (HasWord) tagged.get(i); String[] s = w.toString().split("/"); if (s.length > 1) pos[i] = s[s.length - 1]; else pos[i] = ""; } return pos; }
Example 2
Source File: Chapter5.java From Natural-Language-Processing-with-Java-Second-Edition with MIT License | 5 votes |
private static void usingStanfordMaxentPOS() { try { MaxentTagger tagger = new MaxentTagger(getModelDir() + "//wsj-0-18-bidirectional-distsim.tagger"); // MaxentTagger tagger = new MaxentTagger(getModelDir() + "//gate-EN-twitter.model"); // System.out.println(tagger.tagString("AFAIK she H8 cth!")); // System.out.println(tagger.tagString("BTW had a GR8 tym at the party BBIAM.")); List<List<HasWord>> sentences = MaxentTagger.tokenizeText(new BufferedReader(new FileReader("sentences.txt"))); for (List<HasWord> sentence : sentences) { List<TaggedWord> taggedSentence = tagger.tagSentence(sentence); // Simple display System.out.println("---" + taggedSentence); // Simple conversion to String // System.out.println(Sentence.listToString(taggedSentence, false)); // Display of words and tags // for (TaggedWord taggedWord : taggedSentence) { // System.out.print(taggedWord.word() + "/" + taggedWord.tag() + " "); // } // System.out.println(); // List of specifc tags // System.out.print("NN Tagged: "); // for (TaggedWord taggedWord : taggedSentence) { // if (taggedWord.tag().startsWith("NN")) { // System.out.print(taggedWord.word() + " "); // } // } // System.out.println(); } } catch (FileNotFoundException ex) { ex.printStackTrace(); } }
Example 3
Source File: ParserDemo.java From NLIDB with Apache License 2.0 | 5 votes |
public static void main(String[] args) { String modelPath = DependencyParser.DEFAULT_MODEL; String taggerPath = "edu/stanford/nlp/models/pos-tagger/english-left3words/english-left3words-distsim.tagger"; for (int argIndex = 0; argIndex < args.length;) { switch (args[argIndex]) { case "-tagger": taggerPath = args[argIndex + 1]; argIndex += 2; break; case "-com.dukenlidb.nlidb.model": modelPath = args[argIndex + 1]; argIndex += 2; break; default: throw new RuntimeException("Unknown argument " + args[argIndex]); } } String text = "Return authors who have more papers than Bob in VLDB after 2000"; MaxentTagger tagger = new MaxentTagger(taggerPath); DependencyParser parser = DependencyParser.loadFromModelFile(modelPath); DocumentPreprocessor tokenizer = new DocumentPreprocessor(new StringReader(text)); for (List<HasWord> sentence : tokenizer) { List<TaggedWord> tagged = tagger.tagSentence(sentence); GrammaticalStructure gs = parser.predict(tagged); // Print typed dependencies log.info(gs); } }
Example 4
Source File: TaggerDemo.java From blog-codes with Apache License 2.0 | 4 votes |
public static void main(String[] args) throws Exception { InputStream input = TaggerDemo.class.getResourceAsStream("/"+MaxentTagger.DEFAULT_JAR_PATH); MaxentTagger tagger = new MaxentTagger(input); List<List<HasWord>> sentences = MaxentTagger.tokenizeText(new StringReader("Karma of humans is AI")); for (List<HasWord> sentence : sentences) { List<TaggedWord> tSentence = tagger.tagSentence(sentence); System.out.println(SentenceUtils.listToString(tSentence, false)); } }