public class AnalyzedCorpus extends Object implements Corpus
AnalyzedCorpus is a special object that is backed by a Corpus, but provides additional analysis methods.
Inspired by NLTK.

Constructor and Description |
---|
AnalyzedCorpus(Corpus corpus) |
Modifier and Type | Method and Description |
---|---|
void | getConcordance(String token) |
String | getDescription() |
String | getLanguage() |
String | getName() |
List<Sentence> | getSentenceList() |
Iterable<Sentence> | getSentences() |
Iterable<Sentence> | getSentences(int maxItems) |
List<TaggedToken> | getTaggedTokenList() |
Iterable<TaggedToken> | getTaggedTokens() |
Iterable<TaggedToken> | getTaggedTokens(int maxItems) |
Iterable<Tag> | getTags() |
Iterable<Tag> | getTags(int maxItems) |
Tag.Tagset | getTagset() |
Iterable<Text> | getTexts() |
List<String> | getTokenList() |
List<String> | getTokenList(boolean toLowerCase) |
Iterable<String> | getTokens() |
Iterable<String> | getTokens(int maxItems) |
Corpus | getUnderlyingCorpus() |
public AnalyzedCorpus(Corpus corpus)
public Corpus getUnderlyingCorpus()
public List<Sentence> getSentenceList() throws CorpusException
CorpusException
public List<String> getTokenList() throws CorpusException
CorpusException
public List<String> getTokenList(boolean toLowerCase) throws CorpusException
CorpusException
public List<TaggedToken> getTaggedTokenList() throws CorpusException
CorpusException
public void getConcordance(String token) throws CorpusException
CorpusException
public Iterable<Tag> getTags() throws CorpusException
getTags
in interface Corpus
CorpusException
public Iterable<Text> getTexts() throws CorpusException
getTexts
in interface Corpus
CorpusException
public Iterable<String> getTokens() throws CorpusException
getTokens
in interface Corpus
CorpusException
public Iterable<TaggedToken> getTaggedTokens() throws CorpusException
getTaggedTokens
in interface Corpus
CorpusException
public Iterable<Sentence> getSentences() throws CorpusException
getSentences
in interface Corpus
CorpusException
public Tag.Tagset getTagset() throws CorpusException
getTagset
in interface Corpus
CorpusException
public Iterable<String> getTokens(int maxItems) throws CorpusException
getTokens
in interface Corpus
CorpusException
public Iterable<TaggedToken> getTaggedTokens(int maxItems) throws CorpusException
getTaggedTokens
in interface Corpus
CorpusException
public Iterable<Sentence> getSentences(int maxItems) throws CorpusException
getSentences
in interface Corpus
CorpusException
public Iterable<Tag> getTags(int maxItems) throws CorpusException
getTags
in interface Corpus
CorpusException
public String getLanguage()
getLanguage
in interface Corpus
public String getDescription()
getDescription
in interface Corpus
Copyright © 2011-2014. All Rights Reserved.