Package | Description |
---|---|
dkpro.toolbox.corpus | |
dkpro.toolbox.corpus.analyzed | |
dkpro.toolbox.corpus.categorized | |
dkpro.toolbox.corpus.raw | |
dkpro.toolbox.corpus.special | |
Constructor and Description |
---|
BrownCorpus() |
BrownCorpus(String brownPath) |
DkproCorpus(String language, Tag.Tagset tagset, String name, String description, org.apache.uima.collection.CollectionReaderDescription reader) |
SerializedCorpus(String corpusPath) |
SerializedCorpus(String corpusPath, String... patterns) |
Modifier and Type | Method and Description |
---|---|
void | AnalyzedCorpus.getConcordance(String token) |
static AnalyzedCorpus | CorpusManager.getCorpus(CorpusManager.CorpusName name) |
static Sentence | CorpusManager.getSentence(CorpusManager.CorpusName name) |
List<Sentence> | AnalyzedCorpus.getSentenceList() |
Iterable<Sentence> | AnalyzedCorpus.getSentences() |
Iterable<Sentence> | AnalyzedCorpus.getSentences(int maxItems) |
List<TaggedToken> | AnalyzedCorpus.getTaggedTokenList() |
Iterable<TaggedToken> | AnalyzedCorpus.getTaggedTokens() |
Iterable<TaggedToken> | AnalyzedCorpus.getTaggedTokens(int maxItems) |
Iterable<Tag> | AnalyzedCorpus.getTags() |
Iterable<Tag> | AnalyzedCorpus.getTags(int maxItems) |
Tag.Tagset | AnalyzedCorpus.getTagset() |
Iterable<Text> | AnalyzedCorpus.getTexts() |
List<String> | AnalyzedCorpus.getTokenList() |
List<String> | AnalyzedCorpus.getTokenList(boolean toLowerCase) |
Iterable<String> | AnalyzedCorpus.getTokens() |
Iterable<String> | AnalyzedCorpus.getTokens(int maxItems) |
Modifier and Type | Method and Description |
---|---|
void | CategorizedCorpusBase.addCorpus(String category, Tag.Tagset tagset, String language, String name, String description, org.apache.uima.collection.CollectionReaderDescription reader) |
String | UserProvidedCategorizedCorpus.getLanguage(String category) |
String | UdhrCorpus.getLanguage(String category) |
String | InauguralCorpus.getLanguage(String category) |
String | FirstNamesCorpus.getLanguage(String category) |
String | CategorizedCorpus.getLanguage(String category) |
Iterable<Sentence> | CategorizedCorpusBase.getSentences() |
Iterable<Sentence> | CategorizedCorpusBase.getSentences(int maxItems) |
Iterable<Sentence> | CategorizedCorpusBase.getSentences(String category) |
Iterable<Sentence> | CategorizedCorpus.getSentences(String category) |
Iterable<TaggedToken> | CategorizedCorpusBase.getTaggedTokens() |
Iterable<TaggedToken> | CategorizedCorpusBase.getTaggedTokens(int maxItems) |
Iterable<TaggedToken> | CategorizedCorpusBase.getTaggedTokens(String category) |
Iterable<TaggedToken> | CategorizedCorpus.getTaggedTokens(String category) |
Iterable<Tag> | CategorizedCorpusBase.getTags() |
Iterable<Tag> | CategorizedCorpusBase.getTags(int maxItems) |
Iterable<Tag> | CategorizedCorpusBase.getTags(String category) |
Iterable<Tag> | CategorizedCorpus.getTags(String category) |
Tag.Tagset | CategorizedCorpusBase.getTagset() |
Iterable<Text> | CategorizedCorpusBase.getTexts() |
Iterable<Text> | CategorizedCorpusBase.getTexts(String category) |
Iterable<Text> | CategorizedCorpus.getTexts(String category) |
Iterable<String> | CategorizedCorpusBase.getTokens() |
Iterable<String> | CategorizedCorpusBase.getTokens(int maxItems) |
Iterable<String> | CategorizedCorpusBase.getTokens(String category) |
Iterable<String> | CategorizedCorpus.getTokens(String category) |
Constructor and Description |
---|
FirstNamesCorpus() |
InauguralCorpus() |
UdhrCorpus() |
Modifier and Type | Method and Description |
---|---|
String | RawText.getText() |
String | CorpusBackedRawText.getText() |
static RawText | TextManager.getText(TextManager.TextName textName) |
Constructor and Description |
---|
CmuDict() |
ConllCorpus() |
SemCor() |
StopwordsCorpus(StopwordsCorpus.StopwordsLanguage language) |
WordCorpus(WordCorpus.AvailableLanguage language) |
Copyright © 2011-2014. All Rights Reserved.