|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
sg.edu.nus.comp.nlp.ims.corpus.ACorpus
CTRECCorpus
public class CTRECCorpus
Field Summary |
---|
Fields inherited from class sg.edu.nus.comp.nlp.ims.corpus.ACorpus |
---|
g_LIDX, g_PIDX, g_TIDX, m_AlphabeticPattern, m_Boundaries, m_DefaultDelimiter, m_Delimiter, m_DocIDs, m_IDs, m_Indice, m_Instances, m_Judge, m_Lemmatized, m_Lemmatizer, m_LexeltIDs, m_POSs, m_POSTagged, m_POSTagger, m_SatID2Index, m_SatIDs, m_SatIndice, m_SatSentenceIDs, m_SentenceIDs, m_Sentences, m_SentenceSplitter, m_Split, m_Tags, m_Tokenized, m_Tokenizer |
Constructor Summary | |
---|---|
CTRECCorpus()
default constructor |
|
CTRECCorpus(IPOSTagger p_POSTagger,
ISentenceSplitter p_Splitter,
ITokenizer p_Tokenizer,
ILemmatizer p_Lemmatizer)
constructor with some components |
Method Summary | |
---|---|
protected void |
genInfo()
collect some information |
int |
getLowerBoundary(int p_Sentence)
get lower boundary |
int |
getUpperBoundary(int p_Sentence)
get upper boundary |
boolean |
load(java.io.Reader p_Reader)
load data into corpus |
static void |
main(java.lang.String[] p_Args)
|
protected void |
posTag()
pos tagging |
protected void |
tokenizeSentence(java.lang.String p_Sentence)
tokenize a sentence |
Methods inherited from class sg.edu.nus.comp.nlp.ims.corpus.ACorpus |
---|
alphabetic, clear, getIndexInSentence, getSentence, getSentenceID, getTag, getValue, lemmatize, numOfSentences, setDelimiter, setLemmatized, setPOSTagged, setSplit, setTokenized, size, tokenize, toString |
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, wait, wait, wait |
Constructor Detail |
---|
public CTRECCorpus()
public CTRECCorpus(IPOSTagger p_POSTagger, ISentenceSplitter p_Splitter, ITokenizer p_Tokenizer, ILemmatizer p_Lemmatizer)
p_POSTagger
- POS tagger
p_Splitter
- Sentence splitter
p_Tokenizer
- tokenizer
p_Lemmatizer
- lemmatizer
Method Detail |
---|
public boolean load(java.io.Reader p_Reader)
ICorpus
p_Reader
- reader of the input stream
protected void posTag()
ACorpus
posTag
in class ACorpus
protected void tokenizeSentence(java.lang.String p_Sentence)
ACorpus
tokenizeSentence
in class ACorpus
p_Sentence
- input sentence
protected void genInfo()
ACorpus
genInfo
in class ACorpus
public int getLowerBoundary(int p_Sentence)
ICorpus
getLowerBoundary
in interface ICorpus
getLowerBoundary
in class ACorpus
p_Sentence
- sentence number
public int getUpperBoundary(int p_Sentence)
ICorpus
getUpperBoundary
in interface ICorpus
getUpperBoundary
in class ACorpus
p_Sentence
- sentence number
public static void main(java.lang.String[] p_Args)
p_Args
- arguments
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |