PK 2MMMETA-INF/MANIFEST.MFManifest-Version: 1.0 Main-Class: edu.nus.comp.nlp.tool.SentenceSplitter PK 2}_%edu/nus/comp/nlp/tool/PlainText.class. ; : : :  : : :               :   sentDelimLjava/lang/String; ConstantValueextraStr singleLineZtextLjava/lang/StringBuffer;sents[Ljava/lang/String;()VCodeLineNumberTableLocalVariableTablethis!Ledu/nus/comp/nlp/tool/PlainText;(Ljava/lang/String;)VfileName'(Ljava/lang/String;Ljava/lang/String;)V commentFlag(Ljava/lang/StringBuffer;)Vstr getSentCount()IaddQuote'(ZLjava/lang/String;)Ljava/lang/String; debugModeexStr(Z)Ljava/lang/String;iIoutStropenFlag closingFlag mergeQuots pureTextAsplitSentences()[Ljava/lang/String;9(Ljava/lang/String;Ljava/lang/String;)[Ljava/lang/String; previousSentendingtmp mSentenceHeadLjava/util/regex/Matcher; lastWdIdx tokenizerLjava/util/StringTokenizer;sentence title_acronym pSentenceHeadLjava/util/regex/Pattern;acronym openQuotationdelimLjava/util/ArrayList;delimForTokenizerout setSingleLine(Z)Vb removeTag pureTextB pureTextCrundebugtoString()Ljava/lang/String; SourceFilePlainText.java FG BC DE _G ~"``|''|\?"|\!"|\."|\. |\. | |\!|\? ac ?= UYjava/lang/String java/lang/StringBuffer    FMjava/util/ArrayList !|"|\.|\?java/util/StringTokenizer F(<[.[^<>]]+>\s?)*\s*[A-Z"].*   T " T    ([A-Z]\.)+ @A y  \&\w{1,8}\; u Medu/nus/comp/nlp/tool/PlainTextjava/lang/Objectedu/nus/comp/nlp/tool/UtilreadFile,(Ljava/lang/String;)Ljava/lang/StringBuffer;>(Ljava/lang/String;Ljava/lang/String;)Ljava/lang/StringBuffer;appendvalueOf(I)Ljava/lang/String;mergeDoubleSingleQuots&(Ljava/lang/String;)Ljava/lang/String;((Ljava/lang/String;Ljava/lang/String;Z)Vjava/util/regex/Patterncompile-(Ljava/lang/String;)Ljava/util/regex/Pattern; hasMoreTokens()Z nextTokentrimmatcher3(Ljava/lang/CharSequence;)Ljava/util/regex/Matcher;lengthmatches(Ljava/lang/String;)Zadd(Ljava/lang/Object;)Zequalssizeget(I)Ljava/lang/Object; substringremovejava/util/regex/Matcher lookingAt lastIndexOf(Ljava/lang/String;)Iedu/nus/comp/nlp/tool/TitleListcontains replaceAll8(Ljava/lang/String;Ljava/lang/String;)Ljava/lang/String;removeBlankLinejava/lang/SystemLjava/io/PrintStream;java/io/PrintStreamprintln!:;<=>?=@ABCDEFGHE***I73 48J KLFMHc****+*I:3 4;<=JKLN=FOHn****+,*I?3 4@ABJ KLN=P=FQH`****+*ID3 4EFGJKLRCSTHO*** *IJKNJ KLUVHN *W, * I RSJ  KL WA X=UYHI***  Y MN:6*MY,`- *2 M;Y,- *2 Mm,I2 [\_a"b&d3e7f~hjdnJ>)Z[KLWA\="]=&^=_GHT*L*Y+Ir stJKL `=abH7 * IwJ  KL acH/7YMN*ɻY*-::: :66 ! Y"#$:  %:  & -'; &0Y :!,(W )*  6 : ,+,,+d, #:   &d-:  -'R,+/,Y,,+d.  (W:,Y (WY : )* 6 ,Y,,+d.  (W /&w,+p  0`-1,Y,,+d.  :j,Y,,+d.  (W:: /,(W :6Y #:0`6 & -1Y: -2'Y:6s:& ,(W],+ :306,+!,, 4Sܧ&6,+,, SI*J{| }"),/7HQY\er!:=X[eq.59<?Xckn{    .4Jd= se= Hf= Qgh coi[ jkl="m=)no,pA/qA 'Z[ Z[7B=7r=/Ds ,t=YuEvwH=3I JKLxAyGH~&*5L+6M,74N*Y-I  !%"J*&KL `=z= {=|GH: 8* 9I % &J  KL|wHD 8* 9I ) *J KL }A~H2*I.J KLGH&  3I /2PK 2+47 7 ,edu/nus/comp/nlp/tool/SentenceSplitter.class. *C DEF GHIJKLMNOPQ DRST DUVW C )XY Z[\]^_`a bcde "f Dg "h "i "j "klm versionInfoLjava/lang/String; ConstantValue()VCodeLineNumberTableLocalVariableTablethis(Ledu/nus/comp/nlp/tool/SentenceSplitter;showHelpMessagemain([Ljava/lang/String;)ViIargs[Ljava/lang/String;showIdxZextraStr plainText1!Ledu/nus/comp/nlp/tool/PlainText; SourceFileSentenceSplitter.java ./n opfUsage: java -classpath SentenceSplitter.jar edu.nus.comp.nlp.tool.SentenceSplitter [options] textfileq rs6Or: java -jar SentenceSplitter.jar [options] textfile@Splits the text file into sentences. XML style tags are removed.Options:' -a str Surrounds sentences with str. -help Displays this message., -i Displays sentences with numeric index.) -s Puts single sentence in each line. -tag Keeps tags. -v Version information. tu SingleLinefalse vw RetainTagjava/lang/String 5/-i xy-strue-tag-a\n -help z{-v&SentenceSplitter version 2.02 20050725edu/nus/comp/nlp/tool/PlainText .s |} ~ >, / &edu/nus/comp/nlp/tool/SentenceSplitterjava/lang/Objectjava/lang/SystemoutLjava/io/PrintStream;java/io/PrintStreamprintln(Ljava/lang/String;)Vexit(I)V setProperty8(Ljava/lang/String;Ljava/lang/String;)Ljava/lang/String;equals(Ljava/lang/Object;)ZendsWith(Ljava/lang/String;)Z getProperty&(Ljava/lang/String;)Ljava/lang/String; setSingleLine(Z)V removeTagrun!)*+,-!./03*1 2 34 5/0U     12  (08@ H!P"T# 670<WWYM*>**2<*2 W*2 W*2*`2*`2M*2*2 !|"Y**d2#N-$%-W,&$-'-(1r() *+, -#0+16284C5K7V8^:i;=>@AB0FGHIJLM24%89:;<=>,+?@ABPK 2b*%edu/nus/comp/nlp/tool/TitleList.class.'      !listLjava/lang/String;()VCodeLineNumberTableLocalVariableTablethis!Ledu/nus/comp/nlp/tool/TitleList;contains(Ljava/lang/String;)Zwd SourceFileTitleList.java "# $%java/lang/StringA|Adj|Adm|Adv|Asst|B|Bart|Bldg|Brig|Bros|C|Capt|Cmdr|Col|Comdr|Con|Cpl|D|DR|Dr|E|Ens|F|G|Gen|Gov|H|Hon|Hosp|I|Insp|J|K|L|Lt|M|MM|MR|MRS|MS|Maj|Messrs|Mlle|Mme|Mr|Mrs|Ms|Msgr|Mt|N|No|O|Op|Ord|P|Pfc|Ph|Prof|Pvt|Q|R|Rep|Reps|Res|Rev|Rt|S|Sen|Sens|Sfc|Sgt|Sr|St|Supt|Surg|T|U|V|W|X|Y|Z|v|vs &edu/nus/comp/nlp/tool/TitleListjava/lang/Object toLowerCase()Ljava/lang/String;indexOf(Ljava/lang/String;)I(Ljava/lang/String;)V!   3*   >*   (YPK 2BhMHH edu/nus/comp/nlp/tool/Util.class. ?{ >|} {~              > {     +{ + +     ;()VCodeLineNumberTableLocalVariableTablethisLedu/nus/comp/nlp/tool/Util;readFile,(Ljava/lang/String;)Ljava/lang/StringBuffer;fileNameLjava/lang/String;>(Ljava/lang/String;Ljava/lang/String;)Ljava/lang/StringBuffer;inLjava/io/BufferedReader;sexLjava/io/IOException; commentFlagsbLjava/lang/StringBuffer;write((Ljava/lang/String;Ljava/lang/String;Z)VoutLjava/io/PrintWriter;contentappendZ'(Ljava/lang/String;Ljava/lang/String;)V removeTag&(Ljava/lang/String;)Ljava/lang/String;strrstpLjava/util/regex/Pattern;mLjava/util/regex/Matcher;removeBlankLine removeSpacemergeDoubleSingleQuotsnumberOfTokens(Ljava/lang/String;)IiIdelimtks[Ljava/lang/String;tkSetLjava/util/HashSet;UnixSystemCallcmdprocLjava/lang/Process;eLjava/lang/Exception;commandoutputFileNameoutput SourceFile Util.java @A GKjava/lang/StringBufferjava/io/BufferedReaderjava/io/FileReader @ @ YHline.separator ] Ajava/io/IOException Ajava/io/PrintWriterjava/io/BufferedWriterjava/io/FileWriter @ @ TUjava/lang/String <[.[^<>]]+>   ] ([\s^ ]* [\s^ ]*)+ \s ''|``" | java/util/HashSet /bin/sh-culimit -s unlimited; >   java/lang/Exception Wrong while running java/io/InputStreamReader @edu/nus/comp/nlp/tool/Utiljava/lang/Object(Ljava/lang/String;)V(Ljava/io/Reader;)VreadLine()Ljava/lang/String;trim startsWith(Ljava/lang/String;)Zjava/lang/System getPropertycloseprintStackTrace(Ljava/lang/String;Z)V(Ljava/io/Writer;)Vprintlnjava/util/regex/Patterncompile-(Ljava/lang/String;)Ljava/util/regex/Pattern;matcher3(Ljava/lang/CharSequence;)Ljava/util/regex/Matcher;java/util/regex/Matcher replaceAll8(Ljava/lang/String;Ljava/lang/String;)Ljava/lang/String;split'(Ljava/lang/String;)[Ljava/lang/String;add(Ljava/lang/Object;)Zsize()ItoStringjava/lang/Runtime getRuntime()Ljava/lang/Runtime;exec(([Ljava/lang/String;)Ljava/lang/Process;java/lang/ProcesswaitForerrLjava/io/PrintStream;java/io/PrintStreamgetInputStream()Ljava/io/InputStream;(Ljava/io/InputStream;)V!>? @AB3*C D EF GHB0*CD IJ GKBWYMYY*N- Y:*+ + , W,  W-N-,MPC6 ""#2&5(<*F+I,M0P.Q/U1D>5LM.NJQOPWIJWQJORS TUB*YYY*N-+-N-!$C79:!>$<%=)?D4 VW%OP*IJ*XJ*YZ T[B?*+C FGDIJXJ \]BuYLM,*N- !L+CJKLMND*^J_J`a bc d]BuYL"M,*N-#!L+CSTUVWD*^J_J`a bc e]B3 *$%&C[D  ^J f]B3 *'(&C_D  ^J ghB/)L*+*M+Y,N6,-,2-W-.Cde fgh$g*jD4ij/XJ,kJ &lmno p[BYY/SY0SYY1 * 2 + 3SM4,5N-6WM8Y9 * 3:;>7Co.s6t;y>w?xXzD4. qm6rs?tuYvJYwJ p]B.YLY/SY0SYY1 * 3SM4,5NY;Y-<=: Y:Y+  # 3L-6WM8Y9 * 3:+ux7C2 }-5ITmpuxyDH-Hqm5@rsI,LMQ$NJytuvJxJyzPK 2MMMETA-INF/MANIFEST.MFPK 2}_%edu/nus/comp/nlp/tool/PlainText.classPK 2+47 7 ,bedu/nus/comp/nlp/tool/SentenceSplitter.classPK 2b*% edu/nus/comp/nlp/tool/TitleList.classPK 2BhMHH $edu/nus/comp/nlp/tool/Util.classPKr6