|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
  extended by org.apache.lucene.benchmark.byTask.feeds.demohtml.HTMLParser
public class HTMLParser
Field Summary | |
---|---|
Token |
jj_nt
Next token. |
static int |
SUMMARY_LENGTH
|
Token |
token
Current token. |
HTMLParserTokenManager |
token_source
Generated Token Manager. |
Fields inherited from interface org.apache.lucene.benchmark.byTask.feeds.demohtml.HTMLParserConstants |
---|
AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DeclName, DEFAULT, Entity, EOF, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, ScriptEnd, ScriptStart, ScriptText, SP, Space, TagEnd, TagName, tokenImage, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word |
Constructor Summary | |
---|---|
HTMLParser(HTMLParserTokenManager tm)
Constructor with generated Token Manager. |
|
HTMLParser(InputStream stream)
Constructor with InputStream. |
|
HTMLParser(InputStream stream, String encoding)
Constructor with InputStream and supplied encoding. |
|
HTMLParser(Reader stream)
Constructor. |
Method Summary | |
---|---|
Token |
ArgValue()
|
void |
CommentTag()
|
Token |
Decl()
|
void |
disable_tracing()
Disable tracing. |
void |
enable_tracing()
Enable tracing. |
ParseException |
generateParseException()
Generate ParseException. |
Properties |
getMetaTags()
|
Token |
getNextToken()
Get the next Token. |
Reader |
getReader()
|
String |
getSummary()
|
String |
getTitle()
|
Token |
getToken(int index)
Get the specific Token. |
void |
HTMLDocument()
|
void |
ReInit(HTMLParserTokenManager tm)
Reinitialise. |
void |
ReInit(InputStream stream)
Reinitialise. |
void |
ReInit(InputStream stream, String encoding)
Reinitialise. |
void |
ReInit(Reader stream)
Reinitialise. |
void |
ScriptTag()
|
void |
Tag()
|
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Field Detail |
---|
public static int SUMMARY_LENGTH
public HTMLParserTokenManager token_source
public Token token
public Token jj_nt
Constructor Detail |
---|
public HTMLParser(InputStream stream)
public HTMLParser(InputStream stream, String encoding)
public HTMLParser(Reader stream)
public HTMLParser(HTMLParserTokenManager tm)
Method Detail |
---|
public String getTitle() throws IOException, InterruptedException
IOException
InterruptedException
public Properties getMetaTags() throws IOException, InterruptedException
IOException
InterruptedException
public String getSummary() throws IOException, InterruptedException
IOException
InterruptedException
public Reader getReader() throws IOException
IOException
public final void HTMLDocument() throws ParseException, IOException
ParseException
IOException
public final void Tag() throws ParseException, IOException
ParseException
IOException
public final Token ArgValue() throws ParseException
ParseException
public final Token Decl() throws ParseException
ParseException
public final void CommentTag() throws ParseException
ParseException
public final void ScriptTag() throws ParseException
ParseException
public void ReInit(InputStream stream)
public void ReInit(InputStream stream, String encoding)
public void ReInit(Reader stream)
public void ReInit(HTMLParserTokenManager tm)
public final Token getNextToken()
public final Token getToken(int index)
public ParseException generateParseException()
public final void enable_tracing()
public final void disable_tracing()
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |