public class HTMLParser extends java.lang.Object implements HTMLParserConstants
| Modifier and Type | Field and Description |
|---|---|
| Token | jj_nt |
| boolean | lookingAhead |
| static int | SUMMARY_LENGTH |
| Token | token |
| HTMLParserTokenManager | token_source |
Fields inherited from interface HTMLParserConstants:
AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DeclName, DEFAULT, Entity, EOF, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, ScriptEnd, ScriptStart, ScriptText, SP, Space, TagEnd, TagName, tokenImage, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word

| Constructor and Description |
|---|
| HTMLParser(java.io.File file) — Deprecated. Use HTMLParser(FileInputStream) instead |
| HTMLParser(HTMLParserTokenManager tm) |
| HTMLParser(java.io.InputStream stream) |
| HTMLParser(java.io.InputStream stream, java.lang.String encoding) |
| HTMLParser(java.io.Reader stream) |
| Modifier and Type | Method and Description |
|---|---|
| Token | ArgValue() |
| void | CommentTag() |
| Token | Decl() |
| void | disable_tracing() |
| void | enable_tracing() |
| ParseException | generateParseException() |
| java.util.Properties | getMetaTags() |
| Token | getNextToken() |
| java.io.Reader | getReader() |
| java.lang.String | getSummary() |
| java.lang.String | getTitle() |
| Token | getToken(int index) |
| void | HTMLDocument() |
| void | ReInit(HTMLParserTokenManager tm) |
| void | ReInit(java.io.InputStream stream) |
| void | ReInit(java.io.InputStream stream, java.lang.String encoding) |
| void | ReInit(java.io.Reader stream) |
| void | ScriptTag() |
| void | Tag() |
public static int SUMMARY_LENGTH
public HTMLParserTokenManager token_source
public Token token
public Token jj_nt
public boolean lookingAhead
public HTMLParser(java.io.File file)
throws java.io.FileNotFoundException
Throws:
java.io.FileNotFoundException
public HTMLParser(java.io.InputStream stream)
public HTMLParser(java.io.InputStream stream,
java.lang.String encoding)
public HTMLParser(java.io.Reader stream)
public HTMLParser(HTMLParserTokenManager tm)
public java.lang.String getTitle()
throws java.io.IOException,
java.lang.InterruptedException
Throws:
java.io.IOException
java.lang.InterruptedException
public java.util.Properties getMetaTags()
throws java.io.IOException,
java.lang.InterruptedException
Throws:
java.io.IOException
java.lang.InterruptedException
public java.lang.String getSummary()
throws java.io.IOException,
java.lang.InterruptedException
Throws:
java.io.IOException
java.lang.InterruptedException
public java.io.Reader getReader()
throws java.io.IOException
Throws:
java.io.IOException
public final void HTMLDocument()
throws ParseException,
java.io.IOException
Throws:
ParseException
java.io.IOException
public final void Tag()
throws ParseException,
java.io.IOException
Throws:
ParseException
java.io.IOException
public final Token ArgValue() throws ParseException
Throws:
ParseException
public final Token Decl() throws ParseException
Throws:
ParseException
public final void CommentTag()
throws ParseException
Throws:
ParseException
public final void ScriptTag()
throws ParseException
Throws:
ParseException
public void ReInit(java.io.InputStream stream)
public void ReInit(java.io.InputStream stream,
java.lang.String encoding)
public void ReInit(java.io.Reader stream)
public void ReInit(HTMLParserTokenManager tm)
public final Token getNextToken()
public final Token getToken(int index)
public ParseException generateParseException()
public final void enable_tracing()
public final void disable_tracing()
Copyright © 2000-2014 Apache Software Foundation. All Rights Reserved.