public class HTMLParser extends Object implements HTMLParserConstants
Modifier and Type | Field and Description |
---|---|
Token | jj_nt |
boolean | lookingAhead |
static int | SUMMARY_LENGTH |
Token | token |
HTMLParserTokenManager | token_source |
AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DeclName, DEFAULT, Entity, EOF, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, ScriptEnd, ScriptStart, ScriptText, SP, Space, TagEnd, TagName, tokenImage, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word
Constructor and Description |
---|
HTMLParser(File file) Deprecated. Use HTMLParser(FileInputStream) instead. |
HTMLParser(HTMLParserTokenManager tm) |
HTMLParser(InputStream stream) |
HTMLParser(Reader stream) |
Modifier and Type | Method and Description |
---|---|
Token | ArgValue() |
void | CommentTag() |
Token | Decl() |
void | disable_tracing() |
void | enable_tracing() |
ParseException | generateParseException() |
Properties | getMetaTags() |
Token | getNextToken() |
Reader | getReader() |
String | getSummary() |
String | getTitle() |
Token | getToken(int index) |
void | HTMLDocument() |
void | ReInit(HTMLParserTokenManager tm) |
void | ReInit(InputStream stream) |
void | ReInit(Reader stream) |
void | ScriptTag() |
void | Tag() |
public static int SUMMARY_LENGTH
public HTMLParserTokenManager token_source
public Token token
public Token jj_nt
public boolean lookingAhead
public HTMLParser(File file) throws FileNotFoundException
Throws: FileNotFoundException
public HTMLParser(InputStream stream)
public HTMLParser(Reader stream)
public HTMLParser(HTMLParserTokenManager tm)
public String getTitle() throws IOException, InterruptedException
Throws: IOException, InterruptedException
public Properties getMetaTags() throws IOException, InterruptedException
Throws: IOException, InterruptedException
public String getSummary() throws IOException, InterruptedException
Throws: IOException, InterruptedException
public Reader getReader() throws IOException
Throws: IOException
public final void HTMLDocument() throws ParseException, IOException
Throws: ParseException, IOException
public final void Tag() throws ParseException, IOException
Throws: ParseException, IOException
public final Token ArgValue() throws ParseException
Throws: ParseException
public final Token Decl() throws ParseException
Throws: ParseException
public final void CommentTag() throws ParseException
Throws: ParseException
public final void ScriptTag() throws ParseException
Throws: ParseException
public void ReInit(InputStream stream)
public void ReInit(Reader stream)
public void ReInit(HTMLParserTokenManager tm)
public final Token getNextToken()
public final Token getToken(int index)
public ParseException generateParseException()
public final void enable_tracing()
public final void disable_tracing()
Copyright © 2000-2013 Apache Software Foundation. All Rights Reserved.