Package org.apache.lucene.demo.html
Class HTMLParser
java.lang.Object
org.apache.lucene.demo.html.HTMLParser
- All Implemented Interfaces:
HTMLParserConstants
-
Field Summary
Modifier and Type | Field | Description
boolean | lookingAhead
static int | SUMMARY_LENGTH
Fields inherited from interface org.apache.lucene.demo.html.HTMLParserConstants
AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DeclName, DEFAULT, Entity, EOF, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, ScriptEnd, ScriptStart, ScriptText, SP, Space, TagEnd, TagName, tokenImage, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word
-
Constructor Summary
Constructor | Description
HTMLParser(File file) | Deprecated. Use HTMLParser(FileInputStream) instead.
HTMLParser(InputStream stream)
HTMLParser(InputStream stream, String encoding)
HTMLParser(Reader stream)
-
Method Summary
Modifier and Type | Method | Description
final Token | ArgValue()
final void
final Token
Decl()
final void
final void
final Token
getTitle()
final Token
getToken
(int index) final void
void
parse()
void
ReInit
(InputStream stream) void
ReInit
(InputStream stream, String encoding) void
void
final void
void
setException
(Exception exception) final void
Tag()
-
Field Details
-
SUMMARY_LENGTH
public static int SUMMARY_LENGTH -
token_source
-
token
-
jj_nt
-
lookingAhead
public boolean lookingAhead
-
-
Constructor Details
-
HTMLParser
Deprecated. Use HTMLParser(FileInputStream) instead.
- Throws:
FileNotFoundException
-
HTMLParser
-
HTMLParser
-
HTMLParser
-
HTMLParser
-
-
Method Details
-
getTitle
- Throws:
IOException
InterruptedException
-
getMetaTags
- Throws:
IOException
InterruptedException
-
getSummary
- Throws:
IOException
InterruptedException
-
getReader
- Throws:
IOException
-
parse
- Throws:
IOException
-
HTMLDocument
- Throws:
ParseException
IOException
-
Tag
- Throws:
ParseException
IOException
-
ArgValue
- Throws:
ParseException
-
Decl
- Throws:
ParseException
-
CommentTag
- Throws:
ParseException
-
ScriptTag
- Throws:
ParseException
-
ReInit
-
ReInit
-
ReInit
-
ReInit
-
getNextToken
-
getToken
-
generateParseException
-
enable_tracing
public final void enable_tracing() -
disable_tracing
public final void disable_tracing() -
setException
-
getException
-