Package org.apache.lucene.demo.html
Class HTMLParser
java.lang.Object
org.apache.lucene.demo.html.HTMLParser
- All Implemented Interfaces:
HTMLParserConstants
-
Field Summary
Fields
Modifier and Type | Field | Description
boolean | lookingAhead |
static int | SUMMARY_LENGTH |
Fields inherited from interface org.apache.lucene.demo.html.HTMLParserConstants
AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DeclName, DEFAULT, Entity, EOF, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, ScriptEnd, ScriptStart, ScriptText, SP, Space, TagEnd, TagName, tokenImage, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word -
Constructor Summary
Constructors
Constructor | Description
HTMLParser(File file) | Deprecated. Use HTMLParser(FileInputStream) instead.
HTMLParser(InputStream stream) |
HTMLParser(InputStream stream, String encoding) |
HTMLParser(Reader stream) |
-
Method Summary
Modifier and TypeMethodDescriptionfinal TokenArgValue()final voidfinal TokenDecl()final voidfinal voidfinal TokengetTitle()final TokengetToken(int index) final voidvoidparse()voidReInit(InputStream stream) voidReInit(InputStream stream, String encoding) voidvoidfinal voidvoidsetException(Exception exception) final voidTag()
-
Field Details
-
SUMMARY_LENGTH
public static int SUMMARY_LENGTH -
token_source
-
token
-
jj_nt
-
lookingAhead
public boolean lookingAhead
-
-
Constructor Details
-
HTMLParser
Deprecated. Use HTMLParser(FileInputStream) instead.
- Throws:
FileNotFoundException
-
HTMLParser
-
HTMLParser
-
HTMLParser
-
HTMLParser
-
-
Method Details
-
getTitle
- Throws:
IOException, InterruptedException
-
getMetaTags
- Throws:
IOException, InterruptedException
-
getSummary
- Throws:
IOException, InterruptedException
-
getReader
- Throws:
IOException
-
parse
- Throws:
IOException
-
HTMLDocument
- Throws:
ParseException, IOException
-
Tag
- Throws:
ParseException, IOException
-
ArgValue
- Throws:
ParseException
-
Decl
- Throws:
ParseException
-
CommentTag
- Throws:
ParseException
-
ScriptTag
- Throws:
ParseException
-
ReInit
-
ReInit
-
ReInit
-
ReInit
-
getNextToken
-
getToken
-
generateParseException
-
enable_tracing
public final void enable_tracing() -
disable_tracing
public final void disable_tracing() -
setException
-
getException
-