org.apache.lucene.demo.html

Class HTMLParser

Implemented Interfaces:
HTMLParserConstants

public class HTMLParser
extends Object
implements HTMLParserConstants

Field Summary

static int
SUMMARY_LENGTH
Token
jj_nt
boolean
lookingAhead
Token
token
HTMLParserTokenManager
token_source

Fields inherited from interface org.apache.lucene.demo.html.HTMLParserConstants

AfterEquals, ArgEquals, ArgName, ArgQuote1, ArgQuote2, ArgValue, CloseQuote1, CloseQuote2, Comment1, Comment2, CommentEnd1, CommentEnd2, CommentText1, CommentText2, DEFAULT, DeclName, EOF, Entity, HEX, LET, NUM, Punct, Quote1Text, Quote2Text, SP, ScriptEnd, ScriptStart, ScriptText, Space, TagEnd, TagName, WithinComment1, WithinComment2, WithinQuote1, WithinQuote2, WithinScript, WithinTag, Word, tokenImage

Constructor Summary

HTMLParser(File file)
Deprecated. Use HTMLParser(InputStream) instead, passing a FileInputStream opened on the file
HTMLParser(InputStream stream)
HTMLParser(Reader stream)
HTMLParser(HTMLParserTokenManager tm)

Method Summary

Token
ArgValue()
void
CommentTag()
Token
Decl()
void
HTMLDocument()
void
ReInit(InputStream stream)
void
ReInit(Reader stream)
void
ReInit(HTMLParserTokenManager tm)
void
ScriptTag()
void
Tag()
void
disable_tracing()
void
enable_tracing()
ParseException
generateParseException()
Properties
getMetaTags()
Token
getNextToken()
Reader
getReader()
String
getSummary()
String
getTitle()
Token
getToken(int index)

Field Details

SUMMARY_LENGTH

public static int SUMMARY_LENGTH

jj_nt

public Token jj_nt

lookingAhead

public boolean lookingAhead

token

public Token token

token_source

public HTMLParserTokenManager token_source

Constructor Details

HTMLParser

public HTMLParser(File file)
            throws FileNotFoundException

Deprecated. Use HTMLParser(InputStream) instead, passing a FileInputStream opened on the file


HTMLParser

public HTMLParser(InputStream stream)

HTMLParser

public HTMLParser(Reader stream)

HTMLParser

public HTMLParser(HTMLParserTokenManager tm)

Method Details

ArgValue

public final Token ArgValue()
            throws ParseException

CommentTag

public final void CommentTag()
            throws ParseException

Decl

public final Token Decl()
            throws ParseException

HTMLDocument

public final void HTMLDocument()
            throws ParseException,
                   IOException

ReInit

public void ReInit(InputStream stream)

ReInit

public void ReInit(Reader stream)

ReInit

public void ReInit(HTMLParserTokenManager tm)

ScriptTag

public final void ScriptTag()
            throws ParseException

Tag

public final void Tag()
            throws ParseException,
                   IOException

disable_tracing

public final void disable_tracing()

enable_tracing

public final void enable_tracing()

generateParseException

public ParseException generateParseException()

getMetaTags

public Properties getMetaTags()
            throws IOException,
                   InterruptedException

getNextToken

public final Token getNextToken()

getReader

public Reader getReader()
            throws IOException

getSummary

public String getSummary()
            throws IOException,
                   InterruptedException

getTitle

public String getTitle()
            throws IOException,
                   InterruptedException

getToken

public final Token getToken(int index)

Copyright © 2000-2007 Apache Software Foundation. All Rights Reserved.