org.openpipeline.pipeline.docfilter
Class HTMLLexer

java.lang.Object
  extended by org.openpipeline.pipeline.docfilter.HTMLLexer

public final class HTMLLexer
extends Object


Field Summary
static int AMP
           
static int APOS
           
static int BASE
           
static int CHAR
           
static int COMMENT
           
static int DOCTYPE
           
static int ENDANCHOR
           
static int ENDHEAD
           
static int ENDNOINDEX
           
static int ENDTAG
           
static int ENDTITLE
           
static int EOF
           
static int FRAME
           
static int GT
           
static int IMG
           
static int LT
           
static int META
           
static int NBSP
           
static int NEWLINE
           
static int QUOT
           
static String[] resultAsString
           
static int SCRIPT
           
static int STARTANCHOR
           
static int STARTHEAD
           
static int STARTNOINDEX
           
static int STARTTAG
           
static int STARTTITLE
           
static int STYLE
           
static int SYMBOL_CHAR
           
static int SYMBOL_DECIMAL
           
static int SYMBOL_HEX
           
static int TEXT
           
static int WHITESPACE
           
 
Constructor Summary
HTMLLexer()
           
HTMLLexer(InputStream in)
          Creates a new scanner.
HTMLLexer(Reader in)
          Creates a new scanner. There is also a java.io.InputStream version of this constructor.
 
Method Summary
 char getChar()
           
 int getOffset()
           
 int getSize()
           
 int getText(char[] dest, int destOffset)
           
 int lex()
           
 int lex(FastStringBuffer matchedText)
           
 void reset(Reader reader)
           
 
Methods inherited from class java.lang.Object
equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Field Detail

EOF

public static final int EOF
See Also:
Constant Field Values

TEXT

public static final int TEXT
See Also:
Constant Field Values

CHAR

public static final int CHAR
See Also:
Constant Field Values

COMMENT

public static final int COMMENT
See Also:
Constant Field Values

STARTTITLE

public static final int STARTTITLE
See Also:
Constant Field Values

ENDTITLE

public static final int ENDTITLE
See Also:
Constant Field Values

STARTHEAD

public static final int STARTHEAD
See Also:
Constant Field Values

ENDHEAD

public static final int ENDHEAD
See Also:
Constant Field Values

STARTTAG

public static final int STARTTAG
See Also:
Constant Field Values

ENDTAG

public static final int ENDTAG
See Also:
Constant Field Values

SCRIPT

public static final int SCRIPT
See Also:
Constant Field Values

META

public static final int META
See Also:
Constant Field Values

STYLE

public static final int STYLE
See Also:
Constant Field Values

DOCTYPE

public static final int DOCTYPE
See Also:
Constant Field Values

IMG

public static final int IMG
See Also:
Constant Field Values

NEWLINE

public static final int NEWLINE
See Also:
Constant Field Values

WHITESPACE

public static final int WHITESPACE
See Also:
Constant Field Values

STARTANCHOR

public static final int STARTANCHOR
See Also:
Constant Field Values

ENDANCHOR

public static final int ENDANCHOR
See Also:
Constant Field Values

FRAME

public static final int FRAME
See Also:
Constant Field Values

NBSP

public static final int NBSP
See Also:
Constant Field Values

AMP

public static final int AMP
See Also:
Constant Field Values

GT

public static final int GT
See Also:
Constant Field Values

LT

public static final int LT
See Also:
Constant Field Values

QUOT

public static final int QUOT
See Also:
Constant Field Values

APOS

public static final int APOS
See Also:
Constant Field Values

SYMBOL_DECIMAL

public static final int SYMBOL_DECIMAL
See Also:
Constant Field Values

SYMBOL_HEX

public static final int SYMBOL_HEX
See Also:
Constant Field Values

SYMBOL_CHAR

public static final int SYMBOL_CHAR
See Also:
Constant Field Values

BASE

public static final int BASE
See Also:
Constant Field Values

STARTNOINDEX

public static final int STARTNOINDEX
See Also:
Constant Field Values

ENDNOINDEX

public static final int ENDNOINDEX
See Also:
Constant Field Values

resultAsString

public static final String[] resultAsString
Constructor Detail

HTMLLexer

public HTMLLexer()

HTMLLexer

public HTMLLexer(Reader in)
Creates a new scanner. There is also a java.io.InputStream version of this constructor.

Parameters:
in - the java.io.Reader to read input from.

HTMLLexer

public HTMLLexer(InputStream in)
Creates a new scanner. There is also a java.io.Reader version of this constructor.

Parameters:
in - the java.io.InputStream to read input from.
Method Detail

lex

public int lex(FastStringBuffer matchedText)
        throws IOException
Throws:
IOException

lex

public int lex()
        throws IOException
Throws:
IOException

getText

public int getText(char[] dest,
                   int destOffset)

getChar

public char getChar()

reset

public void reset(Reader reader)

getOffset

public int getOffset()

getSize

public int getSize()