Package nu.validator.htmlparser.impl
Class Tokenizer
- java.lang.Object
-
- nu.validator.htmlparser.impl.Tokenizer
-
- All Implemented Interfaces:
org.xml.sax.Locator
- Direct Known Subclasses:
ErrorReportingTokenizer
public class Tokenizer extends java.lang.Object implements org.xml.sax.Locator
An implementation of http://www.whatwg.org/specs/web-apps/current-work/multipage/tokenization.html
This class implements the Locator interface. This is not an incidental implementation detail: users of this class are encouraged to make use of the Locator nature. By default, the tokenizer may report data that XML 1.0 bans. The tokenizer can be configured to treat these conditions as fatal or to coerce the infoset to something that XML 1.0 allows.
- Version:
- $Id$
- Author:
- hsivonen
-
-
Field Summary
-
Constructor Summary
Constructors
Constructor Description
Tokenizer(TokenHandler tokenHandler) The constructor.
Tokenizer(TokenHandler tokenHandler, boolean newAttributesEachTime)
-
Method Summary
All Methods Instance Methods Concrete Methods Modifier and Type Method Description voidbecomeConfident()protected charcheckChar(char[] buf, int pos)voidend()voideof()voiderr(java.lang.String message)Reports a Parse Error.protected voiderrAstralNonCharacter(int ch)protected voiderrAttributeValueMissing()protected voiderrBadCharAfterLt(char c)protected voiderrBadCharBeforeAttributeNameOrNull(char c)protected voiderrBogusComment()protected voiderrBogusDoctype()protected voiderrCharRefLacksSemicolon()protected voiderrConsecutiveHyphens()protected voiderrDuplicateAttribute()protected voiderrEofAfterLt()protected voiderrEofInAttributeName()protected voiderrEofInAttributeValue()protected voiderrEofInComment()protected voiderrEofInDoctype()protected voiderrEofInEndTag()protected voiderrEofInPublicId()protected voiderrEofInSystemId()protected voiderrEofInTagName()protected voiderrEofWithoutGt()protected voiderrEqualsSignBeforeAttributeName()protected voiderrExpectedPublicId()protected voiderrExpectedSystemId()protected voiderrGarbageAfterLtSlash()protected voiderrGtInPublicId()protected voiderrGtInSystemId()protected voiderrHtml4LtSlashInRcdata(char folded)protected voiderrHtml4NonNameInUnquotedAttribute(char c)protected voiderrHtml4XmlVoidSyntax()protected voiderrHyphenHyphenBang()protected voiderrLtGt()protected voiderrLtOrEqualsOrGraveInUnquotedAttributeOrNull(char c)protected voiderrLtSlashGt()protected voiderrMissingSpaceBeforeDoctypeName()protected voiderrNamelessDoctype()protected voiderrNcrControlChar()protected charerrNcrControlChar(char ch)protected voiderrNcrCr()protected voiderrNcrInC1Range()protected charerrNcrNonCharacter(char ch)protected voiderrNcrOutOfRange()protected voiderrNcrSurrogate()protected voiderrNcrUnassigned()protected voiderrNcrZero()protected voiderrNoDigitsInNCR()protected voiderrNoNamedCharacterMatch()protected voiderrNoSpaceBetweenAttributes()protected voiderrNoSpaceBetweenDoctypePublicKeywordAndQuote()protected 
voiderrNoSpaceBetweenDoctypeSystemKeywordAndQuote()protected voiderrNoSpaceBetweenPublicAndSystemIds()protected voiderrNotSemicolonTerminated()protected voiderrPrematureEndOfComment()protected voiderrProcessingInstruction()protected voiderrQuoteBeforeAttributeName(char c)protected voiderrQuoteOrLtInAttributeNameOrNull(char c)protected voiderrSlashNotFollowedByGt()voiderrTreeBuilder(java.lang.String message)protected voiderrUnescapedAmpersandInterpretedAsCharacterReference()protected voiderrUnquotedAttributeValOrNull(char c)protected voiderrWarnLtSlashInRcdata()voidfatal(java.lang.String message)Reports an condition that would make the infoset incompatible with XML 1.0 as fatal.protected voidflushChars(char[] buf, int pos)Flushes coalesced character tokens.intgetCol()Returns the col.intgetColumnNumber()org.xml.sax.ErrorHandlergetErrorHandler()intgetLine()Returns the line.intgetLineNumber()java.lang.StringgetPublicId()java.lang.StringgetSystemId()voidinitializeWithoutStarting()voidinitLocation(java.lang.String newPublicId, java.lang.String newSystemId)booleaninternalEncodingDeclaration(java.lang.String internalCharset)booleanisAlreadyComplainedAboutNonAscii()Returns the alreadyComplainedAboutNonAscii.booleanisInDataState()booleanisMappingLangToXmlLang()Returns the mappingLangToXmlLang.booleanisNextCharOnNewLine()Returns the nextCharOnNewLine.booleanisPrevCR()voidloadState(Tokenizer other)protected voidmaybeErrAttributesOnEndTag(HtmlAttributes attrs)protected voidmaybeErrSlashInEndTag(boolean selfClosing)protected voidmaybeWarnPrivateUse(char ch)protected voidmaybeWarnPrivateUseAstral()protected voidnoteAttributeWithoutValue()protected voidnoteUnquotedAttributeValue()voidnotifyAboutMetaBoundary()voidrequestSuspension()voidresetToDataState()voidsetCommentPolicy(XmlViolationPolicy commentPolicy)Sets the commentPolicy.voidsetContentNonXmlCharPolicy(XmlViolationPolicy contentNonXmlCharPolicy)Sets the contentNonXmlCharPolicy.voidsetContentSpacePolicy(XmlViolationPolicy 
contentSpacePolicy)Sets the contentSpacePolicy.voidsetEncodingDeclarationHandler(EncodingDeclarationHandler encodingDeclarationHandler)Sets the encodingDeclarationHandler.voidsetErrorHandler(org.xml.sax.ErrorHandler eh)Sets the error handler.voidsetHtml4ModeCompatibleWithXhtml1Schemata(boolean html4ModeCompatibleWithXhtml1Schemata)Sets the html4ModeCompatibleWithXhtml1Schemata.voidsetInterner(Interner interner)voidsetLineNumber(int line)For C++ use only.voidsetMappingLangToXmlLang(boolean mappingLangToXmlLang)Sets the mappingLangToXmlLang.voidsetNamePolicy(XmlViolationPolicy namePolicy)voidsetStateAndEndTagExpectation(int specialTokenizerState, java.lang.String endTagExpectation)Sets the tokenizer state and the associated element name.voidsetStateAndEndTagExpectation(int specialTokenizerState, ElementName endTagExpectation)Sets the tokenizer state and the associated element name.voidsetTransitionBaseOffset(int offset)Sets an offset to be added to the position reported toTransitionHandler.voidsetXmlnsPolicy(XmlViolationPolicy xmlnsPolicy)Sets the xmlnsPolicy.protected voidsilentCarriageReturn()protected voidsilentLineFeed()voidstart()protected voidstartErrorReporting()protected java.lang.StringstrBufToString()The smaller buffer as a String.booleantokenizeBuffer(UTF16Buffer buffer)protected inttransition(int from, int to, boolean reconsume, int pos)voidwarn(java.lang.String message)Reports a warning
-
-
-
Field Detail
-
DATA
public static final int DATA
- See Also:
- Constant Field Values
-
RCDATA
public static final int RCDATA
- See Also:
- Constant Field Values
-
SCRIPT_DATA
public static final int SCRIPT_DATA
- See Also:
- Constant Field Values
-
RAWTEXT
public static final int RAWTEXT
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPED
public static final int SCRIPT_DATA_ESCAPED
- See Also:
- Constant Field Values
-
ATTRIBUTE_VALUE_DOUBLE_QUOTED
public static final int ATTRIBUTE_VALUE_DOUBLE_QUOTED
- See Also:
- Constant Field Values
-
ATTRIBUTE_VALUE_SINGLE_QUOTED
public static final int ATTRIBUTE_VALUE_SINGLE_QUOTED
- See Also:
- Constant Field Values
-
ATTRIBUTE_VALUE_UNQUOTED
public static final int ATTRIBUTE_VALUE_UNQUOTED
- See Also:
- Constant Field Values
-
PLAINTEXT
public static final int PLAINTEXT
- See Also:
- Constant Field Values
-
TAG_OPEN
public static final int TAG_OPEN
- See Also:
- Constant Field Values
-
CLOSE_TAG_OPEN
public static final int CLOSE_TAG_OPEN
- See Also:
- Constant Field Values
-
TAG_NAME
public static final int TAG_NAME
- See Also:
- Constant Field Values
-
BEFORE_ATTRIBUTE_NAME
public static final int BEFORE_ATTRIBUTE_NAME
- See Also:
- Constant Field Values
-
ATTRIBUTE_NAME
public static final int ATTRIBUTE_NAME
- See Also:
- Constant Field Values
-
AFTER_ATTRIBUTE_NAME
public static final int AFTER_ATTRIBUTE_NAME
- See Also:
- Constant Field Values
-
BEFORE_ATTRIBUTE_VALUE
public static final int BEFORE_ATTRIBUTE_VALUE
- See Also:
- Constant Field Values
-
AFTER_ATTRIBUTE_VALUE_QUOTED
public static final int AFTER_ATTRIBUTE_VALUE_QUOTED
- See Also:
- Constant Field Values
-
BOGUS_COMMENT
public static final int BOGUS_COMMENT
- See Also:
- Constant Field Values
-
MARKUP_DECLARATION_OPEN
public static final int MARKUP_DECLARATION_OPEN
- See Also:
- Constant Field Values
-
DOCTYPE
public static final int DOCTYPE
- See Also:
- Constant Field Values
-
BEFORE_DOCTYPE_NAME
public static final int BEFORE_DOCTYPE_NAME
- See Also:
- Constant Field Values
-
DOCTYPE_NAME
public static final int DOCTYPE_NAME
- See Also:
- Constant Field Values
-
AFTER_DOCTYPE_NAME
public static final int AFTER_DOCTYPE_NAME
- See Also:
- Constant Field Values
-
BEFORE_DOCTYPE_PUBLIC_IDENTIFIER
public static final int BEFORE_DOCTYPE_PUBLIC_IDENTIFIER
- See Also:
- Constant Field Values
-
DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED
public static final int DOCTYPE_PUBLIC_IDENTIFIER_DOUBLE_QUOTED
- See Also:
- Constant Field Values
-
DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED
public static final int DOCTYPE_PUBLIC_IDENTIFIER_SINGLE_QUOTED
- See Also:
- Constant Field Values
-
AFTER_DOCTYPE_PUBLIC_IDENTIFIER
public static final int AFTER_DOCTYPE_PUBLIC_IDENTIFIER
- See Also:
- Constant Field Values
-
BEFORE_DOCTYPE_SYSTEM_IDENTIFIER
public static final int BEFORE_DOCTYPE_SYSTEM_IDENTIFIER
- See Also:
- Constant Field Values
-
DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED
public static final int DOCTYPE_SYSTEM_IDENTIFIER_DOUBLE_QUOTED
- See Also:
- Constant Field Values
-
DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED
public static final int DOCTYPE_SYSTEM_IDENTIFIER_SINGLE_QUOTED
- See Also:
- Constant Field Values
-
AFTER_DOCTYPE_SYSTEM_IDENTIFIER
public static final int AFTER_DOCTYPE_SYSTEM_IDENTIFIER
- See Also:
- Constant Field Values
-
BOGUS_DOCTYPE
public static final int BOGUS_DOCTYPE
- See Also:
- Constant Field Values
-
COMMENT_START
public static final int COMMENT_START
- See Also:
- Constant Field Values
-
COMMENT_START_DASH
public static final int COMMENT_START_DASH
- See Also:
- Constant Field Values
-
COMMENT
public static final int COMMENT
- See Also:
- Constant Field Values
-
COMMENT_END_DASH
public static final int COMMENT_END_DASH
- See Also:
- Constant Field Values
-
COMMENT_END
public static final int COMMENT_END
- See Also:
- Constant Field Values
-
COMMENT_END_BANG
public static final int COMMENT_END_BANG
- See Also:
- Constant Field Values
-
NON_DATA_END_TAG_NAME
public static final int NON_DATA_END_TAG_NAME
- See Also:
- Constant Field Values
-
MARKUP_DECLARATION_HYPHEN
public static final int MARKUP_DECLARATION_HYPHEN
- See Also:
- Constant Field Values
-
MARKUP_DECLARATION_OCTYPE
public static final int MARKUP_DECLARATION_OCTYPE
- See Also:
- Constant Field Values
-
DOCTYPE_UBLIC
public static final int DOCTYPE_UBLIC
- See Also:
- Constant Field Values
-
DOCTYPE_YSTEM
public static final int DOCTYPE_YSTEM
- See Also:
- Constant Field Values
-
AFTER_DOCTYPE_PUBLIC_KEYWORD
public static final int AFTER_DOCTYPE_PUBLIC_KEYWORD
- See Also:
- Constant Field Values
-
BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS
public static final int BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS
- See Also:
- Constant Field Values
-
AFTER_DOCTYPE_SYSTEM_KEYWORD
public static final int AFTER_DOCTYPE_SYSTEM_KEYWORD
- See Also:
- Constant Field Values
-
CONSUME_CHARACTER_REFERENCE
public static final int CONSUME_CHARACTER_REFERENCE
- See Also:
- Constant Field Values
-
CONSUME_NCR
public static final int CONSUME_NCR
- See Also:
- Constant Field Values
-
CHARACTER_REFERENCE_TAIL
public static final int CHARACTER_REFERENCE_TAIL
- See Also:
- Constant Field Values
-
HEX_NCR_LOOP
public static final int HEX_NCR_LOOP
- See Also:
- Constant Field Values
-
DECIMAL_NRC_LOOP
public static final int DECIMAL_NRC_LOOP
- See Also:
- Constant Field Values
-
HANDLE_NCR_VALUE
public static final int HANDLE_NCR_VALUE
- See Also:
- Constant Field Values
-
HANDLE_NCR_VALUE_RECONSUME
public static final int HANDLE_NCR_VALUE_RECONSUME
- See Also:
- Constant Field Values
-
CHARACTER_REFERENCE_HILO_LOOKUP
public static final int CHARACTER_REFERENCE_HILO_LOOKUP
- See Also:
- Constant Field Values
-
SELF_CLOSING_START_TAG
public static final int SELF_CLOSING_START_TAG
- See Also:
- Constant Field Values
-
CDATA_START
public static final int CDATA_START
- See Also:
- Constant Field Values
-
CDATA_SECTION
public static final int CDATA_SECTION
- See Also:
- Constant Field Values
-
CDATA_RSQB
public static final int CDATA_RSQB
- See Also:
- Constant Field Values
-
CDATA_RSQB_RSQB
public static final int CDATA_RSQB_RSQB
- See Also:
- Constant Field Values
-
SCRIPT_DATA_LESS_THAN_SIGN
public static final int SCRIPT_DATA_LESS_THAN_SIGN
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPE_START
public static final int SCRIPT_DATA_ESCAPE_START
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPE_START_DASH
public static final int SCRIPT_DATA_ESCAPE_START_DASH
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPED_DASH
public static final int SCRIPT_DATA_ESCAPED_DASH
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPED_DASH_DASH
public static final int SCRIPT_DATA_ESCAPED_DASH_DASH
- See Also:
- Constant Field Values
-
BOGUS_COMMENT_HYPHEN
public static final int BOGUS_COMMENT_HYPHEN
- See Also:
- Constant Field Values
-
RAWTEXT_RCDATA_LESS_THAN_SIGN
public static final int RAWTEXT_RCDATA_LESS_THAN_SIGN
- See Also:
- Constant Field Values
-
SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN
public static final int SCRIPT_DATA_ESCAPED_LESS_THAN_SIGN
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPE_START
public static final int SCRIPT_DATA_DOUBLE_ESCAPE_START
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPED
public static final int SCRIPT_DATA_DOUBLE_ESCAPED
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN
public static final int SCRIPT_DATA_DOUBLE_ESCAPED_LESS_THAN_SIGN
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPED_DASH
public static final int SCRIPT_DATA_DOUBLE_ESCAPED_DASH
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH
public static final int SCRIPT_DATA_DOUBLE_ESCAPED_DASH_DASH
- See Also:
- Constant Field Values
-
SCRIPT_DATA_DOUBLE_ESCAPE_END
public static final int SCRIPT_DATA_DOUBLE_ESCAPE_END
- See Also:
- Constant Field Values
-
tokenHandler
protected final TokenHandler tokenHandler
The token handler.
-
encodingDeclarationHandler
protected EncodingDeclarationHandler encodingDeclarationHandler
-
errorHandler
protected org.xml.sax.ErrorHandler errorHandler
The error handler.
-
lastCR
protected boolean lastCR
Whether the previous char read was CR.
-
stateSave
protected int stateSave
-
index
protected int index
-
value
protected int value
-
cstart
protected int cstart
-
endTagExpectation
protected ElementName endTagExpectation
The element whose end tag closes the current CDATA or RCDATA element.
-
endTag
protected boolean endTag
true if tokenizing an end tag
-
attributeName
protected AttributeName attributeName
The current attribute name.
-
html4
protected boolean html4
true when HTML4-specific additional errors are requested.
-
confident
protected boolean confident
-
currentBufferGlobalOffset
protected int currentBufferGlobalOffset
-
ampersandLocation
protected LocatorImpl ampersandLocation
-
-
Constructor Detail
-
Tokenizer
public Tokenizer(TokenHandler tokenHandler, boolean newAttributesEachTime)
-
Tokenizer
public Tokenizer(TokenHandler tokenHandler)
The constructor.
- Parameters:
tokenHandler - the handler for receiving tokens
-
-
Method Detail
-
setInterner
public void setInterner(Interner interner)
-
initLocation
public void initLocation(java.lang.String newPublicId, java.lang.String newSystemId)
-
isMappingLangToXmlLang
public boolean isMappingLangToXmlLang()
Returns the mappingLangToXmlLang.- Returns:
- the mappingLangToXmlLang
-
setMappingLangToXmlLang
public void setMappingLangToXmlLang(boolean mappingLangToXmlLang)
Sets the mappingLangToXmlLang.- Parameters:
mappingLangToXmlLang- the mappingLangToXmlLang to set
-
setErrorHandler
public void setErrorHandler(org.xml.sax.ErrorHandler eh)
Sets the error handler.- See Also:
XMLReader.setErrorHandler(org.xml.sax.ErrorHandler)
-
getErrorHandler
public org.xml.sax.ErrorHandler getErrorHandler()
-
setCommentPolicy
public void setCommentPolicy(XmlViolationPolicy commentPolicy)
Sets the commentPolicy.- Parameters:
commentPolicy- the commentPolicy to set
-
setContentNonXmlCharPolicy
public void setContentNonXmlCharPolicy(XmlViolationPolicy contentNonXmlCharPolicy)
Sets the contentNonXmlCharPolicy.- Parameters:
contentNonXmlCharPolicy- the contentNonXmlCharPolicy to set
-
setContentSpacePolicy
public void setContentSpacePolicy(XmlViolationPolicy contentSpacePolicy)
Sets the contentSpacePolicy.- Parameters:
contentSpacePolicy- the contentSpacePolicy to set
-
setXmlnsPolicy
public void setXmlnsPolicy(XmlViolationPolicy xmlnsPolicy)
Sets the xmlnsPolicy.- Parameters:
xmlnsPolicy- the xmlnsPolicy to set
-
setNamePolicy
public void setNamePolicy(XmlViolationPolicy namePolicy)
-
setHtml4ModeCompatibleWithXhtml1Schemata
public void setHtml4ModeCompatibleWithXhtml1Schemata(boolean html4ModeCompatibleWithXhtml1Schemata)
Sets the html4ModeCompatibleWithXhtml1Schemata.- Parameters:
html4ModeCompatibleWithXhtml1Schemata- the html4ModeCompatibleWithXhtml1Schemata to set
-
setStateAndEndTagExpectation
public void setStateAndEndTagExpectation(int specialTokenizerState, java.lang.String endTagExpectation)
Sets the tokenizer state and the associated element name. This should only ever be used to put the tokenizer into one of the states that have a special end tag expectation.
- Parameters:
specialTokenizerState - the tokenizer state to set
endTagExpectation - the expected end tag for transitioning back to normal
-
setStateAndEndTagExpectation
public void setStateAndEndTagExpectation(int specialTokenizerState, ElementName endTagExpectation)
Sets the tokenizer state and the associated element name. This should only ever be used to put the tokenizer into one of the states that have a special end tag expectation.
- Parameters:
specialTokenizerState - the tokenizer state to set
endTagExpectation - the expected end tag for transitioning back to normal
-
setLineNumber
public void setLineNumber(int line)
For C++ use only.
-
getLineNumber
public int getLineNumber()
- Specified by:
getLineNumber in interface org.xml.sax.Locator
- See Also:
Locator.getLineNumber()
-
getColumnNumber
public int getColumnNumber()
- Specified by:
getColumnNumber in interface org.xml.sax.Locator
- See Also:
Locator.getColumnNumber()
-
getPublicId
public java.lang.String getPublicId()
- Specified by:
getPublicId in interface org.xml.sax.Locator
- See Also:
Locator.getPublicId()
-
getSystemId
public java.lang.String getSystemId()
- Specified by:
getSystemId in interface org.xml.sax.Locator
- See Also:
Locator.getSystemId()
-
notifyAboutMetaBoundary
public void notifyAboutMetaBoundary()
-
strBufToString
protected java.lang.String strBufToString()
The smaller buffer as a String. Currently only used for error reporting. C++ memory note: The return value must be released.
- Returns:
- the smaller buffer as a string
-
flushChars
protected void flushChars(char[] buf, int pos) throws org.xml.sax.SAXException
Flushes coalesced character tokens.
- Parameters:
buf - TODO
pos - TODO
- Throws:
org.xml.sax.SAXException
-
fatal
public void fatal(java.lang.String message) throws org.xml.sax.SAXException
Reports a condition that would make the infoset incompatible with XML 1.0 as fatal.
- Parameters:
message - the message
- Throws:
org.xml.sax.SAXException
org.xml.sax.SAXParseException
-
err
public void err(java.lang.String message) throws org.xml.sax.SAXException
Reports a Parse Error.
- Parameters:
message - the message
- Throws:
org.xml.sax.SAXException
-
errTreeBuilder
public void errTreeBuilder(java.lang.String message) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
warn
public void warn(java.lang.String message) throws org.xml.sax.SAXException
Reports a warning.
- Parameters:
message - the message
- Throws:
org.xml.sax.SAXException
-
startErrorReporting
protected void startErrorReporting() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
start
public void start() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
tokenizeBuffer
public boolean tokenizeBuffer(UTF16Buffer buffer) throws org.xml.sax.SAXException
- Throws:
org.xml.sax.SAXException
-
transition
protected int transition(int from, int to, boolean reconsume, int pos) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
silentCarriageReturn
protected void silentCarriageReturn()
-
silentLineFeed
protected void silentLineFeed()
-
eof
public void eof() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
checkChar
protected char checkChar(char[] buf, int pos) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
isAlreadyComplainedAboutNonAscii
public boolean isAlreadyComplainedAboutNonAscii()
Returns the alreadyComplainedAboutNonAscii.- Returns:
- the alreadyComplainedAboutNonAscii
-
internalEncodingDeclaration
public boolean internalEncodingDeclaration(java.lang.String internalCharset) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
end
public void end() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
requestSuspension
public void requestSuspension()
-
becomeConfident
public void becomeConfident()
-
isNextCharOnNewLine
public boolean isNextCharOnNewLine()
Returns the nextCharOnNewLine.- Returns:
- the nextCharOnNewLine
-
isPrevCR
public boolean isPrevCR()
-
getLine
public int getLine()
Returns the line.- Returns:
- the line
-
getCol
public int getCol()
Returns the col.- Returns:
- the col
-
isInDataState
public boolean isInDataState()
-
resetToDataState
public void resetToDataState()
-
loadState
public void loadState(Tokenizer other) throws org.xml.sax.SAXException
- Throws:
org.xml.sax.SAXException
-
initializeWithoutStarting
public void initializeWithoutStarting() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errGarbageAfterLtSlash
protected void errGarbageAfterLtSlash() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errLtSlashGt
protected void errLtSlashGt() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errWarnLtSlashInRcdata
protected void errWarnLtSlashInRcdata() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errHtml4LtSlashInRcdata
protected void errHtml4LtSlashInRcdata(char folded) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errCharRefLacksSemicolon
protected void errCharRefLacksSemicolon() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoDigitsInNCR
protected void errNoDigitsInNCR() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errGtInSystemId
protected void errGtInSystemId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errGtInPublicId
protected void errGtInPublicId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNamelessDoctype
protected void errNamelessDoctype() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errConsecutiveHyphens
protected void errConsecutiveHyphens() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errPrematureEndOfComment
protected void errPrematureEndOfComment() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errBogusComment
protected void errBogusComment() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errUnquotedAttributeValOrNull
protected void errUnquotedAttributeValOrNull(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errSlashNotFollowedByGt
protected void errSlashNotFollowedByGt() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errHtml4XmlVoidSyntax
protected void errHtml4XmlVoidSyntax() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoSpaceBetweenAttributes
protected void errNoSpaceBetweenAttributes() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errHtml4NonNameInUnquotedAttribute
protected void errHtml4NonNameInUnquotedAttribute(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errLtOrEqualsOrGraveInUnquotedAttributeOrNull
protected void errLtOrEqualsOrGraveInUnquotedAttributeOrNull(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errAttributeValueMissing
protected void errAttributeValueMissing() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errBadCharBeforeAttributeNameOrNull
protected void errBadCharBeforeAttributeNameOrNull(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEqualsSignBeforeAttributeName
protected void errEqualsSignBeforeAttributeName() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errBadCharAfterLt
protected void errBadCharAfterLt(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errLtGt
protected void errLtGt() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errProcessingInstruction
protected void errProcessingInstruction() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errUnescapedAmpersandInterpretedAsCharacterReference
protected void errUnescapedAmpersandInterpretedAsCharacterReference() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNotSemicolonTerminated
protected void errNotSemicolonTerminated() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoNamedCharacterMatch
protected void errNoNamedCharacterMatch() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errQuoteBeforeAttributeName
protected void errQuoteBeforeAttributeName(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errQuoteOrLtInAttributeNameOrNull
protected void errQuoteOrLtInAttributeNameOrNull(char c) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errExpectedPublicId
protected void errExpectedPublicId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errBogusDoctype
protected void errBogusDoctype() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
maybeWarnPrivateUseAstral
protected void maybeWarnPrivateUseAstral() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
maybeWarnPrivateUse
protected void maybeWarnPrivateUse(char ch) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
maybeErrAttributesOnEndTag
protected void maybeErrAttributesOnEndTag(HtmlAttributes attrs) throws org.xml.sax.SAXException
- Throws:
org.xml.sax.SAXException
-
maybeErrSlashInEndTag
protected void maybeErrSlashInEndTag(boolean selfClosing) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrNonCharacter
protected char errNcrNonCharacter(char ch) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errAstralNonCharacter
protected void errAstralNonCharacter(int ch) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrSurrogate
protected void errNcrSurrogate() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrControlChar
protected char errNcrControlChar(char ch) throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrCr
protected void errNcrCr() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrInC1Range
protected void errNcrInC1Range() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInPublicId
protected void errEofInPublicId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInComment
protected void errEofInComment() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInDoctype
protected void errEofInDoctype() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInAttributeValue
protected void errEofInAttributeValue() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInAttributeName
protected void errEofInAttributeName() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofWithoutGt
protected void errEofWithoutGt() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInTagName
protected void errEofInTagName() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInEndTag
protected void errEofInEndTag() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofAfterLt
protected void errEofAfterLt() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrOutOfRange
protected void errNcrOutOfRange() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrUnassigned
protected void errNcrUnassigned() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errDuplicateAttribute
protected void errDuplicateAttribute() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errEofInSystemId
protected void errEofInSystemId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errExpectedSystemId
protected void errExpectedSystemId() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errMissingSpaceBeforeDoctypeName
protected void errMissingSpaceBeforeDoctypeName() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errHyphenHyphenBang
protected void errHyphenHyphenBang() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrControlChar
protected void errNcrControlChar() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNcrZero
protected void errNcrZero() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoSpaceBetweenDoctypeSystemKeywordAndQuote
protected void errNoSpaceBetweenDoctypeSystemKeywordAndQuote() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoSpaceBetweenPublicAndSystemIds
protected void errNoSpaceBetweenPublicAndSystemIds() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
errNoSpaceBetweenDoctypePublicKeywordAndQuote
protected void errNoSpaceBetweenDoctypePublicKeywordAndQuote() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
noteAttributeWithoutValue
protected void noteAttributeWithoutValue() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
noteUnquotedAttributeValue
protected void noteUnquotedAttributeValue() throws org.xml.sax.SAXException- Throws:
org.xml.sax.SAXException
-
setEncodingDeclarationHandler
public void setEncodingDeclarationHandler(EncodingDeclarationHandler encodingDeclarationHandler)
Sets the encodingDeclarationHandler.- Parameters:
encodingDeclarationHandler- the encodingDeclarationHandler to set
-
setTransitionBaseOffset
public void setTransitionBaseOffset(int offset)
Sets an offset to be added to the position reported to TransitionHandler.
- Parameters:
offset - the offset
-
-