public class XMLEncodingDetector extends XMLParseState implements EncodingDetector
Modifier and Type | Field and Description |
---|---|
protected java.lang.String |
encoding |
accumBuffer, ampBuffer, bTagDepth, currentAttrList, currentAttrName, currentAttrNameBuffer, currentState, currentTagName, currentTagNameBuffer, currentValueBuffer, inAmpersand, mapLookup, TAGPARSESTATE_IN_ATTR_LOOKING_FOR_VALUE, TAGPARSESTATE_IN_ATTR_NAME, TAGPARSESTATE_IN_ATTR_VALUE, TAGPARSESTATE_IN_BANG_TOKEN, TAGPARSESTATE_IN_BRACKET_TOKEN, TAGPARSESTATE_IN_CDATA_BODY, TAGPARSESTATE_IN_COMMENT, TAGPARSESTATE_IN_DOUBLE_QUOTES_ATTR_VALUE, TAGPARSESTATE_IN_END_TAG_NAME, TAGPARSESTATE_IN_QTAG_ATTR_LOOKING_FOR_VALUE, TAGPARSESTATE_IN_QTAG_ATTR_NAME, TAGPARSESTATE_IN_QTAG_ATTR_VALUE, TAGPARSESTATE_IN_QTAG_DOUBLE_QUOTES_ATTR_VALUE, TAGPARSESTATE_IN_QTAG_NAME, TAGPARSESTATE_IN_QTAG_SAW_QUESTION, TAGPARSESTATE_IN_QTAG_SINGLE_QUOTES_ATTR_VALUE, TAGPARSESTATE_IN_QTAG_UNQUOTED_ATTR_VALUE, TAGPARSESTATE_IN_SINGLE_QUOTES_ATTR_VALUE, TAGPARSESTATE_IN_TAG_NAME, TAGPARSESTATE_IN_TAG_SAW_SLASH, TAGPARSESTATE_IN_UNQUOTED_ATTR_VALUE, TAGPARSESTATE_IN_UNQUOTED_ATTR_VALUE_SAW_SLASH, TAGPARSESTATE_NEED_FINAL_BRACKET, TAGPARSESTATE_NORMAL, TAGPARSESTATE_SAWCOMMENTDASH, TAGPARSESTATE_SAWDASH, TAGPARSESTATE_SAWEXCLAMATION, TAGPARSESTATE_SAWLEFTANGLE, TAGPARSESTATE_SAWRIGHTBRACKET, TAGPARSESTATE_SAWSECONDCOMMENTDASH, TAGPARSESTATE_SAWSECONDRIGHTBRACKET
charBuffer
Constructor and Description |
---|
XMLEncodingDetector()
Constructor.
|
Modifier and Type | Method and Description |
---|---|
java.lang.String |
getEncoding()
Retrieve final encoding determination.
|
protected boolean |
noteBTag(java.lang.String tagName)
This method is called for every <! <token> ... > construct, or 'btag'.
|
protected boolean |
noteBTagToken(java.lang.String token)
This method gets called for every token inside a btag.
|
protected boolean |
noteEndBTag()
This method is called for the end of every btag, or any time
there's a naked '>' in the document.
|
protected boolean |
noteEndEscaped()
Called for the end of every cdata-like tag.
|
protected boolean |
noteEndTag(java.lang.String tagName)
This method gets called for every end tag.
|
protected boolean |
noteEscaped(java.lang.String token)
Called for the start of every cdata-like tag, e.g. <![ <token> [ ... ]]>.
|
protected boolean |
noteEscapedCharacter(char thisChar)
This method gets called for every character that is found within an
escape block, e.g. CDATA.
|
protected boolean |
noteNormalCharacter(char thisChar)
This method gets called for every character that is not part of a tag etc.
|
protected boolean |
noteQTag(java.lang.String tagName,
java.util.Map<java.lang.String,java.lang.String> attributes)
Map version of noteQTag method.
|
protected boolean |
noteTag(java.lang.String tagName,
java.util.Map<java.lang.String,java.lang.String> attributes)
Map version of the noteTag method.
|
void |
setEncoding(java.lang.String encoding)
Set initial encoding.
|
noteQTag, noteTag
acceptNewTag, attributeDecode, dealWithCharacter, dumpValues, isPunctuation, isWhitespace, mapChunk, newBuffer, outputAmpBuffer
dealWithCharacters, dealWithRemainder
finishUp
public void setEncoding(java.lang.String encoding)
setEncoding
in interface EncodingDetector
public java.lang.String getEncoding()
getEncoding
in interface EncodingDetector
protected boolean noteTag(java.lang.String tagName, java.util.Map<java.lang.String,java.lang.String> attributes) throws ManifoldCFException
noteTag
in class XMLParseState
ManifoldCFException
protected boolean noteEndTag(java.lang.String tagName) throws ManifoldCFException
noteEndTag
in class TagParseState
ManifoldCFException
protected boolean noteQTag(java.lang.String tagName, java.util.Map<java.lang.String,java.lang.String> attributes) throws ManifoldCFException
noteQTag
in class XMLParseState
ManifoldCFException
protected boolean noteBTag(java.lang.String tagName) throws ManifoldCFException
noteBTag
in class TagParseState
ManifoldCFException
protected boolean noteEndBTag() throws ManifoldCFException
noteEndBTag
in class TagParseState
ManifoldCFException
protected boolean noteEscaped(java.lang.String token) throws ManifoldCFException
noteEscaped
in class TagParseState
token - may be empty!
ManifoldCFException
protected boolean noteEndEscaped() throws ManifoldCFException
noteEndEscaped
in class TagParseState
ManifoldCFException
protected boolean noteBTagToken(java.lang.String token) throws ManifoldCFException
noteBTagToken
in class TagParseState
ManifoldCFException
protected boolean noteNormalCharacter(char thisChar) throws ManifoldCFException
noteNormalCharacter
in class TagParseState
ManifoldCFException
protected boolean noteEscapedCharacter(char thisChar) throws ManifoldCFException
noteEscapedCharacter
in class TagParseState
ManifoldCFException