final class Tokeniser
extends java.lang.Object
Modifier and Type | Field and Description |
---|---|
(package private) Token.Character |
charPending |
private java.lang.StringBuilder |
charsBuilder |
private java.lang.String |
charsString |
private int[] |
codepointHolder |
(package private) Token.Comment |
commentPending |
(package private) java.lang.StringBuilder |
dataBuffer |
(package private) Token.Doctype |
doctypePending |
private Token |
emitPending |
(package private) Token.EndTag |
endPending |
private ParseErrorList |
errors |
private boolean |
isEmitPending |
private java.lang.String |
lastStartTag |
private int[] |
multipointHolder |
private static char[] |
notCharRefCharsSorted |
private CharacterReader |
reader |
(package private) static char |
replacementChar |
(package private) Token.StartTag |
startPending |
private TokeniserState |
state |
(package private) Token.Tag |
tagPending |
(package private) static int[] |
win1252Extensions |
(package private) static int |
win1252ExtensionsStart |
Constructor and Description |
---|
Tokeniser(CharacterReader reader,
ParseErrorList errors) |
Modifier and Type | Method and Description |
---|---|
(package private) void |
advanceTransition(TokeniserState state) |
(package private) java.lang.String |
appropriateEndTagName() |
private void |
characterReferenceError(java.lang.String message) |
(package private) int[] |
consumeCharacterReference(java.lang.Character additionalAllowedCharacter,
boolean inAttribute) |
(package private) void |
createBogusCommentPending() |
(package private) void |
createCommentPending() |
(package private) void |
createDoctypePending() |
(package private) Token.Tag |
createTagPending(boolean start) |
(package private) void |
createTempBuffer() |
(package private) boolean |
currentNodeInHtmlNS() |
(package private) void |
emit(char c) |
(package private) void |
emit(char[] chars) |
(package private) void |
emit(int[] codepoints) |
(package private) void |
emit(java.lang.String str) |
(package private) void |
emit(Token token) |
(package private) void |
emitCommentPending() |
(package private) void |
emitDoctypePending() |
(package private) void |
emitTagPending() |
(package private) void |
eofError(TokeniserState state) |
(package private) void |
error(java.lang.String errorMsg) |
(package private) void |
error(TokeniserState state) |
(package private) TokeniserState |
getState() |
(package private) boolean |
isAppropriateEndTagToken() |
(package private) Token |
read() |
(package private) void |
transition(TokeniserState state) |
(package private) java.lang.String |
unescapeEntities(boolean inAttribute)
Utility method that consumes the reader and unescapes any entities found within it.
|
static final char replacementChar
private static final char[] notCharRefCharsSorted
static final int win1252ExtensionsStart
static final int[] win1252Extensions
private final CharacterReader reader
private final ParseErrorList errors
private TokeniserState state
private Token emitPending
private boolean isEmitPending
private java.lang.String charsString
private java.lang.StringBuilder charsBuilder
java.lang.StringBuilder dataBuffer
Token.Tag tagPending
Token.StartTag startPending
Token.EndTag endPending
Token.Character charPending
Token.Doctype doctypePending
Token.Comment commentPending
private java.lang.String lastStartTag
private final int[] codepointHolder
private final int[] multipointHolder
Tokeniser(CharacterReader reader, ParseErrorList errors)
Token read()
void emit(Token token)
void emit(java.lang.String str)
void emit(char[] chars)
void emit(int[] codepoints)
void emit(char c)
TokeniserState getState()
void transition(TokeniserState state)
void advanceTransition(TokeniserState state)
int[] consumeCharacterReference(java.lang.Character additionalAllowedCharacter, boolean inAttribute)
Token.Tag createTagPending(boolean start)
void emitTagPending()
void createCommentPending()
void emitCommentPending()
void createBogusCommentPending()
void createDoctypePending()
void emitDoctypePending()
void createTempBuffer()
boolean isAppropriateEndTagToken()
java.lang.String appropriateEndTagName()
void error(TokeniserState state)
void eofError(TokeniserState state)
private void characterReferenceError(java.lang.String message)
void error(java.lang.String errorMsg)
boolean currentNodeInHtmlNS()
java.lang.String unescapeEntities(boolean inAttribute)
Parameters: inAttribute - whether the text to be unescaped is in an attribute