Package org.jsoup.parser
Class HtmlTreeBuilder
- java.lang.Object
-
- org.jsoup.parser.TreeBuilder
-
- org.jsoup.parser.HtmlTreeBuilder
-
public class HtmlTreeBuilder extends TreeBuilder
HTML Tree Builder; creates a DOM from Tokens.
-
-
Field Summary
Fields Modifier and Type Field Description private boolean
baseUriSetFromDoc
private Element
contextElement
private Token.EndTag
emptyEnd
private java.util.ArrayList<Element>
formattingElements
private FormElement
formElement
private boolean
fosterInserts
private boolean
fragmentParsing
private boolean
framesetOk
private Element
headElement
static int
MaxScopeSearchDepth
private HtmlTreeBuilderState
originalState
private java.util.List<java.lang.String>
pendingTableCharacters
private java.lang.String[]
specificScopeTarget
private HtmlTreeBuilderState
state
(package private) static java.lang.String[]
TagSearchButton
(package private) static java.lang.String[]
TagSearchEndTags
(package private) static java.lang.String[]
TagSearchList
(package private) static java.lang.String[]
TagSearchSelectScope
(package private) static java.lang.String[]
TagSearchSpecial
(package private) static java.lang.String[]
TagSearchTableScope
(package private) static java.lang.String[]
TagsSearchInScope
-
Fields inherited from class org.jsoup.parser.TreeBuilder
baseUri, currentToken, doc, parser, reader, settings, stack, tokeniser
-
-
Constructor Summary
Constructors Constructor Description HtmlTreeBuilder()
-
Method Summary
All Methods Instance Methods Concrete Methods Modifier and Type Method Description (package private) Element
aboveOnStack(Element el)
(package private) void
clearFormattingElementsToLastMarker()
private void
clearStackToContext(java.lang.String... nodeNames)
(package private) void
clearStackToTableBodyContext()
(package private) void
clearStackToTableContext()
(package private) void
clearStackToTableRowContext()
(package private) ParseSettings
defaultSettings()
(package private) void
error(HtmlTreeBuilderState state)
(package private) boolean
framesetOk()
(package private) void
framesetOk(boolean framesetOk)
(package private) void
generateImpliedEndTags()
(package private) void
generateImpliedEndTags(java.lang.String excludeTag)
11.2.5.2 Closing elements that have implied end tags(package private) Element
getActiveFormattingElement(java.lang.String nodeName)
(package private) java.lang.String
getBaseUri()
(package private) Document
getDocument()
(package private) FormElement
getFormElement()
(package private) Element
getFromStack(java.lang.String elName)
(package private) Element
getHeadElement()
(package private) java.util.List<java.lang.String>
getPendingTableCharacters()
(package private) java.util.ArrayList<Element>
getStack()
(package private) boolean
inButtonScope(java.lang.String targetName)
protected void
initialiseParse(java.io.Reader input, java.lang.String baseUri, Parser parser)
(package private) boolean
inListItemScope(java.lang.String targetName)
(package private) boolean
inScope(java.lang.String targetName)
(package private) boolean
inScope(java.lang.String[] targetNames)
(package private) boolean
inScope(java.lang.String targetName, java.lang.String[] extras)
(package private) boolean
inSelectScope(java.lang.String targetName)
(package private) void
insert(Element el)
(package private) void
insert(Token.Character characterToken)
(package private) void
insert(Token.Comment commentToken)
(package private) Element
insert(Token.StartTag startTag)
(package private) Element
insertEmpty(Token.StartTag startTag)
(package private) FormElement
insertForm(Token.StartTag startTag, boolean onStack)
(package private) void
insertInFosterParent(Node in)
(package private) void
insertMarkerToFormattingElements()
private void
insertNode(Node node)
(package private) void
insertOnStackAfter(Element after, Element in)
(package private) Element
insertStartTag(java.lang.String startTagName)
private boolean
inSpecificScope(java.lang.String[] targetNames, java.lang.String[] baseTypes, java.lang.String[] extraTypes)
private boolean
inSpecificScope(java.lang.String targetName, java.lang.String[] baseTypes, java.lang.String[] extraTypes)
(package private) boolean
inTableScope(java.lang.String targetName)
private boolean
isElementInQueue(java.util.ArrayList<Element> queue, Element element)
(package private) boolean
isFosterInserts()
(package private) boolean
isFragmentParsing()
(package private) boolean
isInActiveFormattingElements(Element el)
private boolean
isSameFormattingElement(Element a, Element b)
(package private) boolean
isSpecial(Element el)
(package private) Element
lastFormattingElement()
(package private) void
markInsertionMode()
(package private) void
maybeSetBaseUri(Element base)
(package private) void
newPendingTableCharacters()
(package private) boolean
onStack(Element el)
(package private) HtmlTreeBuilderState
originalState()
(package private) java.util.List<Node>
parseFragment(java.lang.String inputFragment, Element context, java.lang.String baseUri, Parser parser)
(package private) Element
pop()
(package private) void
popStackToBefore(java.lang.String elName)
(package private) void
popStackToClose(java.lang.String elName)
(package private) void
popStackToClose(java.lang.String... elNames)
protected boolean
process(Token token)
(package private) boolean
process(Token token, HtmlTreeBuilderState state)
(package private) void
push(Element element)
(package private) void
pushActiveFormattingElements(Element in)
(package private) void
reconstructFormattingElements()
(package private) void
removeFromActiveFormattingElements(Element el)
(package private) boolean
removeFromStack(Element el)
(package private) Element
removeLastFormattingElement()
(package private) void
replaceActiveFormattingElement(Element out, Element in)
private void
replaceInQueue(java.util.ArrayList<Element> queue, Element out, Element in)
(package private) void
replaceOnStack(Element out, Element in)
(package private) void
resetInsertionMode()
(package private) void
setFormElement(FormElement formElement)
(package private) void
setFosterInserts(boolean fosterInserts)
(package private) void
setHeadElement(Element headElement)
(package private) HtmlTreeBuilderState
state()
java.lang.String
toString()
(package private) void
transition(HtmlTreeBuilderState state)
-
Methods inherited from class org.jsoup.parser.TreeBuilder
currentElement, parse, processEndTag, processStartTag, processStartTag, runParser
-
-
-
-
Field Detail
-
TagsSearchInScope
static final java.lang.String[] TagsSearchInScope
-
TagSearchList
static final java.lang.String[] TagSearchList
-
TagSearchButton
static final java.lang.String[] TagSearchButton
-
TagSearchTableScope
static final java.lang.String[] TagSearchTableScope
-
TagSearchSelectScope
static final java.lang.String[] TagSearchSelectScope
-
TagSearchEndTags
static final java.lang.String[] TagSearchEndTags
-
TagSearchSpecial
static final java.lang.String[] TagSearchSpecial
-
MaxScopeSearchDepth
public static final int MaxScopeSearchDepth
- See Also:
- Constant Field Values
-
state
private HtmlTreeBuilderState state
-
originalState
private HtmlTreeBuilderState originalState
-
baseUriSetFromDoc
private boolean baseUriSetFromDoc
-
headElement
private Element headElement
-
formElement
private FormElement formElement
-
contextElement
private Element contextElement
-
formattingElements
private java.util.ArrayList<Element> formattingElements
-
pendingTableCharacters
private java.util.List<java.lang.String> pendingTableCharacters
-
emptyEnd
private Token.EndTag emptyEnd
-
framesetOk
private boolean framesetOk
-
fosterInserts
private boolean fosterInserts
-
fragmentParsing
private boolean fragmentParsing
-
specificScopeTarget
private java.lang.String[] specificScopeTarget
-
-
Method Detail
-
defaultSettings
ParseSettings defaultSettings()
- Specified by:
defaultSettings
in classTreeBuilder
-
initialiseParse
protected void initialiseParse(java.io.Reader input, java.lang.String baseUri, Parser parser)
- Overrides:
initialiseParse
in classTreeBuilder
-
parseFragment
java.util.List<Node> parseFragment(java.lang.String inputFragment, Element context, java.lang.String baseUri, Parser parser)
- Specified by:
parseFragment
in classTreeBuilder
-
process
protected boolean process(Token token)
- Specified by:
process
in classTreeBuilder
-
process
boolean process(Token token, HtmlTreeBuilderState state)
-
transition
void transition(HtmlTreeBuilderState state)
-
state
HtmlTreeBuilderState state()
-
markInsertionMode
void markInsertionMode()
-
originalState
HtmlTreeBuilderState originalState()
-
framesetOk
void framesetOk(boolean framesetOk)
-
framesetOk
boolean framesetOk()
-
getDocument
Document getDocument()
-
getBaseUri
java.lang.String getBaseUri()
-
maybeSetBaseUri
void maybeSetBaseUri(Element base)
-
isFragmentParsing
boolean isFragmentParsing()
-
error
void error(HtmlTreeBuilderState state)
-
insert
Element insert(Token.StartTag startTag)
-
insertStartTag
Element insertStartTag(java.lang.String startTagName)
-
insert
void insert(Element el)
-
insertEmpty
Element insertEmpty(Token.StartTag startTag)
-
insertForm
FormElement insertForm(Token.StartTag startTag, boolean onStack)
-
insert
void insert(Token.Comment commentToken)
-
insert
void insert(Token.Character characterToken)
-
insertNode
private void insertNode(Node node)
-
pop
Element pop()
-
push
void push(Element element)
-
getStack
java.util.ArrayList<Element> getStack()
-
onStack
boolean onStack(Element el)
-
isElementInQueue
private boolean isElementInQueue(java.util.ArrayList<Element> queue, Element element)
-
getFromStack
Element getFromStack(java.lang.String elName)
-
removeFromStack
boolean removeFromStack(Element el)
-
popStackToClose
void popStackToClose(java.lang.String elName)
-
popStackToClose
void popStackToClose(java.lang.String... elNames)
-
popStackToBefore
void popStackToBefore(java.lang.String elName)
-
clearStackToTableContext
void clearStackToTableContext()
-
clearStackToTableBodyContext
void clearStackToTableBodyContext()
-
clearStackToTableRowContext
void clearStackToTableRowContext()
-
clearStackToContext
private void clearStackToContext(java.lang.String... nodeNames)
-
replaceInQueue
private void replaceInQueue(java.util.ArrayList<Element> queue, Element out, Element in)
-
resetInsertionMode
void resetInsertionMode()
-
inSpecificScope
private boolean inSpecificScope(java.lang.String targetName, java.lang.String[] baseTypes, java.lang.String[] extraTypes)
-
inSpecificScope
private boolean inSpecificScope(java.lang.String[] targetNames, java.lang.String[] baseTypes, java.lang.String[] extraTypes)
-
inScope
boolean inScope(java.lang.String[] targetNames)
-
inScope
boolean inScope(java.lang.String targetName)
-
inScope
boolean inScope(java.lang.String targetName, java.lang.String[] extras)
-
inListItemScope
boolean inListItemScope(java.lang.String targetName)
-
inButtonScope
boolean inButtonScope(java.lang.String targetName)
-
inTableScope
boolean inTableScope(java.lang.String targetName)
-
inSelectScope
boolean inSelectScope(java.lang.String targetName)
-
setHeadElement
void setHeadElement(Element headElement)
-
getHeadElement
Element getHeadElement()
-
isFosterInserts
boolean isFosterInserts()
-
setFosterInserts
void setFosterInserts(boolean fosterInserts)
-
getFormElement
FormElement getFormElement()
-
setFormElement
void setFormElement(FormElement formElement)
-
newPendingTableCharacters
void newPendingTableCharacters()
-
getPendingTableCharacters
java.util.List<java.lang.String> getPendingTableCharacters()
-
generateImpliedEndTags
void generateImpliedEndTags(java.lang.String excludeTag)
11.2.5.2 Closing elements that have implied end tags When the steps below require the UA to generate implied end tags, then, while the current node is a dd element, a dt element, an li element, an option element, an optgroup element, a p element, an rp element, or an rt element, the UA must pop the current node off the stack of open elements.- Parameters:
excludeTag
- If a step requires the UA to generate implied end tags but lists an element to exclude from the process, then the UA must perform the above steps as if that element was not in the above list.
-
generateImpliedEndTags
void generateImpliedEndTags()
-
isSpecial
boolean isSpecial(Element el)
-
lastFormattingElement
Element lastFormattingElement()
-
removeLastFormattingElement
Element removeLastFormattingElement()
-
pushActiveFormattingElements
void pushActiveFormattingElements(Element in)
-
reconstructFormattingElements
void reconstructFormattingElements()
-
clearFormattingElementsToLastMarker
void clearFormattingElementsToLastMarker()
-
removeFromActiveFormattingElements
void removeFromActiveFormattingElements(Element el)
-
isInActiveFormattingElements
boolean isInActiveFormattingElements(Element el)
-
getActiveFormattingElement
Element getActiveFormattingElement(java.lang.String nodeName)
-
insertMarkerToFormattingElements
void insertMarkerToFormattingElements()
-
insertInFosterParent
void insertInFosterParent(Node in)
-
toString
public java.lang.String toString()
- Overrides:
toString
in classjava.lang.Object
-
-