Orbits
1
|
Public Member Functions | |
def | __init__ |
def | reset |
def | isHTMLIntegrationPoint |
def | isMathMLTextIntegrationPoint |
def | mainLoop |
def | normalizedTokens |
def | parse |
def | parseFragment |
def | parseError |
def | normalizeToken |
def | adjustMathMLAttributes |
def | adjustSVGAttributes |
def | adjustForeignAttributes |
def | reparseTokenNormal |
def | resetInsertionMode |
def | parseRCDataRawtext |
Public Attributes | |
strict | |
tree | |
tokenizer_class | |
errors | |
phases | |
innerHTMLMode | |
container | |
tokenizer | |
firstStartTag | |
log | |
compatMode | |
innerHTML | |
phase | |
lastPhase | |
beforeRCDataPhase | |
framesetOK | |
originalPhase | |
Private Member Functions | |
def | _parse |
HTML parser. Generates a tree structure from a stream of (possibly malformed) HTML.
def pip._vendor.html5lib.html5parser.HTMLParser.__init__ | ( | self, | |
tree = None , |
|||
tokenizer = tokenizer.HTMLTokenizer , |
|||
strict = False , |
|||
namespaceHTMLElements = True , |
|||
debug = False |
|||
) |
strict - raise an exception when a parse error is encountered.
tree - a treebuilder class controlling the type of tree that will be returned. Built-in treebuilders can be accessed through html5lib.treebuilders.getTreeBuilder(treeType).
tokenizer - a class that provides a stream of tokens to the treebuilder. This may be replaced by, e.g., a sanitizer which converts some tags to text.
|
private |
def pip._vendor.html5lib.html5parser.HTMLParser.adjustForeignAttributes | ( | self, | |
token | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.adjustMathMLAttributes | ( | self, | |
token | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.adjustSVGAttributes | ( | self, | |
token | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.isHTMLIntegrationPoint | ( | self, | |
element | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.isMathMLTextIntegrationPoint | ( | self, | |
element | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.mainLoop | ( | self | ) |
def pip._vendor.html5lib.html5parser.HTMLParser.normalizedTokens | ( | self | ) |
def pip._vendor.html5lib.html5parser.HTMLParser.normalizeToken | ( | self, | |
token | |||
) |
HTML5-specific normalizations to the token stream.
def pip._vendor.html5lib.html5parser.HTMLParser.parse | ( | self, | |
stream, | |||
encoding = None , |
|||
parseMeta = True , |
|||
useChardet = True |
|||
) |
Parse an HTML document into a well-formed tree.
stream - a file-like object or string containing the HTML to be parsed.
The optional encoding parameter must be a string that indicates the encoding. If specified, that encoding will be used, regardless of any BOM or later declaration (such as in a meta element).
def pip._vendor.html5lib.html5parser.HTMLParser.parseError | ( | self, | |
errorcode = "XXX-undefined-error" , |
|||
datavars = {} |
|||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.parseFragment | ( | self, | |
stream, | |||
container = "div" , |
|||
encoding = None , |
|||
parseMeta = False , |
|||
useChardet = True |
|||
) |
Parse an HTML fragment into a well-formed tree fragment.
container - name of the element whose innerHTML property we are setting; if set to None, defaults to 'div'.
stream - a file-like object or string containing the HTML to be parsed.
The optional encoding parameter must be a string that indicates the encoding. If specified, that encoding will be used, regardless of any BOM or later declaration (such as in a meta element).
def pip._vendor.html5lib.html5parser.HTMLParser.parseRCDataRawtext | ( | self, | |
token, | |||
contentType | |||
) |
Generic RCDATA/RAWTEXT parsing algorithm.
contentType - RCDATA or RAWTEXT.
def pip._vendor.html5lib.html5parser.HTMLParser.reparseTokenNormal | ( | self, | |
token | |||
) |
def pip._vendor.html5lib.html5parser.HTMLParser.reset | ( | self | ) |
def pip._vendor.html5lib.html5parser.HTMLParser.resetInsertionMode | ( | self | ) |
pip._vendor.html5lib.html5parser.HTMLParser.beforeRCDataPhase |
pip._vendor.html5lib.html5parser.HTMLParser.compatMode |
pip._vendor.html5lib.html5parser.HTMLParser.container |
pip._vendor.html5lib.html5parser.HTMLParser.errors |
pip._vendor.html5lib.html5parser.HTMLParser.firstStartTag |
pip._vendor.html5lib.html5parser.HTMLParser.framesetOK |
pip._vendor.html5lib.html5parser.HTMLParser.innerHTML |
pip._vendor.html5lib.html5parser.HTMLParser.innerHTMLMode |
pip._vendor.html5lib.html5parser.HTMLParser.lastPhase |
pip._vendor.html5lib.html5parser.HTMLParser.log |
pip._vendor.html5lib.html5parser.HTMLParser.originalPhase |
pip._vendor.html5lib.html5parser.HTMLParser.phase |
pip._vendor.html5lib.html5parser.HTMLParser.phases |
pip._vendor.html5lib.html5parser.HTMLParser.strict |
pip._vendor.html5lib.html5parser.HTMLParser.tokenizer |
pip._vendor.html5lib.html5parser.HTMLParser.tokenizer_class |
pip._vendor.html5lib.html5parser.HTMLParser.tree |
Copyright 2014 Google Inc. All rights reserved.