Python: module AdvancedHTMLParser.utils

AdvancedHTMLParser.utils

Modules

re

Functions

addStartTag(contents, startTag)
addStartTag - Safely add a start tag to the document, taking into account the DOCTYPE @param contents <str> - Contents @param startTag <str> - Fully formed tag, i.e. <html>

escapeQuotes(value)
escapeQuotes - Escape quotes within a value (replaces " with &quot;) @param value <str> @return <str> - Escaped value

stripIEConditionals(contents, addHtmlIfMissing=True)
stripIEConditionals - Strips Internet Explorer conditional statements. @param contents <str> - Contents String @param addHtmlIfMissing <bool> - Since these normally encompass the "html" element, optionally add it back if missing.

unescapeQuotes(value)
unescapeQuotes - Unescapes quotes within a value (replaces &quot; with ") @param value <str> @return <str> - Unescaped value

Data

DOCTYPE_MATCH = re.compile('[\n]*[ \t]*(?P<tag><[!][ \t]*[dD][oO][cC][tT][yY][pP][eE].*[>])')
END_HTML = re.compile('.*</[ \t\r\n]*[hH][tT][mM][lL][ \t\r\n]*>.*', re.DOTALL)
IE_CONDITIONAL_PATTERN = re.compile('[<][!][-][-][ \t\r\n]*[\\[][ \t\r\n]*if.*-->', re.MULTILINE)
START_HTML = re.compile('.*<[ \t\r\n]*[hH][tT][mM][lL][ \t\r\n]*>.*', re.DOTALL)
__all__ = ('IE_CONDITIONAL_PATTERN', 'END_HTML', 'START_HTML', 'DOCTYPE_MATCH', 'stripIEConditionals', 'addStartTag', 'escapeQuotes', 'unescapeQuotes')

Data
DOCTYPE_MATCH = re.compile('[\n]*[ \t]*(?P<tag><[!][ \t]*[dD][oO][cC][tT][yY][pP][eE].*[>])')
END_HTML = re.compile('.*</[ \t\r\n]*[hH][tT][mM][lL][ \t\r\n]*>.*', re.DOTALL)
IE_CONDITIONAL_PATTERN = re.compile('[<][!][-][-][ \t\r\n]*[\\[][ \t\r\n]*if.*-->', re.MULTILINE)
START_HTML = re.compile('.*<[ \t\r\n]*[hH][tT][mM][lL][ \t\r\n]*>.*', re.DOTALL)
__all__ = ('IE_CONDITIONAL_PATTERN', 'END_HTML', 'START_HTML', 'DOCTYPE_MATCH', 'stripIEConditionals', 'addStartTag', 'escapeQuotes', 'unescapeQuotes')