webkit
2cdf99a9e3038c7e01b3c37e8ad903ecbe5eecf1
https://github.com/WebKit/webkit
|
Classes | |
class | _BaseHTMLProcessor |
class | _HTMLSanitizer |
Functions | |
def | HTML (htmlSource, encoding='utf8') |
def | characters (text, isXML=False, guess=None) |
Variables | |
TIDY_MARKUP | |
PREFERRED_TIDY_INTERFACES | |
chardet | |
unicode_bom_map | |
xml_bom_map | |
sanitize: bringing sanity to the world of messed-up data
def planet.sanitize.characters(text, isXML=False, guess=None)
Takes a string text of unknown encoding and tries to provide a Unicode string for it.
def planet.sanitize.HTML(htmlSource, encoding='utf8')
planet.sanitize.chardet |
planet.sanitize.PREFERRED_TIDY_INTERFACES |
planet.sanitize.TIDY_MARKUP |
planet.sanitize.unicode_bom_map |
planet.sanitize.xml_bom_map |