cubicweb: comparison devtools/htmlparser.py

Legend: equal | deleted | inserted | replaced

-:321b99973b69
+:4ba4be5553cf
 STRICT_DOCTYPE = str(STRICT_DOCTYPE)
 TRANSITIONAL_DOCTYPE = str(TRANSITIONAL_DOCTYPE)
 ERR_COUNT = 0
-_REM_SCRIPT_RGX = re.compile(r"<script[^>]*>.*?</script>", re.U|re.M|re.I|re.S)
+_REM_SCRIPT_RGX = re.compile(br"<script[^>]*>.*?</script>", re.M|re.I|re.S)
 def _remove_script_tags(data):
 """Remove the script (usually javascript) tags to help the lxml
 XMLParser / HTMLParser do their job. Without that, they choke on
 tags embedded in JS strings.
 """
 # >>> cleaner.clean_html('<html><body><div/><br><span></body><html>')
 # '<html><body><div></div><br><span></span></body></html>'
 #
 # using that, we'll miss most actual validation error we want to
 # catch. For now, use dumb regexp
-return _REM_SCRIPT_RGX.sub('', data)
+return _REM_SCRIPT_RGX.sub(b'', data)
 class Validator(object):
 """ base validator API """
 parser = None

changeset 10696	4ba4be5553cf
parent 10662	10942ed172de