stripHTML() should work when a tag is split over multiple lines

This commit is contained in:
Damien Elmes 2017-09-30 15:33:05 +10:00
parent fff49a1370
commit b04c2212b5

View file

@@ -127,7 +127,7 @@ def fmtFloat(float_value, point=1):
##############################################################################
# Precompiled patterns for HTML clean-up.

# <style ...>...</style> blocks, case-insensitive; "." also matches newlines.
reStyle = re.compile("(?si)<style.*?>.*?</style>")
# <script ...>...</script> blocks, case-insensitive; "." also matches newlines.
reScript = re.compile("(?si)<script.*?>.*?</script>")
# Any single <...> tag (non-greedy). The (?s) flag lets "." match newlines so
# that a tag split over multiple lines is still matched as one tag; without
# it, such a tag would not be matched at all.
reTag = re.compile("(?s)<.*?>")
# Entity references such as "&amp;" or "&#39;". Raw string so that "\w" is
# passed to the regex engine instead of being an invalid string escape.
reEnts = re.compile(r"&#?\w+;")
# <img> tags, case-insensitive; group 1 captures the (optionally quoted)
# value of the src attribute.
reMedia = re.compile("(?i)<img[^>]+src=[\"']?([^\"'>]+)[\"']?[^>]*>")