stripHTML() handles entity replacement, which should be done post-strip

2025-12-30 23:32:57 -05:00 · 2012-09-07 04:54:59 +09:00 · 2012-09-07 04:54:59 +09:00 · b66d1479c2
commit b66d1479c2
parent 59cb45eda6
1 changed files with 0 additions and 3 deletions
--- a/anki/latex.py
+++ b/anki/latex.py
@@ -64,9 +64,6 @@ def _latexFromHtml(col, latex):
    # entitydefs defines nbsp as \xa0 instead of a standard space, so we
    # replace it first
    latex = latex.replace("&nbsp;", " ")
    for match in re.compile("&([a-z]+);", re.IGNORECASE).finditer(latex):
        if match.group(1) in entitydefs:
            latex = latex.replace(match.group(), entitydefs[match.group(1)])
    latex = re.sub("<br( /)?>", "\n", latex)
    # replace <div> etc with spaces
    latex = re.sub("<.+?>", " ", latex)