From b403f20cae8fcdd7c3ff4c8d21766998e8efaba0 Mon Sep 17 00:00:00 2001 From: Brayan Oliveira <69634269+BrayanDSO@users.noreply.github.com> Date: Sun, 6 Mar 2022 22:02:30 -0300 Subject: [PATCH] Fix html_media_regexps (#1710) * Fix html_media_regexps * Update CONTRIBUTORS --- CONTRIBUTORS | 1 + pylib/anki/media.py | 8 ++++---- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/CONTRIBUTORS b/CONTRIBUTORS index 56f2ea18a..9a3299b5c 100644 --- a/CONTRIBUTORS +++ b/CONTRIBUTORS @@ -97,6 +97,7 @@ Sam Bradshaw gnnoh Sachin Govind Patric Cunha +Brayan Oliveira ******************** diff --git a/pylib/anki/media.py b/pylib/anki/media.py index 941fe3920..86e3589cf 100644 --- a/pylib/anki/media.py +++ b/pylib/anki/media.py @@ -34,13 +34,13 @@ class MediaManager(DeprecatedNamesMixin): sound_regexps = [r"(?i)(\[sound:(?P<fname>[^]]+)\])"] html_media_regexps = [ # src element quoted case - r"(?i)(<[img|audio][^>]* src=(?P<str>[\"'])(?P<fname>[^>]+?)(?P=str)[^>]*>)", + r"(?i)(<(?:img|audio)\b[^>]* src=(?P<str>[\"'])(?P<fname>[^>]+?)(?P=str)[^>]*>)", # unquoted case - r"(?i)(<[img|audio][^>]* src=(?!['\"])(?P<fname>[^ >]+)[^>]*?>)", + r"(?i)(<(?:img|audio)\b[^>]* src=(?!['\"])(?P<fname>[^ >]+)[^>]*?>)", # src element quoted case - r"(?i)(<object[^>]* data=(?P<str>[\"'])(?P<fname>[^>]+?)(?P=str)[^>]*>)", + r"(?i)(<object\b[^>]* data=(?P<str>[\"'])(?P<fname>[^>]+?)(?P=str)[^>]*>)", # unquoted case - r"(?i)(<object[^>]* data=(?!['\"])(?P<fname>[^ >]+)[^>]*?>)", + r"(?i)(<object\b[^>]* data=(?!['\"])(?P<fname>[^ >]+)[^>]*?>)", ] regexps = sound_regexps + html_media_regexps