mirror of
https://github.com/ankitects/anki.git
synced 2025-09-18 22:12:21 -04:00
cleanup / renames
・ soundRegexps → sound_regexps ・ htmlRegexps → html_media_regexps ・ HTML_TAGS → HTML_MEDIA_TAGS ・ escapeImages → escape_media_filenames + alias ・ strip_html_preserving_image_filenames → strip_html_preserving_media_filenames
This commit is contained in:
parent
6e9aaad11e
commit
e68a40f13e
8 changed files with 35 additions and 28 deletions
|
@ -33,8 +33,8 @@ def media_paths_from_col_path(col_path: str) -> Tuple[str, str]:
|
|||
|
||||
class MediaManager:
|
||||
|
||||
soundRegexps = [r"(?i)(\[sound:(?P<fname>[^]]+)\])"]
|
||||
htmlRegexps = [
|
||||
sound_regexps = [r"(?i)(\[sound:(?P<fname>[^]]+)\])"]
|
||||
html_media_regexps = [
|
||||
# src element quoted case
|
||||
r"(?i)(<[img|audio][^>]* src=(?P<str>[\"'])(?P<fname>[^>]+?)(?P=str)[^>]*>)",
|
||||
# unquoted case
|
||||
|
@ -44,7 +44,7 @@ class MediaManager:
|
|||
# unquoted case
|
||||
r"(?i)(<object[^>]* data=(?!['\"])(?P<fname>[^ >]+)[^>]*?>)",
|
||||
]
|
||||
regexps = soundRegexps + htmlRegexps
|
||||
regexps = sound_regexps + html_media_regexps
|
||||
|
||||
def __init__(self, col: anki.collection.Collection, server: bool) -> None:
|
||||
self.col = col.weakref()
|
||||
|
@ -163,7 +163,11 @@ class MediaManager:
|
|||
return txt
|
||||
|
||||
def escapeImages(self, string: str, unescape: bool = False) -> str:
|
||||
"Apply or remove percent encoding to image filenames."
|
||||
"escape_media_filenames alias for compatibility with add-ons."
|
||||
return self.escape_media_filenames(string, unescape)
|
||||
|
||||
def escape_media_filenames(self, string: str, unescape: bool = False) -> str:
|
||||
"Apply or remove percent encoding to filenames in html tags (audio, image, object)."
|
||||
fn: Callable
|
||||
if unescape:
|
||||
fn = urllib.parse.unquote
|
||||
|
@ -177,7 +181,7 @@ class MediaManager:
|
|||
return tag
|
||||
return tag.replace(fname, fn(fname))
|
||||
|
||||
for reg in self.htmlRegexps:
|
||||
for reg in self.html_media_regexps:
|
||||
string = re.sub(reg, repl, string)
|
||||
return string
|
||||
|
||||
|
|
|
@ -46,7 +46,7 @@ def test_strings():
|
|||
assert sp("aoeu") == "aoeu"
|
||||
assert sp("aoeu[sound:foo.mp3]aoeu") == "aoeuaoeu"
|
||||
assert sp("a<img src=yo>oeu") == "aoeu"
|
||||
es = col.media.escapeImages
|
||||
es = col.media.escape_media_filenames
|
||||
assert es("aoeu") == "aoeu"
|
||||
assert es("<img src='http://foo.com'>") == "<img src='http://foo.com'>"
|
||||
assert es('<img src="foo bar.jpg">') == '<img src="foo%20bar.jpg">'
|
||||
|
|
|
@ -450,7 +450,8 @@ class Editor:
|
|||
return
|
||||
|
||||
data = [
|
||||
(fld, self.mw.col.media.escapeImages(val)) for fld, val in self.note.items()
|
||||
(fld, self.mw.col.media.escape_media_filenames(val))
|
||||
for fld, val in self.note.items()
|
||||
]
|
||||
self.widget.show()
|
||||
self.updateTags()
|
||||
|
@ -547,11 +548,13 @@ class Editor:
|
|||
if html.find(">") > -1:
|
||||
# filter html through beautifulsoup so we can strip out things like a
|
||||
# leading </div>
|
||||
html_escaped = self.mw.col.media.escapeImages(html)
|
||||
html_escaped = self.mw.col.media.escape_media_filenames(html)
|
||||
with warnings.catch_warnings():
|
||||
warnings.simplefilter("ignore", UserWarning)
|
||||
html_escaped = str(BeautifulSoup(html_escaped, "html.parser"))
|
||||
html = self.mw.col.media.escapeImages(html_escaped, unescape=True)
|
||||
html = self.mw.col.media.escape_media_filenames(
|
||||
html_escaped, unescape=True
|
||||
)
|
||||
self.note.fields[field] = html
|
||||
if not self.addMode:
|
||||
self.note.flush()
|
||||
|
@ -1231,7 +1234,7 @@ def remove_null_bytes(txt, editor):
|
|||
|
||||
def reverse_url_quoting(txt, editor):
|
||||
# reverse the url quoting we added to get images to display
|
||||
return editor.mw.col.media.escapeImages(txt, unescape=True)
|
||||
return editor.mw.col.media.escape_media_filenames(txt, unescape=True)
|
||||
|
||||
|
||||
gui_hooks.editor_will_use_font_for_field.append(fontMungeHack)
|
||||
|
|
|
@ -483,7 +483,7 @@ close the profile or restart Anki."""
|
|||
return anki.sound.strip_av_refs(text)
|
||||
|
||||
def prepare_card_text_for_display(self, text: str) -> str:
|
||||
text = self.col.media.escapeImages(text)
|
||||
text = self.col.media.escape_media_filenames(text)
|
||||
text = self._add_play_buttons(text)
|
||||
return text
|
||||
|
||||
|
|
|
@ -548,7 +548,7 @@ def restore_combo_history(comboBox: QComboBox, name: str):
|
|||
|
||||
def mungeQA(col, txt):
|
||||
print("mungeQA() deprecated; use mw.prepare_card_text_for_display()")
|
||||
txt = col.media.escapeImages(txt)
|
||||
txt = col.media.escape_media_filenames(txt)
|
||||
return txt
|
||||
|
||||
|
||||
|
|
|
@ -10,7 +10,7 @@ use crate::{
|
|||
err::{AnkiError, Result},
|
||||
notetype::{CardGenContext, NoteField, NoteType, NoteTypeID},
|
||||
template::field_is_empty,
|
||||
text::{ensure_string_in_nfc, normalize_to_nfc, strip_html_preserving_image_filenames},
|
||||
text::{ensure_string_in_nfc, normalize_to_nfc, strip_html_preserving_media_filenames},
|
||||
timestamp::TimestampSecs,
|
||||
types::Usn,
|
||||
};
|
||||
|
@ -100,12 +100,12 @@ impl Note {
|
|||
}
|
||||
}
|
||||
|
||||
let field1_nohtml = strip_html_preserving_image_filenames(&self.fields()[0]);
|
||||
let field1_nohtml = strip_html_preserving_media_filenames(&self.fields()[0]);
|
||||
let checksum = field_checksum(field1_nohtml.as_ref());
|
||||
let sort_field = if nt.config.sort_field_idx == 0 {
|
||||
field1_nohtml
|
||||
} else {
|
||||
strip_html_preserving_image_filenames(
|
||||
strip_html_preserving_media_filenames(
|
||||
self.fields
|
||||
.get(nt.config.sort_field_idx as usize)
|
||||
.map(AsRef::as_ref)
|
||||
|
@ -208,7 +208,7 @@ impl From<pb::Note> for Note {
|
|||
}
|
||||
}
|
||||
|
||||
/// Text must be passed to strip_html_preserving_image_filenames() by
|
||||
/// Text must be passed to strip_html_preserving_media_filenames() by
|
||||
/// caller prior to passing in here.
|
||||
pub(crate) fn field_checksum(text: &str) -> u32 {
|
||||
let digest = sha1::Sha1::from(text).digest().bytes();
|
||||
|
@ -429,7 +429,7 @@ impl Collection {
|
|||
} else {
|
||||
field1.into()
|
||||
};
|
||||
let stripped = strip_html_preserving_image_filenames(&field1);
|
||||
let stripped = strip_html_preserving_media_filenames(&field1);
|
||||
if stripped.trim().is_empty() {
|
||||
Ok(DuplicateState::Empty)
|
||||
} else {
|
||||
|
@ -438,7 +438,7 @@ impl Collection {
|
|||
self.storage
|
||||
.note_fields_by_checksum(note.id, note.notetype_id, csum)?
|
||||
{
|
||||
if strip_html_preserving_image_filenames(&field) == stripped {
|
||||
if strip_html_preserving_media_filenames(&field) == stripped {
|
||||
return Ok(DuplicateState::Duplicate);
|
||||
}
|
||||
}
|
||||
|
|
|
@ -10,7 +10,7 @@ use crate::{
|
|||
notes::field_checksum,
|
||||
notetype::NoteTypeID,
|
||||
text::{matches_wildcard, text_to_re},
|
||||
text::{normalize_to_nfc, strip_html_preserving_image_filenames, without_combining},
|
||||
text::{normalize_to_nfc, strip_html_preserving_media_filenames, without_combining},
|
||||
timestamp::TimestampSecs,
|
||||
};
|
||||
use lazy_static::lazy_static;
|
||||
|
@ -424,7 +424,7 @@ impl SqlWriter<'_> {
|
|||
}
|
||||
|
||||
fn write_dupes(&mut self, ntid: NoteTypeID, text: &str) {
|
||||
let text_nohtml = strip_html_preserving_image_filenames(text);
|
||||
let text_nohtml = strip_html_preserving_media_filenames(text);
|
||||
let csum = field_checksum(text_nohtml.as_ref());
|
||||
write!(
|
||||
self.sql,
|
||||
|
|
|
@ -32,7 +32,7 @@ lazy_static! {
|
|||
))
|
||||
.unwrap();
|
||||
|
||||
static ref HTML_TAGS: Regex = Regex::new(
|
||||
static ref HTML_MEDIA_TAGS: Regex = Regex::new(
|
||||
r#"(?xsi)
|
||||
# the start of the image, audio, or object tag
|
||||
<\b(?:img|audio|object)\b[^>]+\b(?:src|data)\b=
|
||||
|
@ -149,7 +149,7 @@ pub(crate) struct MediaRef<'a> {
|
|||
pub(crate) fn extract_media_refs(text: &str) -> Vec<MediaRef> {
|
||||
let mut out = vec![];
|
||||
|
||||
for caps in HTML_TAGS.captures_iter(text) {
|
||||
for caps in HTML_MEDIA_TAGS.captures_iter(text) {
|
||||
let fname = caps
|
||||
.get(1)
|
||||
.or_else(|| caps.get(2))
|
||||
|
@ -213,8 +213,8 @@ fn tts_tag_from_string<'a>(field_text: &'a str, args: &'a str) -> AVTag {
|
|||
}
|
||||
}
|
||||
|
||||
pub fn strip_html_preserving_image_filenames(html: &str) -> Cow<str> {
|
||||
let without_fnames = HTML_TAGS.replace_all(html, r" ${1}${2}${3} ");
|
||||
pub fn strip_html_preserving_media_filenames(html: &str) -> Cow<str> {
|
||||
let without_fnames = HTML_MEDIA_TAGS.replace_all(html, r" ${1}${2}${3} ");
|
||||
let without_html = HTML.replace_all(&without_fnames, "");
|
||||
// no changes?
|
||||
if let Cow::Borrowed(b) = without_html {
|
||||
|
@ -306,7 +306,7 @@ mod test {
|
|||
use super::matches_wildcard;
|
||||
use crate::text::without_combining;
|
||||
use crate::text::{
|
||||
extract_av_tags, strip_av_tags, strip_html, strip_html_preserving_image_filenames, AVTag,
|
||||
extract_av_tags, strip_av_tags, strip_html, strip_html_preserving_media_filenames, AVTag,
|
||||
};
|
||||
use std::borrow::Cow;
|
||||
|
||||
|
@ -317,14 +317,14 @@ mod test {
|
|||
assert_eq!(strip_html("so<SCRIPT>t<b>e</b>st</script>me"), "some");
|
||||
|
||||
assert_eq!(
|
||||
strip_html_preserving_image_filenames("<img src=foo.jpg>"),
|
||||
strip_html_preserving_media_filenames("<img src=foo.jpg>"),
|
||||
" foo.jpg "
|
||||
);
|
||||
assert_eq!(
|
||||
strip_html_preserving_image_filenames("<img src='foo.jpg'><html>"),
|
||||
strip_html_preserving_media_filenames("<img src='foo.jpg'><html>"),
|
||||
" foo.jpg "
|
||||
);
|
||||
assert_eq!(strip_html_preserving_image_filenames("<html>"), "");
|
||||
assert_eq!(strip_html_preserving_media_filenames("<html>"), "");
|
||||
}
|
||||
|
||||
#[test]
|
||||
|
|
Loading…
Reference in a new issue