Merge branch 'master' of github.com:dae/libanki into some-fixes

2025-11-06 20:57:13 -05:00 · 2012-11-03 12:35:14 +01:00 · 2012-11-03 12:35:14 +01:00 · 1752652a4c
commit 1752652a4c
parent 34212ac06d 49df458409
9 changed files with 135 additions and 111 deletions
--- a/anki/collection.py
+++ b/anki/collection.py
@ -602,10 +602,10 @@ where c.nid == f.id
            "order by id desc limit 1", c.id)
        self.db.execute("delete from revlog where id = ?", last)
        # and finally, update daily counts
        # fixme: what to do in cramming case?
        n = 1 if c.queue == 3 else c.queue
        type = ("new", "lrn", "rev")[n]
        self.sched._updateStats(c, type, -1)
        self.sched.reps -= 1
        return c.id
    def _markOp(self, name):
@ -670,6 +670,10 @@ select id from notes where id not in (select distinct nid from cards)""")
        # field cache
        for m in self.models.all():
            self.updateFieldCache(self.models.nids(m))
        # new cards can't have a due position > 32 bits
        self.db.execute("""
 update cards set due = 1000000, mod = ?, usn = ? where due > 1000000
 and queue = 0""", intTime(), self.usn())
        # new card position
        self.conf['nextPos'] = self.db.scalar(
            "select max(due)+1 from cards where type = 0") or 0
--- a/anki/decks.py
+++ b/anki/decks.py
@ -221,16 +221,18 @@ class DeckManager(object):
        # make sure target node doesn't already exist
        if newName in self.allNames():
            raise DeckRenameError(_("That deck already exists."))
        # ensure we have parents
        newName = self._ensureParents(newName)
        # rename children
        for grp in self.all():
            if grp['name'].startswith(g['name'] + "::"):
                grp['name'] = grp['name'].replace(g['name']+ "::",
                                                  newName + "::")
                self.save(grp)
-        # ensure we have parents
+        # adjust name
        newName = self._ensureParents(newName)
        # adjust name and save
        g['name'] = newName
        # ensure we have parents again, as we may have renamed parent->child
        newName = self._ensureParents(newName)
        self.save(g)
        # renaming may have altered active did order
        self.maybeAddToActive()
--- a/anki/importing/anki2.py
+++ b/anki/importing/anki2.py
@ -4,21 +4,14 @@
 import os
 from anki import Collection
-from anki.utils import intTime, splitFields, joinFields, checksum, guid64
+from anki.utils import intTime, splitFields, joinFields, checksum, guid64, \
    incGuid
 from anki.importing.base import Importer
 from anki.lang import _
 from anki.lang import ngettext
-#
+MID = 2
-# Import a .anki2 file into the current collection. Used for migration from
+GUID = 1
 # 1.x, shared decks, and import from a packaged deck.
 #
 # We can't rely on internal ids, so we:
 # - compare notes by guid
 # - compare models by schema signature
 # - compare cards by note guid + ordinal
 # - compare decks by name
 #
 class Anki2Importer(Importer):
@ -56,10 +49,9 @@ class Anki2Importer(Importer):
    # Notes
    ######################################################################
    # - should note new for wizard
    def _importNotes(self):
-        # build guid -> (id,mod,mid) hash
+        # build guid -> (id,mod,mid) hash & map of existing note ids
        self._notes = {}
        existing = {}
        for id, guid, mod, mid in self.dst.db.execute(
@ -78,44 +70,20 @@ class Anki2Importer(Importer):
            "select * from notes"):
            # turn the db result into a mutable list
            note = list(note)
-            guid, mid = note[1:3]
+            shouldAdd = self._uniquifyNote(note)
-            canUseExisting = False
+            if shouldAdd:
            alreadyHaveGuid = False
            # do we have the same guid?
            if guid in self._notes:
                alreadyHaveGuid = True
                # and do they share the same model id?
                if self._notes[guid][2] == mid:
                    # and do they share the same schema?
                    srcM = self.src.models.get(mid)
                    dstM = self.dst.models.get(self._notes[guid][2])
                    if (self.src.models.scmhash(srcM) ==
                        self.src.models.scmhash(dstM)):
                        # then it's safe to treat as an exact duplicate
                        canUseExisting = True
            # if we can't reuse an existing one, we'll need to add new
            if not canUseExisting:
                # get corresponding local model
                lmid = self._mid(mid)
                # ensure id is unique
                while note[0] in existing:
                    note[0] += 999
                existing[note[0]] = True
-                # rewrite internal ids, models, etc
+                # bump usn
                note[2] = lmid
                note[4] = usn
                # update media references in case of dupes
-                note[6] = self._mungeMedia(mid, note[6])
+                note[6] = self._mungeMedia(note[MID], note[6])
                add.append(note)
                dirty.append(note[0])
-                # if it was originally the same as a note in this deck but the
+                # note we have the added the guid
-                # models have diverged, we need to change the guid
+                self._notes[note[GUID]] = (note[0], note[3], note[MID])
                if alreadyHaveGuid:
                    guid = guid64()
                    self._changedGuids[note[1]] = guid
                    note[1] = guid
                # note we have the added note
                self._notes[guid] = (note[0], note[3], note[2])
            else:
                dupes += 1
                ## update existing note - not yet tested; for post 2.0
@ -136,61 +104,69 @@ class Anki2Importer(Importer):
        self.dst.updateFieldCache(dirty)
        self.dst.tags.registerNotes(dirty)
    # determine if note is a duplicate, and adjust mid and/or guid as required
    # returns true if note should be added
    def _uniquifyNote(self, note):
        origGuid = note[GUID]
        srcMid = note[MID]
        dstMid = self._mid(srcMid)
        # duplicate schemas?
        if srcMid == dstMid:
            return origGuid not in self._notes
        # differing schemas
        note[MID] = dstMid
        if origGuid not in self._notes:
            return True
        # as the schemas differ and we already have a note with a different
        # note type, this note needs a new guid
        while True:
            note[GUID] = incGuid(note[GUID])
            self._changedGuids[origGuid] = note[GUID]
            # if we don't have an existing guid, we can add
            if note[GUID] not in self._notes:
                return True
            # if the existing guid shares the same mid, we can reuse
            if dstMid == self._notes[note[GUID]][MID]:
                return False
    # Models
    ######################################################################
    # Models in the two decks may share an ID but not a schema, so we need to
    # compare the field & template signature rather than just rely on ID. If
-    # we created a new model on a conflict then multiple imports would end up
+    # the schemas don't match, we increment the mid and try again, creating a
-    # with lots of models however, so we store a list of "alternate versions"
+    # new model if necessary.
    # of a model in the model, so that importing a model is idempotent.
    def _prepareModels(self):
        "Prepare index of schema hashes."
        self._modelMap = {}
-    def _mid(self, mid):
+    def _mid(self, srcMid):
        "Return local id for remote MID."
        # already processed this mid?
-        if mid in self._modelMap:
+        if srcMid in self._modelMap:
-            return self._modelMap[mid]
+            return self._modelMap[srcMid]
-        src = self.src.models.get(mid).copy()
+        mid = srcMid
-        # if it doesn't exist, we'll copy it over, preserving id
+        srcModel = self.src.models.get(srcMid)
-        if not self.dst.models.have(mid):
+        srcScm = self.src.models.scmhash(srcModel)
-            self.dst.models.update(src)
+        while True:
-            # if we're importing with a prefix, make the model default to it
+            # missing from target col?
-            if self.deckPrefix:
+            if not self.dst.models.have(mid):
-                src['did'] = self.dst.decks.current()['id']
+                # copy it over
-                # and give it a unique name if it's not a shared deck
+                model = srcModel.copy()
-                if self.deckPrefix != "shared":
+                model['id'] = mid
-                    src['name'] += " (%s)" % self.deckPrefix
+                self.dst.models.update(model)
-            # make sure to bump usn
+                break
-            self.dst.models.save(src)
+            # there's an existing model; do the schemas match?
-            self._modelMap[mid] = mid
+            dstModel = self.dst.models.get(mid)
-            return mid
+            dstScm = self.dst.models.scmhash(dstModel)
-        # if it does exist, do the schema match?
+            if srcScm == dstScm:
-        dst = self.dst.models.get(mid)
+                # they do; we can reuse this mid
-        shash = self.src.models.scmhash(src)
+                break
-        dhash = self.src.models.scmhash(dst)
+            # as they don't match, try next id
-        if shash == dhash:
+            mid += 1
-            # reuse without modification
+        # save map and return new mid
-            self._modelMap[mid] = mid
+        self._modelMap[srcMid] = mid
-            return mid
+        return mid
        # try any alternative versions
        vers = dst.get("vers")
        for v in vers:
            m = self.dst.models.get(v)
            if self.dst.models.scmhash(m) == shash:
                # valid alternate found; use that
                self._modelMap[mid] = m['id']
                return m['id']
        # need to add a new alternate version, with new id
        self.dst.models.add(src)
        if vers:
            dst['vers'].append(src['id'])
        else:
            dst['vers'] = [src['id']]
        self.dst.models.save(dst)
        return src['id']
    # Decks
    ######################################################################
--- a/anki/models.py
+++ b/anki/models.py
@ -28,7 +28,7 @@ defaultModel = {
    'latexPost': "\\end{document}",
    'mod': 0,
    'usn': 0,
-    'vers': [],
+    'vers': [], # FIXME: remove when other clients have caught up
    'type': MODEL_STD,
    'css': """\
 .card {
--- a/anki/sched.py
+++ b/anki/sched.py
@ -129,8 +129,10 @@ order by due""" % self._deckLimit(),
    def unburyCards(self):
        "Unbury cards when closing."
        mod = self.col.db.mod
        self.col.db.execute(
            "update cards set queue = type where queue = -2")
        self.col.db.mod = mod
    # Rev/lrn/time daily stats
    ##########################################################################
@ -203,10 +205,20 @@ order by due""" % self._deckLimit(),
            parts = parts[:-1]
            return "::".join(parts)
        for deck in decks:
            # if we've already seen the exact same deck name, remove the
            # invalid duplicate and reload
            if deck['name'] in lims:
                self.col.decks.rem(deck['id'], cardsToo=False, childrenToo=True)
                return self.deckDueList()
            p = parent(deck['name'])
            # new
            nlim = self._deckNewLimitSingle(deck)
            if p:
                if p not in lims:
                    # if parent was missing, this deck is invalid, and we
                    # need to reload the deck list
                    self.col.decks.rem(deck['id'], cardsToo=False, childrenToo=True)
                    return self.deckDueList()
                nlim = min(nlim, lims[p][0])
            new = self._newForDeck(deck['id'], nlim)
            # learning
@ -590,7 +602,10 @@ did = ? and queue = 3 and due <= ? limit ?""",
                card.due = self.col.nextID("pos")
    def _startingLeft(self, card):
-        conf = self._lrnConf(card)
+        if card.type == 2:
            conf = self._lapseConf(card)
        else:
            conf = self._lrnConf(card)
        tot = len(conf['delays'])
        tod = self._leftToday(conf['delays'], tot)
        return tot + tod*1000
@ -647,26 +662,24 @@ did = ? and queue = 3 and due <= ? limit ?""",
            time.sleep(0.01)
            log()
-    def removeFailed(self, ids=None, expiredOnly=False):
+    def removeLrn(self, ids=None):
-        "Remove failed cards from the learning queue."
+        "Remove cards from the learning queues."
        if ids:
            extra = " and id in "+ids2str(ids)
        else:
            # benchmarks indicate it's about 10x faster to search all decks
            # with the index than scan the table
            extra = " and did in "+ids2str(self.col.decks.allIds())
-        if expiredOnly:
+        # review cards in relearning
            extra += " and odue <= %d" % self.today
        mod = self.col.db.mod
        self.col.db.execute("""
 update cards set
 due = odue, queue = 2, mod = %d, usn = %d, odue = 0
-where queue = 1 and type = 2
+where queue in (1,3) and type = 2
 %s
 """ % (intTime(), self.col.usn(), extra))
-        if expiredOnly:
+        # new cards in learning
-            # we don't want to bump the mod time when removing expired
+        self.forgetCards(self.col.db.list(
-            self.col.db.mod = mod
+            "select id from cards where queue in (1,3) %s" % extra))
    def _lrnForDeck(self, did):
        cnt = self.col.db.scalar(
@ -793,10 +806,9 @@ select id from cards where did in %s and queue = 2 and due <= ? limit ?)"""
            card.odue = card.due
        delay = self._delayForGrade(conf, 0)
        card.due = int(delay + time.time())
        card.left = self._startingLeft(card)
        # queue 1
        if card.due < self.dayCutoff:
            card.left = len(conf['delays'])
            card.left += self._leftToday(conf['delays'], card.left)*1000
            self.lrnCount += card.left/1000
            card.queue = 1
            heappush(self._lrnQueue, (card.due, card.id))
@ -1202,7 +1214,7 @@ To study outside of the normal schedule, click the Custom Study button below."""
    def suspendCards(self, ids):
        "Suspend cards."
        self.remFromDyn(ids)
-        self.removeFailed(ids)
+        self.removeLrn(ids)
        self.col.db.execute(
            "update cards set queue=-1,mod=?,usn=? where id in "+
            ids2str(ids), intTime(), self.col.usn())
--- a/anki/upgrade.py
+++ b/anki/upgrade.py
@ -341,8 +341,11 @@ insert or replace into col select id, cast(created as int), :t,
        mods = {}
        for row in db.all(
            "select id, name from models"):
-            # use only first 31 bits
+            # use only first 31 bits if not old anki id
-            t = abs(row[0]) >> 32
+            t = abs(row[0])
            if t > 4294967296:
                t >>= 32
            assert t > 0
            m = anki.models.defaultModel.copy()
            m['id'] = t
            m['name'] = row[1]
--- a/anki/utils.py
+++ b/anki/utils.py
@ -198,22 +198,36 @@ def maxID(db):
 # used in ankiweb
 def base62(num, extra=""):
-    s = string
+    s = string; table = s.ascii_letters + s.digits + extra
    table = s.ascii_letters + s.digits + extra
    buf = ""
    while num:
        num, i = divmod(num, len(table))
        buf = table[i] + buf
    return buf
 _base91_extra_chars = "!#$%&()*+,-./:;<=>?@[]^_`{|}~"
 def base91(num):
    # all printable characters minus quotes, backslash and separators
-    return base62(num, "!#$%&()*+,-./:;<=>?@[]^_`{|}~")
+    return base62(num, _base91_extra_chars)
 def guid64():
    "Return a base91-encoded 64bit random number."
    return base91(random.randint(0, 2**64-1))
 # increment a guid by one, for note type conflicts
 def incGuid(guid):
    return _incGuid(guid[::-1])[::-1]
 def _incGuid(guid):
    s = string; table = s.ascii_letters + s.digits + _base91_extra_chars
    idx = table.index(guid[0])
    if idx + 1 == len(table):
        # overflow
        guid = table[0] + _incGuid(guid[1:])
    else:
        guid = table[idx+1] + guid[1:]
    return guid
 # Fields
 ##############################################################################
--- a/tests/test_importing.py
+++ b/tests/test_importing.py
@ -157,6 +157,13 @@ def test_anki1_diffmodels():
    after = dst.noteCount()
    # as the model schemas differ, should have been imported as new model
    assert after == before + 1
    # repeating the process should do nothing
    beforeModels = len(dst.models.all())
    imp = Anki1Importer(dst, tmp)
    imp.run()
    after = dst.noteCount()
    assert after == before + 1
    assert beforeModels == len(dst.models.all())
 def test_anki2_diffmodels():
    # create a new empty deck
@ -179,6 +186,12 @@ def test_anki2_diffmodels():
    assert after == before + 1
    # and the new model should have both cards
    assert dst.cardCount() == 3
    # repeating the process should do nothing
    imp = AnkiPackageImporter(dst, tmp)
    imp.run()
    after = dst.noteCount()
    assert after == before + 1
    assert dst.cardCount() == 3
 def test_csv():
    deck = getEmptyDeck()
--- a/tests/test_sched.py
+++ b/tests/test_sched.py
@ -165,7 +165,7 @@ def test_learn():
    c.queue = 1
    c.odue = 321
    c.flush()
-    d.sched.removeFailed()
+    d.sched.removeLrn()
    c.load()
    assert c.queue == 2
    assert c.due == 321