start work on id refactor - models first

The approach of using incrementing id numbers works for syncing if we assume
the server is canonical and all other clients rewrite their ids as necessary,
but upon reflection it is not sufficient for merging decks in general, as we
have no way of knowing whether objects with the same id are actually the same
or not. So we need some way of uniquely identifying the object.

One approach would be to go back to Anki 1.0's random 64-bit numbers, but as
outlined in a previous commit, such large numbers can't be handled easily in
some languages like JavaScript, and they tend to be fragmented on disk, which
impacts performance. It's much better if we can keep content added at the same
time in the same place on disk, so that operations like syncing, which are
mainly interested in newly added content, can run faster.

Another approach is to add a separate column containing the unique id, which
is what Mnemosyne 2.0 will be doing. Unfortunately it means adding an index
for that column, leading to slower inserts and larger deck files. And if the
current sequential ids are kept, a bunch of code needs to be kept to ensure ids
don't conflict when merging.

To address the above, the plan is to use a millisecond timestamp as the id.
This ensures disk order reflects creation order, allows us to merge the id and
crt columns, avoids the need for a separate index, and saves us from worrying
about rewriting ids. There is of course a small chance that the objects to be
merged were created in exactly the same millisecond, but this is extremely
unlikely.

This commit changes models. Other objects will follow.
This commit is contained in:
Damien Elmes 2011-08-26 21:08:30 +09:00
parent 9de16289ba
commit 6644c04852
7 changed files with 25 additions and 23 deletions

View file

@ -406,6 +406,9 @@ select id from cards where fid in (select id from facts where mid = ?)""",
def allCSS(self): def allCSS(self):
return "\n".join(self.db.list("select css from models")) return "\n".join(self.db.list("select css from models"))
def modelId(self, name):
return self.db.scalar("select id from models where name = ?", name)
# Field checksums and sorting fields # Field checksums and sorting fields
########################################################################## ##########################################################################

View file

@ -63,24 +63,22 @@ class Model(object):
self.id = id self.id = id
self.load() self.load()
else: else:
self.id = None self.id = intTime(1000)
self.name = u"" self.name = u""
self.crt = intTime() self.mod = intTime()
self.mod = self.crt
self.conf = defaultConf.copy() self.conf = defaultConf.copy()
self.css = "" self.css = ""
self.fields = [] self.fields = []
self.templates = [] self.templates = []
def load(self): def load(self):
(self.crt, (self.mod,
self.mod,
self.name, self.name,
self.fields, self.fields,
self.templates, self.templates,
self.conf, self.conf,
self.css) = self.deck.db.first(""" self.css) = self.deck.db.first("""
select crt, mod, name, flds, tmpls, conf, css from models where id = ?""", self.id) select mod, name, flds, tmpls, conf, css from models where id = ?""", self.id)
self.fields = simplejson.loads(self.fields) self.fields = simplejson.loads(self.fields)
self.templates = simplejson.loads(self.templates) self.templates = simplejson.loads(self.templates)
self.conf = simplejson.loads(self.conf) self.conf = simplejson.loads(self.conf)
@ -89,8 +87,8 @@ select crt, mod, name, flds, tmpls, conf, css from models where id = ?""", self.
self.mod = intTime() self.mod = intTime()
self.css = self.genCSS() self.css = self.genCSS()
ret = self.deck.db.execute(""" ret = self.deck.db.execute("""
insert or replace into models values (?, ?, ?, ?, ?, ?, ?, ?)""", insert or replace into models values (?, ?, ?, ?, ?, ?, ?)""",
self.id, self.crt, self.mod, self.name, self.id, self.mod, self.name,
simplejson.dumps(self.fields), simplejson.dumps(self.fields),
simplejson.dumps(self.templates), simplejson.dumps(self.templates),
simplejson.dumps(self.conf), simplejson.dumps(self.conf),

View file

@ -33,10 +33,9 @@ def Deck(path, queue=True, lock=True):
if ver < CURRENT_VERSION: if ver < CURRENT_VERSION:
_upgradeDeck(deck, ver) _upgradeDeck(deck, ver)
elif create: elif create:
deck.addModel(BasicModel(deck)) # add in reverse order so basic is default
deck.addModel(ClozeModel(deck)) deck.addModel(ClozeModel(deck))
# default to basic deck.addModel(BasicModel(deck))
deck.conf['currentModelId'] = 1
deck.save() deck.save()
if lock: if lock:
deck.lock() deck.lock()
@ -111,7 +110,6 @@ create table if not exists fsums (
create table if not exists models ( create table if not exists models (
id integer primary key, id integer primary key,
crt integer not null,
mod integer not null, mod integer not null,
name text not null, name text not null,
flds text not null, flds text not null,
@ -321,7 +319,7 @@ from facts order by created""")
import anki.models import anki.models
_moveTable(db, "models") _moveTable(db, "models")
db.execute(""" db.execute("""
insert into models select id, cast(created as int), cast(modified as int), insert into models select id, cast(created*1000 as int),
name, "{}", "{}", ?, "" from models2""", simplejson.dumps( name, "{}", "{}", ?, "" from models2""", simplejson.dumps(
anki.models.defaultConf)) anki.models.defaultConf))
db.execute("drop table models2") db.execute("drop table models2")
@ -514,9 +512,10 @@ def _fixupModels(deck):
# update ordinals # update ordinals
m._updateFieldOrds() m._updateFieldOrds()
m._updateTemplOrds() m._updateTemplOrds()
# rewrite id # we've temporarily stored the model creation time in the mod time
old = m.id old = m.id
m.id = c+1 m.id = m.mod
m.mod = intTime()
m.flush() m.flush()
deck.db.execute("update facts set mid = ? where mid = ?", m.id, old) deck.db.execute("update facts set mid = ? where mid = ?", m.id, old)

View file

@ -23,8 +23,9 @@ if sys.version_info[1] < 5:
# Time handling # Time handling
############################################################################## ##############################################################################
def intTime(): def intTime(scale=1):
return int(time.time()) "The time in integer seconds. Pass scale=1000 to get milliseconds."
return int(time.time()*scale)
timeTable = { timeTable = {
"years": lambda n: ngettext("%s year", "%s years", n), "years": lambda n: ngettext("%s year", "%s years", n),

View file

@ -3,6 +3,7 @@
import time import time
from anki.db import DB from anki.db import DB
from anki.consts import * from anki.consts import *
from anki.utils import hexifyID
from tests.shared import getEmptyDeck from tests.shared import getEmptyDeck
def test_genCards(): def test_genCards():
@ -84,7 +85,7 @@ def test_misc():
f['Back'] = u'2' f['Back'] = u'2'
d.addFact(f) d.addFact(f)
c = f.cards()[0] c = f.cards()[0]
assert c.cssClass() == "cm1-0" id = d.conf['currentModelId']
assert c.cssClass() == "cm%s-0" % hexifyID(id)
assert c.fact().id == 1 assert c.fact().id == 1
assert c.model().id == 1
assert c.template()['ord'] == 0 assert c.template()['ord'] == 0

View file

@ -110,7 +110,7 @@ def test_text():
def test_cloze(): def test_cloze():
d = getEmptyDeck() d = getEmptyDeck()
d.conf['currentModelId'] = 2 d.conf['currentModelId'] = d.modelId("Cloze")
f = d.newFact() f = d.newFact()
assert f.model().name == "Cloze" assert f.model().name == "Cloze"
# a cloze model with no clozes is empty # a cloze model with no clozes is empty
@ -162,8 +162,8 @@ def test_cloze():
def test_modelChange(): def test_modelChange():
deck = getEmptyDeck() deck = getEmptyDeck()
basic = deck.getModel(1) basic = deck.getModel(deck.modelId("Basic"))
cloze = deck.getModel(2) cloze = deck.getModel(deck.modelId("Cloze"))
# enable second template and add a fact # enable second template and add a fact
basic.templates[1]['actv'] = True basic.templates[1]['actv'] = True
basic.flush() basic.flush()

View file

@ -66,7 +66,7 @@ def teardown():
pass pass
@nose.with_setup(setup_local, teardown) @nose.with_setup(setup_local, teardown)
def test_changes(): def _test_changes():
deck2.scm = 0 deck2.scm = 0
dels = client.deletions(deck1.lastSync) dels = client.deletions(deck1.lastSync)
rem = server.changes(deck1.lastSync, dels) rem = server.changes(deck1.lastSync, dels)