anki/pylib/tests/test_importing.py

337 lines
9.9 KiB
Python
Raw Normal View History

2021-04-13 10:45:05 +02:00
# Copyright: Ankitects Pty Ltd and contributors
# License: GNU AGPL, version 3 or later; http://www.gnu.org/licenses/agpl.html
# coding: utf-8
2019-12-25 05:18:34 +01:00
import os
from tempfile import NamedTemporaryFile
import pytest
2020-07-19 05:27:31 +02:00
from anki.consts import *
2019-12-25 05:18:34 +01:00
from anki.importing import (
Anki2Importer,
AnkiPackageImporter,
MnemosyneImporter,
SupermemoXmlImporter,
TextImporter,
2019-12-25 05:18:34 +01:00
)
from tests.shared import getEmptyCol, getUpgradeDeckPath
# Directory containing this test module; fixture files under "support" are
# resolved relative to it.
testDir = os.path.dirname(__file__)
2019-12-25 05:18:34 +01:00
# Module-level placeholders. NOTE(review): neither name is referenced by the
# tests visible in this file -- possibly legacy; confirm before removing.
srcNotes = None
srcCards = None
def clear_tempfile(tf):
    """Close and delete a temporary file that was created with ``delete=False``.

    The handle is closed before the file is unlinked; background on why the
    tests manage the file by hand is in
    https://stackoverflow.com/questions/23212435/permission-denied-to-write-to-my-temporary-file

    Cleanup is best-effort: filesystem errors (for example the file having
    already been removed) are ignored. Only ``OSError`` is suppressed, so
    unrelated failures such as passing the wrong object are no longer hidden.

    Args:
        tf: an object with ``close()`` and ``name``, such as the value
            returned by ``tempfile.NamedTemporaryFile``.
    """
    try:
        tf.close()
        os.unlink(tf.name)
    except OSError:
        # Nothing useful can be done if the file is already gone or locked.
        pass
def test_anki2_mediadupes():
    """Check how Anki2Importer handles media files that already exist locally.

    Identical content must not be duplicated; differing content must cause
    the imported file to be renamed with the notetype id as a suffix.
    """
    col = getEmptyCol()
    # add a note that references a sound
    n = col.newNote()
    n["Front"] = "[sound:foo.mp3]"
    mid = n.model()["id"]
    col.addNote(n)
    # add that sound to media folder
    with open(os.path.join(col.media.dir(), "foo.mp3"), "w") as media_file:
        media_file.write("foo")
    col.close()
    # name the importer is expected to give the file when contents differ
    renamed = f"foo_{mid}.mp3"

    # it should be imported correctly into an empty deck
    empty = getEmptyCol()
    imp = Anki2Importer(empty, col.path)
    imp.run()
    assert os.listdir(empty.media.dir()) == ["foo.mp3"]

    # and importing again will not duplicate, as the file content matches
    empty.remove_cards_and_orphaned_notes(empty.db.list("select id from cards"))
    imp = Anki2Importer(empty, col.path)
    imp.run()
    assert os.listdir(empty.media.dir()) == ["foo.mp3"]
    n = empty.get_note(empty.db.scalar("select id from notes"))
    assert "foo.mp3" in n.fields[0]

    # if the local file content is different, an import should trigger a
    # rename
    empty.remove_cards_and_orphaned_notes(empty.db.list("select id from cards"))
    with open(os.path.join(empty.media.dir(), "foo.mp3"), "w") as media_file:
        media_file.write("bar")
    imp = Anki2Importer(empty, col.path)
    imp.run()
    assert sorted(os.listdir(empty.media.dir())) == ["foo.mp3", renamed]
    n = empty.get_note(empty.db.scalar("select id from notes"))
    assert "_" in n.fields[0]

    # if the localized media file already exists, we rewrite the note and
    # media
    empty.remove_cards_and_orphaned_notes(empty.db.list("select id from cards"))
    with open(os.path.join(empty.media.dir(), "foo.mp3"), "w") as media_file:
        media_file.write("bar")
    imp = Anki2Importer(empty, col.path)
    imp.run()
    assert sorted(os.listdir(empty.media.dir())) == ["foo.mp3", renamed]
    n = empty.get_note(empty.db.scalar("select id from notes"))
    assert "_" in n.fields[0]
    # release the destination collection, as the other tests in this file do
    empty.close()
2019-12-25 05:18:34 +01:00
def test_apkg():
    """Check media handling when importing the same .apkg repeatedly."""
    col = getEmptyCol()
    apkg = str(os.path.join(testDir, "support", "media.apkg"))
    imp = AnkiPackageImporter(col, apkg)
    assert os.listdir(col.media.dir()) == []
    imp.run()
    assert os.listdir(col.media.dir()) == ["foo.wav"]

    # importing again should be idempotent in terms of media
    col.remove_cards_and_orphaned_notes(col.db.list("select id from cards"))
    imp = AnkiPackageImporter(col, apkg)
    imp.run()
    assert os.listdir(col.media.dir()) == ["foo.wav"]

    # but if the local file has different data, it will rename
    col.remove_cards_and_orphaned_notes(col.db.list("select id from cards"))
    with open(os.path.join(col.media.dir(), "foo.wav"), "w") as media_file:
        media_file.write("xyz")
    imp = AnkiPackageImporter(col, apkg)
    imp.run()
    assert len(os.listdir(col.media.dir())) == 2
    # release the collection, as the other tests in this file do
    col.close()
2019-12-25 05:18:34 +01:00
def test_anki2_diffmodel_templates():
    """Importing a package whose template text changed updates the template."""
    # different from the above as this one tests only the template text being
    # changed, not the number of cards/fields
    dst = getEmptyCol()

    # import the first version of the model
    apkg_path = getUpgradeDeckPath("diffmodeltemplates-1.apkg")
    imp = AnkiPackageImporter(dst, apkg_path)
    imp.dupeOnSchemaChange = True
    imp.run()

    # then the version with updated template
    apkg_path = getUpgradeDeckPath("diffmodeltemplates-2.apkg")
    imp = AnkiPackageImporter(dst, apkg_path)
    imp.dupeOnSchemaChange = True
    imp.run()

    # collection should contain the note we imported
    assert dst.noteCount() == 1
    # the front template should contain the text added in the 2nd package
    tcid = dst.findCards("")[0]  # only 1 note in collection
    tnote = dst.getCard(tcid).note()
    assert "Changed Front Template" in tnote.cards()[0].template()["qfmt"]
    # release the destination collection, as the other tests in this file do
    dst.close()
2019-12-25 05:18:34 +01:00
def test_anki2_updates():
    """Check the added/dupes/updated counters across repeated imports."""
    # create a new empty deck
    dst = getEmptyCol()
    apkg_path = getUpgradeDeckPath("update1.apkg")
    imp = AnkiPackageImporter(dst, apkg_path)
    imp.run()
    assert imp.dupes == 0
    assert imp.added == 1
    assert imp.updated == 0

    # importing again should be idempotent
    imp = AnkiPackageImporter(dst, apkg_path)
    imp.run()
    assert imp.dupes == 1
    assert imp.added == 0
    assert imp.updated == 0

    # importing a newer note should update
    assert dst.noteCount() == 1
    assert dst.db.scalar("select flds from notes").startswith("hello")
    apkg_path = getUpgradeDeckPath("update2.apkg")
    imp = AnkiPackageImporter(dst, apkg_path)
    imp.run()
    assert imp.dupes == 0
    assert imp.added == 0
    assert imp.updated == 1
    assert dst.noteCount() == 1
    assert dst.db.scalar("select flds from notes").startswith("goodbye")
    # release the destination collection, as the other tests in this file do
    dst.close()
2019-12-25 05:18:34 +01:00
def test_csv():
    """Run TextImporter over a two-field text file in each import mode."""
    col = getEmptyCol()
    source_path = str(os.path.join(testDir, "support", "text-2fields.txt"))
    importer = TextImporter(col, source_path)
    importer.initMapping()

    # first pass: four problems - too many & too few fields, a missing
    # front, and a duplicate entry
    importer.run()
    assert len(importer.log) == 5
    assert importer.total == 5

    # a second pass should update instead
    importer.run()
    assert len(importer.log) == 10
    assert importer.total == 5

    # importing must not clobber tags when they are unmapped
    first_note = col.get_note(col.db.scalar("select id from notes"))
    first_note.add_tag("test")
    first_note.flush()
    importer.run()
    first_note.load()
    assert first_note.tags == ["test"]

    # in add-only mode, count will be 0
    importer.importMode = 1
    importer.run()
    assert importer.total == 0

    # and in dupes mode, everything is reimported
    assert col.cardCount() == 5
    importer.importMode = 2
    importer.run()
    # includes repeated field
    assert importer.total == 6
    assert col.cardCount() == 11
    col.close()
2019-12-25 05:18:34 +01:00
def test_csv2():
    """An update that leaves a field unmapped must keep that field's value."""
    col = getEmptyCol()
    models = col.models
    notetype = models.current()
    extra_field = models.newField("Three")
    models.addField(notetype, extra_field)
    models.save(notetype)

    existing = col.newNote()
    existing["Front"] = "1"
    existing["Back"] = "2"
    existing["Three"] = "3"
    col.addNote(existing)

    # an update with unmapped fields should not clobber those fields
    source_path = str(os.path.join(testDir, "support", "text-update.txt"))
    importer = TextImporter(col, source_path)
    importer.initMapping()
    importer.run()

    existing.load()
    assert existing["Front"] == "1"
    assert existing["Back"] == "x"
    assert existing["Three"] == "3"
    col.close()
2019-12-25 05:18:34 +01:00
def test_tsv_tag_modified():
    """A note updated by a TSV import gains the configured tagModified tag."""
    col = getEmptyCol()
    models = col.models
    notetype = models.current()
    extra_field = models.newField("Top")
    models.addField(notetype, extra_field)
    models.save(notetype)

    existing = col.newNote()
    existing["Front"] = "1"
    existing["Back"] = "2"
    existing["Top"] = "3"
    existing.add_tag("four")
    col.addNote(existing)

    # https://stackoverflow.com/questions/23212435/permission-denied-to-write-to-my-temporary-file
    with NamedTemporaryFile(mode="w", delete=False) as tf:
        tf.write("1\tb\tc\n")
        tf.flush()
        importer = TextImporter(col, tf.name)
        importer.initMapping()
        importer.tagModified = "boom"
        importer.run()
        clear_tempfile(tf)

    existing.load()
    assert existing["Front"] == "1"
    assert existing["Back"] == "b"
    assert existing["Top"] == "c"
    assert "four" in existing.tags
    assert "boom" in existing.tags
    assert len(existing.tags) == 2
    assert importer.updateCount == 1
    col.close()
def test_tsv_tag_multiple_tags():
    """A space-separated tagModified value is merged into the note's tags."""
    col = getEmptyCol()
    models = col.models
    notetype = models.current()
    extra_field = models.newField("Top")
    models.addField(notetype, extra_field)
    models.save(notetype)

    existing = col.newNote()
    existing["Front"] = "1"
    existing["Back"] = "2"
    existing["Top"] = "3"
    existing.add_tag("four")
    existing.add_tag("five")
    col.addNote(existing)

    # https://stackoverflow.com/questions/23212435/permission-denied-to-write-to-my-temporary-file
    with NamedTemporaryFile(mode="w", delete=False) as tf:
        tf.write("1\tb\tc\n")
        tf.flush()
        importer = TextImporter(col, tf.name)
        importer.initMapping()
        importer.tagModified = "five six"
        importer.run()
        clear_tempfile(tf)

    existing.load()
    assert existing["Front"] == "1"
    assert existing["Back"] == "b"
    assert existing["Top"] == "c"
    # "five" was already present, so only "six" is new
    assert sorted(existing.tags) == ["five", "four", "six"]
    col.close()
def test_csv_tag_only_if_modified():
    """Importing a row identical to the note must not apply tagModified."""
    col = getEmptyCol()
    models = col.models
    notetype = models.current()
    extra_field = models.newField("Left")
    models.addField(notetype, extra_field)
    models.save(notetype)

    existing = col.newNote()
    existing["Front"] = "1"
    existing["Back"] = "2"
    existing["Left"] = "3"
    col.addNote(existing)

    # https://stackoverflow.com/questions/23212435/permission-denied-to-write-to-my-temporary-file
    with NamedTemporaryFile(mode="w", delete=False) as tf:
        tf.write("1,2,3\n")
        tf.flush()
        importer = TextImporter(col, tf.name)
        importer.initMapping()
        importer.tagModified = "right"
        importer.run()
        clear_tempfile(tf)

    existing.load()
    assert existing.tags == []
    assert importer.updateCount == 0
    col.close()
@pytest.mark.filterwarnings("ignore:Using or importing the ABCs")
def test_supermemo_xml_01_unicode():
    """Import a SuperMemo XML fixture and check the resulting card's stats."""
    col = getEmptyCol()
    xml_path = str(os.path.join(testDir, "support", "supermemo1.xml"))
    importer = SupermemoXmlImporter(col, xml_path)
    # debugging aid, left disabled:
    # importer.META.logToStdOutput = True
    importer.run()
    assert importer.total == 1

    card_id = col.db.scalar("select id from cards")
    card = col.getCard(card_id)
    # Applies A Factor-to-E Factor conversion
    assert card.factor == 2879
    assert card.reps == 7
    col.close()
2019-12-25 05:18:34 +01:00
def test_mnemo():
    """Import a Mnemosyne database fixture and check cards and tags."""
    col = getEmptyCol()
    db_path = str(os.path.join(testDir, "support", "mnemo.db"))
    importer = MnemosyneImporter(col, db_path)
    importer.run()

    assert col.cardCount() == 7
    assert "a_longer_tag" in col.tags.all()
    new_card_count = col.db.scalar(
        f"select count() from cards where type = {CARD_TYPE_NEW}"
    )
    assert new_card_count == 1
    col.close()