anki/qt/aqt/importing.py

505 lines
16 KiB
Python
Raw Normal View History

# coding=utf-8
2019-02-05 04:59:03 +01:00
# Copyright: Ankitects Pty Ltd and contributors
# License: GNU AGPL, version 3 or later; http://www.gnu.org/licenses/agpl.html
2019-12-20 10:19:03 +01:00
import json
import os
import re
2019-12-20 10:19:03 +01:00
import shutil
import traceback
2017-09-30 11:29:21 +02:00
import unicodedata
2019-12-20 10:19:03 +01:00
import zipfile
import anki.importing as importing
2019-12-20 10:19:03 +01:00
import aqt.deckchooser
import aqt.forms
import aqt.modelchooser
2019-12-20 10:19:03 +01:00
from anki.hooks import addHook, remHook
from anki.lang import _, ngettext
from aqt import AnkiQt
from aqt.qt import *
2019-12-23 01:34:10 +01:00
from aqt.utils import (
askUser,
getFile,
getOnlyText,
openHelp,
showInfo,
showText,
showWarning,
tooltip,
)
2019-12-20 10:19:03 +01:00
class ChangeMap(QDialog):
    """Modal dialog for choosing what one column of the import file maps to.

    The list contains one "Map to <field>" row per field of the note type,
    followed by a "Map to Tags" row and an "Ignore field" row.
    """

    def __init__(self, mw: AnkiQt, model, current):
        """Populate the list and preselect the row that matches ``current``.

        ``current`` is compared with the field names of ``model``. When no
        field matches, ``"_tags"`` selects the tags row and any other value
        selects the ignore row.
        """
        QDialog.__init__(self, mw, Qt.Window)
        self.mw = mw
        self.model = model
        self.frm = aqt.forms.changemap.Ui_ChangeMap()
        self.frm.setupUi(self)
        listWidget = self.frm.fields
        matched = False
        # index of the first row after the per-field rows
        tagsRow = 0
        for row, fld in enumerate(self.model["flds"]):
            listWidget.addItem(QListWidgetItem(_("Map to %s") % fld["name"]))
            if fld["name"] == current:
                matched = True
                listWidget.setCurrentRow(row)
            tagsRow = row + 1
        ignoreRow = tagsRow + 1
        listWidget.addItem(QListWidgetItem(_("Map to Tags")))
        listWidget.addItem(QListWidgetItem(_("Ignore field")))
        if not matched:
            listWidget.setCurrentRow(tagsRow if current == "_tags" else ignoreRow)
        self.field = None

    def getField(self):
        """Run the dialog and return the chosen mapping.

        The result is a field name, ``"_tags"``, or None for "ignore".
        """
        self.exec_()
        return self.field

    def accept(self):
        """Translate the selected row into ``self.field`` and close."""
        noteFields = self.model["flds"]
        row = self.frm.fields.currentRow()
        if row < len(noteFields):
            chosen = noteFields[row]["name"]
        elif row == self.frm.fields.count() - 2:
            # second-to-last row is "Map to Tags"
            chosen = "_tags"
        else:
            chosen = None
        self.field = chosen
        QDialog.accept(self)

    def reject(self):
        """Treat dismissing the dialog the same as accepting it."""
        self.accept()
2019-12-23 01:34:10 +01:00
class ImportDialog(QDialog):
    """Dialog that configures and runs an import which needs a field mapping.

    It lets the user choose the note type and deck, override the field
    delimiter, map each column of the file to a note field, and start the
    import. The dialog is executed from the constructor.
    """

    def __init__(self, mw: AnkiQt, importer):
        """Build the UI for ``importer`` and run the dialog modally."""
        QDialog.__init__(self, mw, Qt.Window)
        self.mw = mw
        self.importer = importer
        self.frm = aqt.forms.importing.Ui_ImportDialog()
        self.frm.setupUi(self)
        self.frm.buttonBox.button(QDialogButtonBox.Help).clicked.connect(
            self.helpRequested
        )
        self.setupMappingFrame()
        self.setupOptions()
        self.modelChanged()
        self.frm.autoDetect.setVisible(self.importer.needDelimiter)
        addHook("currentModelChanged", self.modelChanged)
        self.frm.autoDetect.clicked.connect(self.onDelimiter)
        self.updateDelimiterButtonText()
        # restore the options used for the previous import from the profile
        self.frm.allowHTML.setChecked(self.mw.pm.profile.get("allowHTML", True))
        self.frm.importMode.currentIndexChanged.connect(self.importModeChanged)
        self.frm.importMode.setCurrentIndex(self.mw.pm.profile.get("importMode", 1))
        # import button
        b = QPushButton(_("Import"))
        self.frm.buttonBox.addButton(b, QDialogButtonBox.AcceptRole)
        self.exec_()

    def setupOptions(self):
        """Create the note type and deck choosers."""
        self.model = self.mw.col.models.current()
        self.modelChooser = aqt.modelchooser.ModelChooser(
            self.mw, self.frm.modelArea, label=False
        )
        self.deck = aqt.deckchooser.DeckChooser(self.mw, self.frm.deckArea, label=False)

    def modelChanged(self):
        """Point the importer at the current note type and rebuild the mapping."""
        self.importer.model = self.mw.col.models.current()
        self.importer.initMapping()
        self.showMapping()

    def onDelimiter(self):
        """Ask the user for a field delimiter and re-read the file with it.

        An empty answer falls back to a tab. Anything longer than a single
        character is rejected with a warning.
        """
        delim = (
            getOnlyText(
                _(
                    """\
By default, Anki will detect the character between fields, such as
a tab, comma, and so on. If Anki is detecting the character incorrectly,
you can enter it here. Use \\t to represent tab."""
                ),
                self,
                help="importing",
            )
            or "\t"
        )
        delim = delim.replace("\\t", "\t")
        if len(delim) > 1:
            showWarning(
                _(
                    "Multi-character separators are not supported. "
                    "Please enter one character only."
                )
            )
            return
        self.hideMapping()

        def updateDelim():
            self.importer.delimiter = delim
            self.importer.updateDelimiter()

        self.showMapping(hook=updateDelim)
        self.updateDelimiterButtonText()

    def updateDelimiterButtonText(self):
        """Show the delimiter currently in effect on the auto-detect button."""
        if not self.importer.needDelimiter:
            return
        if self.importer.delimiter:
            d = self.importer.delimiter
        else:
            d = self.importer.dialect.delimiter
        if d == "\t":
            d = _("Tab")
        elif d == ",":
            d = _("Comma")
        elif d == " ":
            d = _("Space")
        elif d == ";":
            d = _("Semicolon")
        elif d == ":":
            d = _("Colon")
        else:
            d = repr(d)
        txt = _("Fields separated by: %s") % d
        self.frm.autoDetect.setText(txt)

    def accept(self):
        """Validate the mapping, store the options and run the import.

        The chosen options are written to both the importer and the profile.
        On failure a message is shown and the dialog stays open; on success
        the dialog is closed, the import log is shown and the main window is
        reset.
        """
        self.importer.mapping = self.mapping
        if not self.importer.mappingOk():
            showWarning(_("The first field of the note type must be mapped."))
            return
        self.importer.importMode = self.frm.importMode.currentIndex()
        self.mw.pm.profile["importMode"] = self.importer.importMode
        self.importer.allowHTML = self.frm.allowHTML.isChecked()
        self.mw.pm.profile["allowHTML"] = self.importer.allowHTML
        if self.frm.tagModifiedCheck.isChecked():
            self.importer.tagModified = self.frm.tagModifiedTag.text()
            self.mw.pm.profile["tagModified"] = self.importer.tagModified
        did = self.deck.selectedId()
        if did != self.importer.model["did"]:
            self.importer.model["did"] = did
            self.mw.col.models.save(self.importer.model, updateReqs=False)
        self.mw.col.decks.select(did)
        self.mw.progress.start(immediate=True)
        self.mw.checkpoint(_("Import"))
        try:
            self.importer.run()
        except UnicodeDecodeError:
            showUnicodeWarning()
            return
        except Exception as e:
            msg = _("Import failed.\n")
            err = repr(str(e))
            if "1-character string" in err:
                msg += err
            elif "invalidTempFolder" in err:
                msg += self.mw.errorHandler.tempFolderMsg()
            else:
                msg += traceback.format_exc()
            showText(msg)
            return
        finally:
            self.mw.progress.finish()
        txt = _("Importing complete.") + "\n"
        if self.importer.log:
            txt += "\n".join(self.importer.log)
        self.close()
        showText(txt)
        self.mw.reset()

    def setupMappingFrame(self):
        """Create the container that holds the (replaceable) mapping grid."""
        # qt seems to have a bug with adding/removing from a grid, so we add
        # to a separate object and add/remove that instead
        self.frame = QFrame(self.frm.mappingArea)
        self.frm.mappingArea.setWidget(self.frame)
        self.mapbox = QVBoxLayout(self.frame)
        self.mapbox.setContentsMargins(0, 0, 0, 0)
        self.mapwidget = None

    def hideMapping(self):
        """Hide the mapping group box."""
        self.frm.mappingGroup.hide()

    def showMapping(self, keepMapping=False, hook=None):
        """Rebuild and show the grid describing the current field mapping.

        ``hook``, if given, is called first. Unless ``keepMapping`` is true
        the mapping is then re-read from the importer.
        """
        if hook:
            hook()
        if not keepMapping:
            self.mapping = self.importer.mapping
        self.frm.mappingGroup.show()
        assert self.importer.fields()
        # set up the mapping grid
        if self.mapwidget:
            self.mapbox.removeWidget(self.mapwidget)
            self.mapwidget.deleteLater()
        self.mapwidget = QWidget()
        self.mapbox.addWidget(self.mapwidget)
        self.grid = QGridLayout(self.mapwidget)
        self.mapwidget.setLayout(self.grid)
        self.grid.setContentsMargins(3, 3, 3, 3)
        self.grid.setSpacing(6)
        for num, target in enumerate(self.mapping):
            text = _("Field <b>%d</b> of file is:") % (num + 1)
            self.grid.addWidget(QLabel(text), num, 0)
            if target == "_tags":
                text = _("mapped to <b>Tags</b>")
            elif target:
                text = _("mapped to <b>%s</b>") % target
            else:
                text = _("<ignored>")
            self.grid.addWidget(QLabel(text), num, 1)
            button = QPushButton(_("Change"))
            self.grid.addWidget(button, num, 2)
            # bind num as a default so each button keeps its own row index
            button.clicked.connect(
                lambda _checked, s=self, n=num: s.changeMappingNum(n)
            )

    def changeMappingNum(self, n):
        """Let the user remap column ``n`` and refresh the grid."""
        f = ChangeMap(self.mw, self.importer.model, self.mapping[n]).getField()
        try:
            # make sure we don't have it twice
            index = self.mapping.index(f)
            self.mapping[index] = None
        except ValueError:
            pass
        self.mapping[n] = f
        if getattr(self.importer, "delimiter", False):
            self.savedDelimiter = self.importer.delimiter

            def updateDelim():
                self.importer.delimiter = self.savedDelimiter

            self.showMapping(hook=updateDelim, keepMapping=True)
        else:
            self.showMapping(keepMapping=True)

    def reject(self):
        """Release the choosers and the model-change hook, then close."""
        self.modelChooser.cleanup()
        self.deck.cleanup()
        remHook("currentModelChanged", self.modelChanged)
        QDialog.reject(self)

    def helpRequested(self):
        """Open the "importing" help page."""
        openHelp("importing")

    def importModeChanged(self, newImportMode):
        """Enable the tag-modified controls only when import mode 0 is selected."""
        allowTagModified = newImportMode == 0
        self.frm.tagModifiedCheck.setEnabled(allowTagModified)
        self.frm.tagModifiedTag.setEnabled(allowTagModified)
def showUnicodeWarning():
    """Show the standard warning for a file that is not in UTF-8 format."""
    message = _(
        "Selected file was not in UTF-8 format. Please see the "
        "importing section of the manual."
    )
    showWarning(message)
def onImport(mw):
    """Prompt for a file to import and pass it on to importFile().

    Nothing happens if the user cancels the file dialog. Files ending in
    .anki or .anki2 are not imported; an explanatory message is shown instead.
    """
    filters = ";;".join(entry[0] for entry in importing.Importers)
    chosen = getFile(mw, _("Import"), None, key="import", filter=filters)
    if not chosen:
        return
    path = str(chosen)
    extension = os.path.splitext(path)[1].lower()

    notice = None
    if extension == ".anki":
        notice = _(
            ".anki files are from a very old version of Anki. You can import them with Anki 2.0, available on the Anki website."
        )
    elif extension == ".anki2":
        notice = _(
            ".anki2 files are not directly importable - please import the .apkg or .zip file you have received instead."
        )
    if notice is not None:
        showInfo(notice)
        return

    importFile(mw, path)
2019-12-23 01:34:10 +01:00
def importFile(mw, file):
    """Import ``file`` with the importer that matches its extension.

    The importer is the first entry of ``importing.Importers`` whose filter
    description lists an extension the file name ends with; if none matches,
    the first registered importer is used. Importers that need a field
    mapping are handed to ImportDialog; the others are run directly, with
    failures reported to the user.
    """
    importerClass = None
    for entry in importing.Importers:
        # entry[0] is a filter description such as "Name (*.ext1 *.ext2)"
        extensions = re.findall(r"[( ]?\*\.(.+?)[) ]", entry[0])
        if any(file.endswith("." + mext) for mext in extensions):
            importerClass = entry[1]
            break
    if not importerClass:
        # if no matches, assume TSV
        importerClass = importing.Importers[0][1]
    importer = importerClass(mw.col, file)
    # need to show import dialog?
    if importer.needMapper:
        # make sure we can load the file first
        mw.progress.start(immediate=True)
        try:
            importer.open()
        except UnicodeDecodeError:
            showUnicodeWarning()
            return
        except Exception as e:
            msg = repr(str(e))
            if msg == "'unknownFormat'":
                showWarning(_("Unknown file format."))
            else:
                msg = _("Import failed. Debugging info:\n")
                msg += str(traceback.format_exc())
                showText(msg)
            return
        finally:
            mw.progress.finish()
        # the dialog runs itself from its constructor
        ImportDialog(mw, importer)
    else:
        # if it's an apkg/zip, first test it's a valid file
        if importer.__class__.__name__ == "AnkiPackageImporter":
            try:
                # the context manager closes the archive again after the probe
                with zipfile.ZipFile(importer.file) as z:
                    z.getinfo("collection.anki2")
            except Exception:
                showWarning(invalidZipMsg())
                return
            # we need to ask whether to import/replace
            if not setupApkgImport(mw, importer):
                return
        mw.progress.start(immediate=True)
        try:
            try:
                importer.run()
            finally:
                mw.progress.finish()
        except zipfile.BadZipfile:
            showWarning(invalidZipMsg())
        except Exception as e:
            err = repr(str(e))
            if "invalidFile" in err:
                msg = _(
                    """\
Invalid file. Please restore from backup."""
                )
                showWarning(msg)
            elif "invalidTempFolder" in err:
                showWarning(mw.errorHandler.tempFolderMsg())
            elif "readonly" in err:
                showWarning(
                    _(
                        """\
Unable to import from a read-only file."""
                    )
                )
            else:
                msg = _("Import failed.\n")
                msg += str(traceback.format_exc())
                showText(msg)
        else:
            log = "\n".join(importer.log)
            # a single-line log fits in a tooltip; longer ones get a window
            if "\n" not in log:
                tooltip(log)
            else:
                showText(log)
        mw.reset()
2019-12-23 01:34:10 +01:00
def invalidZipMsg():
    """Return the translated message shown for an invalid .apkg file."""
    message = _(
        """\
This file does not appear to be a valid .apkg file. If you're getting this \
error from a file downloaded from AnkiWeb, chances are that your download \
failed. Please try again, and if the problem persists, please try again \
with a different browser."""
    )
    return message
def setupApkgImport(mw, importer):
    """Decide whether an .apkg import adds to or replaces the collection.

    Returns True when the caller should go on and run the importer. Returns
    a falsy value when the file is a full collection package: False if the
    user declined the replacement, None once the replacement has been handed
    to replaceWithApkg().
    """
    name = os.path.basename(importer.file).lower()
    replacesCollection = (
        (name == "collection.apkg")
        or re.match("backup-.*\\.apkg", name)
        or name.endswith(".colpkg")
    )
    if replacesCollection:
        # restoring a backup skips the confirmation prompt
        confirmed = mw.restoringBackup or askUser(
            _(
                """\
This will delete your existing collection and replace it with the data in \
the file you're importing. Are you sure?"""
            ),
            msgfunc=QMessageBox.warning,
            defaultno=True,
        )
        if not confirmed:
            return False
        replaceWithApkg(mw, importer.file, mw.restoringBackup)
        return None
    # adding
    return True
2019-12-23 01:34:10 +01:00
def replaceWithApkg(mw, file, backup):
    """Unload the collection, then replace it with the contents of ``file``.

    The actual replacement is passed to ``mw.unloadCollection`` as a callback.
    """

    def afterUnload():
        return _replaceWithApkg(mw, file, backup)

    mw.unloadCollection(afterUnload)
2019-12-23 01:34:10 +01:00
def _replaceWithApkg(mw, file, backup):
mw.progress.start(immediate=True)
z = zipfile.ZipFile(file)
# v2 scheduler?
colname = "collection.anki21"
try:
z.getinfo(colname)
except KeyError:
colname = "collection.anki2"
try:
2019-12-23 01:34:10 +01:00
with z.open(colname) as source, open(mw.pm.collectionPath(), "wb") as target:
2018-02-05 06:30:57 +01:00
shutil.copyfileobj(source, target)
except:
mw.progress.finish()
showWarning(_("The provided file is not a valid .apkg file."))
return
# because users don't have a backup of media, it's safer to import new
# data and rely on them running a media db check to get rid of any
# unwanted media. in the future we might also want to deduplicate this
# step
d = os.path.join(mw.pm.profileFolder(), "collection.media")
2016-07-11 06:56:58 +02:00
for n, (cStr, file) in enumerate(
2019-12-23 01:34:10 +01:00
json.loads(z.read("media").decode("utf8")).items()
):
mw.progress.update(
ngettext("Processed %d media file", "Processed %d media files", n) % n
)
size = z.getinfo(cStr).file_size
2017-09-30 11:29:21 +02:00
dest = os.path.join(d, unicodedata.normalize("NFC", file))
# if we have a matching file size
if os.path.exists(dest) and size == os.stat(dest).st_size:
continue
data = z.read(cStr)
open(dest, "wb").write(data)
z.close()
# reload
if not mw.loadCollection():
mw.progress.finish()
return
if backup:
mw.col.modSchema(check=False)
mw.progress.finish()