2022-09-10 18:26:52 +02:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
|
|
|
# This file is part of the Calibre-Web (https://github.com/janeczku/calibre-web)
|
|
|
|
# Copyright (C) 2020 monkey
|
|
|
|
#
|
|
|
|
# This program is free software: you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2022-09-14 17:03:48 +02:00
|
|
|
|
2022-09-10 18:26:52 +02:00
|
|
|
import os
|
2022-09-14 17:03:48 +02:00
|
|
|
from lxml import objectify
|
2022-09-10 18:26:52 +02:00
|
|
|
from urllib.request import urlopen
|
|
|
|
from lxml import etree
|
|
|
|
from html import escape
|
|
|
|
|
2023-02-25 16:31:48 +01:00
|
|
|
from cps import config, db, gdriveutils, logger
|
|
|
|
from cps.services.worker import CalibreTask
|
2022-09-10 18:26:52 +02:00
|
|
|
from flask_babel import lazy_gettext as N_
|
|
|
|
|
|
|
|
# XML namespace URIs used in the generated OPF package document.
OPF_NAMESPACE = "http://www.idpf.org/2007/opf"
PURL_NAMESPACE = "http://purl.org/dc/elements/1.1/"

# "{namespace-uri}" prefixes used to build namespace-qualified tag and
# attribute names (e.g. PURL + "title").
OPF = "{%s}" % (OPF_NAMESPACE,)
PURL = "{%s}" % (PURL_NAMESPACE,)

# Register the prefixes with lxml under the names "opf" and "dc".
for _prefix, _uri in (("opf", OPF_NAMESPACE), ("dc", PURL_NAMESPACE)):
    etree.register_namespace(_prefix, _uri)
del _prefix, _uri

OPF_NS = {None: OPF_NAMESPACE}  # the default namespace (no prefix)
NSMAP = dict(dc=PURL_NAMESPACE, opf=OPF_NAMESPACE)
|
|
|
|
|
|
|
|
|
|
|
|
class TaskBackupMetadata(CalibreTask):
    """Background task that writes ``metadata.opf`` backups for books.

    Depending on ``set_dirty`` the task either marks every book in the
    library as needing a backup, or processes the books currently listed in
    ``db.Metadata_Dirtied`` and writes a fresh ``metadata.opf`` for each.
    """

    def __init__(self, export_language="en",
                 translated_title="Cover",
                 set_dirty=False,
                 task_message=N_('Backing up Metadata')):
        """Create the task.

        :param export_language: language code written as ``dc:language`` for
            books that have no language assigned.
        :param translated_title: title attribute of the cover reference in
            the OPF ``guide`` element.
        :param set_dirty: when true, ``run`` queues all books for backup
            instead of performing the backup.
        :param task_message: message passed to the ``CalibreTask`` base class.
        """
        super().__init__(task_message)
        self.log = logger.create()
        self.calibre_db = db.CalibreDB(expire_on_commit=False, init=True)
        self.export_language = export_language
        self.translated_title = translated_title
        self.set_dirty = set_dirty

    def run(self, worker_thread):
        """Entry point of the task: queue all books or back up dirty ones."""
        if self.set_dirty:
            self.set_all_books_dirty()
        else:
            self.backup_metadata()

    def set_all_books_dirty(self):
        """Mark every book in the library as needing a metadata backup.

        Errors are logged and reported through ``_handleError``; the database
        session is rolled back on failure and closed in every case.
        """
        try:
            books = self.calibre_db.session.query(db.Books).all()
            for book in books:
                self.calibre_db.set_metadata_dirty(book.id)
            self.calibre_db.session.commit()
            self._handleSuccess()
        except Exception as ex:
            self.log.debug('Error adding book for backup: ' + str(ex))
            self._handleError('Error adding book for backup: ' + str(ex))
            self.calibre_db.session.rollback()
        finally:
            self.calibre_db.session.close()

    def backup_metadata(self):
        """Write a metadata backup for every book listed as dirty.

        For each ``Metadata_Dirtied`` entry the entry is deleted and committed
        first, then the backup for the referenced book is created. Progress is
        updated after every entry. Any exception aborts the run, is reported
        through ``_handleError`` and rolls the session back; the session is
        closed in every case.
        """
        # Bound before the try block so the error handler can always refer
        # to it, even when the very first query fails.
        book = None
        try:
            metadata_backup = self.calibre_db.session.query(db.Metadata_Dirtied).all()
            custom_columns = (self.calibre_db.session.query(db.CustomColumns)
                              .filter(db.CustomColumns.mark_for_delete == 0)
                              .filter(db.CustomColumns.datatype.notin_(db.cc_exceptions))
                              .order_by(db.CustomColumns.label).all())
            count = len(metadata_backup)
            for processed, backup in enumerate(metadata_backup, start=1):
                book = self.calibre_db.session.query(db.Books).filter(db.Books.id == backup.book).one_or_none()
                # The dirty marker is removed before the backup is written.
                self.calibre_db.session.query(db.Metadata_Dirtied).filter(
                    db.Metadata_Dirtied.book == backup.book).delete()
                self.calibre_db.session.commit()
                if book:
                    self.open_metadata(book, custom_columns)
                else:
                    self.log.error("Book {} not found in database".format(backup.book))
                self.progress = (1.0 / count) * processed
            self._handleSuccess()
        except Exception as ex:
            b = "NaN" if not hasattr(book, 'id') else book.id
            self.log.debug('Error creating metadata backup for book {}: '.format(b) + str(ex))
            self._handleError('Error creating metadata backup: ' + str(ex))
            self.calibre_db.session.rollback()
        finally:
            self.calibre_db.session.close()

    def open_metadata(self, book, custom_columns):
        """Create the metadata backup for a single book.

        :param book: the ``db.Books`` row to back up.
        :param custom_columns: custom column definitions to export.
        :raises Exception: if Google Drive is configured but not ready, the
            remote metadata link cannot be found or opened, or writing the
            local file fails.
        """
        if config.config_use_google_drive:
            # NOTE(review): in Google Drive mode this method only verifies
            # that the remote metadata file can be opened; no backup is
            # written here.
            if not gdriveutils.is_gdrive_ready():
                raise Exception('Google Drive is configured but not ready')

            web_content_link = gdriveutils.get_metadata_backup_via_gdrive(book.path)
            if not web_content_link:
                raise Exception('Google Drive cover url not found')

            try:
                stream = urlopen(web_content_link)
            except Exception as ex:
                # Log and let the exception bubble up to the calling function
                self.log.debug('Error reading metadata.opf: ' + str(ex))  # ToDo Check whats going on
                raise
            else:
                stream.close()
        else:
            # ToDo: Handle book folder not found or not readable
            book_metadata_filepath = os.path.join(config.config_calibre_dir, book.path, 'metadata.opf')
            self.create_new_metadata_backup(book, custom_columns, book_metadata_filepath)

    @staticmethod
    def _format_timestamp(d):
        """Return *d* as ``YYYY-MM-DDTHH:MM:SS`` with a zero-padded year."""
        return '{d.year:04}-{d.month:02}-{d.day:02}T{d.hour:02}:{d.minute:02}:{d.second:02}'.format(d=d)

    @staticmethod
    def _add_dc(metadata, tag, text):
        """Append a Dublin Core element ``dc:<tag>`` with *text* and return it."""
        element = etree.SubElement(metadata, PURL + tag, nsmap=NSMAP)
        element.text = text
        return element

    @staticmethod
    def _add_meta(metadata, name, content):
        """Append a ``<meta name=... content=...>`` element to *metadata*."""
        return etree.SubElement(metadata, "meta", name=name, content=content, nsmap=NSMAP)

    def create_new_metadata_backup(self, book, custom_columns, book_metadata_filepath):
        """Build an OPF 2.0 package for *book* and write it to disk.

        :param book: the ``db.Books`` row whose metadata is exported.
        :param custom_columns: custom column definitions; each one is
            exported as a ``calibre:user_metadata:#<label>`` meta element.
        :param book_metadata_filepath: destination path of ``metadata.opf``.
        :raises Exception: if the file cannot be written.
        """
        # Imported locally so this block does not rely on a module-level import.
        import json

        # generate root package element
        package = etree.Element(OPF + "package", nsmap=OPF_NS)
        package.set("unique-identifier", "uuid_id")
        package.set("version", "2.0")

        # generate metadata element and all sub elements of it
        metadata = etree.SubElement(package, "metadata", nsmap=NSMAP)

        calibre_identifier = etree.SubElement(metadata, PURL + "identifier", id="calibre_id", nsmap=NSMAP)
        calibre_identifier.set(OPF + "scheme", "calibre")
        calibre_identifier.text = str(book.id)

        uuid_identifier = etree.SubElement(metadata, PURL + "identifier", id="uuid_id", nsmap=NSMAP)
        uuid_identifier.set(OPF + "scheme", "uuid")
        uuid_identifier.text = book.uuid

        self._add_dc(metadata, "title", book.title)

        for author in book.authors:
            creator = self._add_dc(metadata, "creator", str(author.name))
            creator.set(OPF + "file-as", book.author_sort)  # ToDo Check
            creator.set(OPF + "role", "aut")

        contributor = self._add_dc(metadata, "contributor", "calibre (5.7.2) [https://calibre-ebook.com]")
        contributor.set(OPF + "file-as", "calibre")  # ToDo Check
        contributor.set(OPF + "role", "bkp")

        self._add_dc(metadata, "date", self._format_timestamp(book.pubdate))

        # Descriptions are only exported when the first comment has text.
        if book.comments and book.comments[0].text:
            for comment in book.comments:
                self._add_dc(metadata, "description", comment.text)

        for publisher in book.publishers:
            self._add_dc(metadata, "publisher", str(publisher.name))

        if not book.languages:
            # Fall back to the configured export language.
            self._add_dc(metadata, "language", self.export_language)
        else:
            for language in book.languages:
                self._add_dc(metadata, "language", str(language.lang_code))

        for tag in book.tags:
            self._add_dc(metadata, "subject", str(tag.name))

        # Serialise with json so author names containing quotes or
        # backslashes still produce a valid JSON object; ensure_ascii=False
        # keeps non-ASCII names unescaped.
        author_link_map = json.dumps({str(a.name): "" for a in book.authors}, ensure_ascii=False)
        self._add_meta(metadata, "calibre:author_link_map", author_link_map)

        for series in book.series:
            self._add_meta(metadata, "calibre:series", str(series.name))
        if book.series:
            self._add_meta(metadata, "calibre:series_index", str(book.series_index))

        if len(book.ratings) and book.ratings[0].rating > 0:
            self._add_meta(metadata, "calibre:rating", str(book.ratings[0].rating))

        self._add_meta(metadata, "calibre:timestamp", self._format_timestamp(book.timestamp))
        self._add_meta(metadata, "calibre:title_sort", book.sort)

        # One meta element per custom column; only the first stored entry of
        # a column is exported, and the running index is passed to to_json().
        for sequence, cc in enumerate(custom_columns):
            value = None
            extra = None
            cc_entry = getattr(book, "custom_column_" + str(cc.id))
            if len(cc_entry):
                value = cc_entry[0].value
                extra = getattr(cc_entry[0], "extra", None)
            self._add_meta(metadata, "calibre:user_metadata:#{}".format(cc.label),
                           cc.to_json(value, extra, sequence))

        # generate guide element and all sub elements of it
        # Title is translated from default export language
        guide = etree.SubElement(package, "guide")
        etree.SubElement(guide, "reference", type="cover", title=self.translated_title, href="cover.jpg")

        # finalize everything and write the document
        doc = etree.ElementTree(package)
        try:
            with open(book_metadata_filepath, 'wb') as f:
                doc.write(f, xml_declaration=True, encoding='utf-8', pretty_print=True)
        except Exception as ex:
            # Chain the original error so its traceback is not lost.
            raise Exception('Writing Metadata failed with error: {} '.format(ex)) from ex

    @property
    def name(self):
        """Short display name of the task."""
        return "Metadata backup"

    # needed for logging
    def __str__(self):
        if self.set_dirty:
            return "Queue all books for metadata backup"
        return "Perform metadata backup"

    @property
    def is_cancellable(self):
        """Report the task as cancellable."""
        return True
|