1
0
mirror of https://github.com/janeczku/calibre-web synced 2025-01-12 10:20:29 +00:00

fb2 uploading

This commit is contained in:
Pavel Yakunin 2016-06-18 16:50:32 +03:00
parent 43d6077815
commit 8b5bd61467
2 changed files with 75 additions and 2 deletions

View File

@ -22,16 +22,25 @@ try:
import epub
use_epub_meta = True
except ImportError, e:
logger.warning('cannot import PyPDF2, extracting pdf metadata will not work: %s', e)
logger.warning('cannot import PyPDF2, extracting epub metadata will not work: %s', e)
use_epub_meta = False
# FB2 support is optional: the fb2 module imports lxml at load time, so when
# that import fails we only record use_fb2_meta = False (checked by process()
# before it calls fb2.get_fb2_info) and log a warning.
try:
import fb2
use_fb2_meta = True
except ImportError, e:
logger.warning('cannot import lxml, extracting fb2 metadata will not work: %s', e)
use_fb2_meta = False
def process(tmp_file_path, original_file_name, original_file_extension):
try:
if ".PDF" == original_file_extension.upper():
return pdf_meta(tmp_file_path, original_file_name, original_file_extension)
if ".EPUB" == original_file_extension.upper() and use_pdf_meta == True:
if ".EPUB" == original_file_extension.upper() and use_epub_meta == True:
return epub.get_epub_info(tmp_file_path, original_file_name, original_file_extension)
if ".FB2" == original_file_extension.upper() and use_fb2_meta == True:
return fb2.get_fb2_info(tmp_file_path, original_file_name, original_file_extension)
except Exception, e:
logger.warning('cannot parse metadata, using default: %s', e)

64
cps/fb2.py Normal file
View File

@ -0,0 +1,64 @@
from lxml import etree
import os
import uploader
def get_fb2_info(tmp_file_path, original_file_name, original_file_extension):
    """Extract book metadata from a FictionBook 2 (.fb2) file.

    Parses the XML document at ``tmp_file_path`` and reads the authors and
    the book title from ``<title-info>`` and the book name from
    ``<publish-info>``. Optional elements that are absent no longer abort the
    extraction: missing name parts are skipped, a missing title falls back to
    ``original_file_name`` and a missing description becomes an empty string.

    :param tmp_file_path: path of the uploaded file on disk.
    :param original_file_name: name the file was uploaded with; used as the
        title when the document has no ``<book-title>``.
    :param original_file_extension: file extension, passed through unchanged.
    :return: ``uploader.BookMeta`` with ``cover=None`` and empty tags/series.
    :raises IOError: if the file cannot be opened.
    :raises lxml.etree.XMLSyntaxError: if the file is not well-formed XML.
    """
    ns = {
        'fb': 'http://www.gribuser.ru/xml/fictionbook/2.0',
        # Was 'ttp://...' (missing "h"); unused by the queries below but
        # kept correct for future cover/link extraction.
        'l': 'http://www.w3.org/1999/xlink',
    }
    title_info = '/fb:FictionBook/fb:description/fb:title-info'
    publish_info = '/fb:FictionBook/fb:description/fb:publish-info'

    # Binary mode hands the raw bytes to lxml so it can apply the encoding
    # named in the XML declaration; ``with`` guarantees the handle is closed.
    with open(tmp_file_path, 'rb') as fb2_file:
        tree = etree.fromstring(fb2_file.read())

    def first_text(element, path):
        """Return the first text node under ``path``, or None if absent."""
        found = element.xpath(path + '/text()', namespaces=ns)
        return found[0] if found else None

    def get_author(element):
        """Join whichever of first/middle/last name the <author> provides."""
        parts = [
            first_text(element, 'fb:' + tag)
            for tag in ('first-name', 'middle-name', 'last-name')
        ]
        return ' '.join(part for part in parts if part)

    author_names = [
        get_author(element)
        for element in tree.xpath(title_info + '/fb:author', namespaces=ns)
    ]
    # Drop authors that carry none of the three name parts (e.g. nickname
    # only) so the joined string has no empty entries.
    author = ", ".join(name for name in author_names if name)

    book_title = first_text(tree, title_info + '/fb:book-title')
    if book_title is not None:
        title = unicode(book_title)
    else:
        # Same fallback the EPUB extractor was written to use.
        title = original_file_name

    # NOTE(review): the description is read from <publish-info>/<book-name>,
    # as in the original code; <title-info>/<annotation> may be the better
    # source -- confirm before changing.
    book_name = first_text(tree, publish_info + '/fb:book-name')
    description = unicode(book_name) if book_name is not None else u''

    return uploader.BookMeta(
        file_path=tmp_file_path,
        extension=original_file_extension,
        title=title,
        author=author,
        cover=None,
        description=description,
        tags="",
        series="",
        series_id="")