~ubuntu-branches/debian/sid/calibre/sid

« back to all changes in this revision

Viewing changes to src/calibre/ebooks/metadata/pdf.py

Committer: Package Import Robot
Author(s): Martin Pitt
Date: 2014-02-27 07:48:06 UTC
Merged to: This revision was merged to the branch mainline in revision 74.
Revision ID: package-import@ubuntu.com-20140227074806-64wdebb3ptosxhhx

Tags: upstream-1.25.0+dfsg

Import upstream version 1.25.0+dfsg

files added:
manual/templates/epub_cover_template.html

recipes/disinformatico.recipe

recipes/gosc_full.recipe

recipes/icons/gosc_full.png

recipes/les_echos.recipe

resources/images/beautify.png

src/calibre/ebooks/metadata/xmp.py

src/calibre/gui2/tweak_book/diff/highlight.py

src/calibre/gui2/tweak_book/editor/smart

src/calibre/gui2/tweak_book/editor/smart/__init__.py

src/calibre/gui2/tweak_book/editor/smart/html.py

src/calibre/gui2/viewer/gestures.py

files removed:
recipes/icons/kdefamily_pl.png

recipes/kdefamily_pl.recipe

src/calibre/gui2/store/stores/foyles_uk_plugin.py

files modified:
Changelog.yaml

manual/conf.py

manual/conversion.rst

manual/custom.py

manual/diff.rst

manual/edit.rst

manual/epub.py

manual/faq.rst

manual/templates/layout.html

recipes/abc_es.recipe

recipes/ap.recipe

recipes/cosmopolitan_uk.recipe

recipes/cumhuriyet.recipe

recipes/gosc_niedzielny.recipe

recipes/kathemerini.recipe

recipes/mac_world_uk.recipe

recipes/nrc-nl-epub.recipe

recipes/nytimesbook.recipe

recipes/wired_it.recipe

resources/builtin_recipes.xml

resources/builtin_recipes.zip

resources/compiled_coffeescript.zip

resources/ebook-convert-complete.pickle

resources/images.qrc

resources/localization/locales.zip

resources/localization/stats.pickle

resources/quick_start.epub

setup/installer/__init__.py

setup/iso_639/pl.po

setup/iso_639/ru.po

setup/plugins_mirror.py

setup/resources.py

src/calibre/__init__.py

src/calibre/constants.py

src/calibre/customize/builtins.py

src/calibre/db/cache.py

src/calibre/debug.py

src/calibre/devices/kobo/driver.py

src/calibre/ebooks/chardet.py

src/calibre/ebooks/conversion/plugins/epub_output.py

src/calibre/ebooks/conversion/plugins/pdf_output.py

src/calibre/ebooks/html/input.py

src/calibre/ebooks/metadata/__init__.py

src/calibre/ebooks/metadata/meta.py

src/calibre/ebooks/metadata/opf2.py

src/calibre/ebooks/metadata/pdf.py

src/calibre/ebooks/metadata/sources/edelweiss.py

src/calibre/ebooks/mobi/reader/mobi8.py

src/calibre/ebooks/oeb/base.py

src/calibre/ebooks/oeb/display/paged.coffee

src/calibre/ebooks/oeb/parse_utils.py

src/calibre/ebooks/oeb/polish/check/links.py

src/calibre/ebooks/oeb/polish/check/main.py

src/calibre/ebooks/oeb/polish/check/parsing.py

src/calibre/ebooks/oeb/polish/choose.coffee

src/calibre/ebooks/oeb/polish/container.py

src/calibre/ebooks/oeb/polish/css.py

src/calibre/ebooks/oeb/polish/errors.py

src/calibre/ebooks/oeb/polish/font_stats.coffee

src/calibre/ebooks/oeb/polish/parsing.py

src/calibre/ebooks/oeb/polish/preview.coffee

src/calibre/ebooks/oeb/polish/split.py

src/calibre/ebooks/oeb/polish/tests/container.py

src/calibre/ebooks/oeb/polish/tests/parsing.py

src/calibre/ebooks/oeb/polish/toc.py

src/calibre/ebooks/oeb/polish/utils.py

src/calibre/ebooks/oeb/transforms/rasterize.py

src/calibre/ebooks/oeb/transforms/split.py

src/calibre/ebooks/pdf/render/from_html.py

src/calibre/ebooks/pdf/render/graphics.py

src/calibre/ebooks/pdf/render/serialize.py

src/calibre/gui2/__init__.py

src/calibre/gui2/actions/add.py

src/calibre/gui2/actions/copy_to_library.py

src/calibre/gui2/actions/next_match.py

src/calibre/gui2/actions/preferences.py

src/calibre/gui2/actions/restart.py

src/calibre/gui2/actions/similar_books.py

src/calibre/gui2/auto_add.py

src/calibre/gui2/comments_editor.py

src/calibre/gui2/complete2.py

src/calibre/gui2/dialogs/duplicates.py

src/calibre/gui2/dialogs/message_box.py

src/calibre/gui2/dialogs/metadata_bulk.py

src/calibre/gui2/email.py

src/calibre/gui2/init.py

src/calibre/gui2/jobs.py

src/calibre/gui2/layout.py

src/calibre/gui2/preferences/email.ui

src/calibre/gui2/preferences/email_ui.py

src/calibre/gui2/preferences/emailp.py

src/calibre/gui2/preferences/tweaks.py

src/calibre/gui2/preferences/tweaks.ui

src/calibre/gui2/preferences/tweaks_ui.py

src/calibre/gui2/progress_indicator/QProgressIndicator.cpp

src/calibre/gui2/progress_indicator/QProgressIndicator.h

src/calibre/gui2/progress_indicator/QProgressIndicator.sip

src/calibre/gui2/store/stores/amazon_de_plugin.py

src/calibre/gui2/store/stores/amazon_es_plugin.py

src/calibre/gui2/store/stores/amazon_fr_plugin.py

src/calibre/gui2/store/stores/amazon_it_plugin.py

src/calibre/gui2/store/stores/amazon_uk_plugin.py

src/calibre/gui2/store/stores/cdp_plugin.py

src/calibre/gui2/store/stores/mills_boon_uk_plugin.py

src/calibre/gui2/store/stores/publio_plugin.py

src/calibre/gui2/store/stores/woblink_plugin.py

src/calibre/gui2/store/stores/wolnelektury_plugin.py

src/calibre/gui2/toc/location.py

src/calibre/gui2/toc/main.py

src/calibre/gui2/tweak_book/boss.py

src/calibre/gui2/tweak_book/diff/main.py

src/calibre/gui2/tweak_book/diff/view.py

src/calibre/gui2/tweak_book/editor/syntax/base.py

src/calibre/gui2/tweak_book/editor/syntax/html.py

src/calibre/gui2/tweak_book/editor/text.py

src/calibre/gui2/tweak_book/editor/themes.py

src/calibre/gui2/tweak_book/editor/widget.py

src/calibre/gui2/tweak_book/file_list.py

src/calibre/gui2/tweak_book/main.py

src/calibre/gui2/tweak_book/preview.py

src/calibre/gui2/tweak_book/save.py

src/calibre/gui2/tweak_book/ui.py

src/calibre/gui2/tweak_book/undo.py

src/calibre/gui2/viewer/documentview.py

src/calibre/gui2/viewer/main_ui.py

src/calibre/gui2/viewer/toc.py

src/calibre/library/catalogs/epub_mobi.py

src/calibre/library/catalogs/epub_mobi_builder.py

src/calibre/library/cli.py

src/calibre/linux.py

src/calibre/translations/af.po

src/calibre/translations/ar.po

src/calibre/translations/ast.po

src/calibre/translations/az.po

src/calibre/translations/ber.po

src/calibre/translations/bg.po

src/calibre/translations/bn.po

src/calibre/translations/br.po

src/calibre/translations/bs.po

src/calibre/translations/ca.po

src/calibre/translations/calibre.pot

src/calibre/translations/cs.po

src/calibre/translations/cy.po

src/calibre/translations/da.po

src/calibre/translations/de.po

src/calibre/translations/el.po

src/calibre/translations/en_AU.po

src/calibre/translations/en_CA.po

src/calibre/translations/en_GB.po

src/calibre/translations/eo.po

src/calibre/translations/es.po

src/calibre/translations/et.po

src/calibre/translations/eu.po

src/calibre/translations/fa.po

src/calibre/translations/fi.po

src/calibre/translations/fil.po

src/calibre/translations/fo.po

src/calibre/translations/fr.po

src/calibre/translations/fr_CA.po

src/calibre/translations/fur.po

src/calibre/translations/gl.po

src/calibre/translations/gu.po

src/calibre/translations/he.po

src/calibre/translations/hi.po

src/calibre/translations/him.po

src/calibre/translations/hr.po

src/calibre/translations/hu.po

src/calibre/translations/id.po

src/calibre/translations/is.po

src/calibre/translations/it.po

src/calibre/translations/ja.po

src/calibre/translations/jv.po

src/calibre/translations/ka.po

src/calibre/translations/kn.po

src/calibre/translations/ko.po

src/calibre/translations/ku.po

src/calibre/translations/lt.po

src/calibre/translations/ltg.po

src/calibre/translations/lv.po

src/calibre/translations/mk.po

src/calibre/translations/ml.po

src/calibre/translations/mn.po

src/calibre/translations/mr.po

src/calibre/translations/ms.po

src/calibre/translations/my.po

src/calibre/translations/nb.po

src/calibre/translations/nds.po

src/calibre/translations/nl.po

src/calibre/translations/nn.po

src/calibre/translations/oc.po

src/calibre/translations/pa.po

src/calibre/translations/pl.po

src/calibre/translations/pt.po

src/calibre/translations/pt_BR.po

src/calibre/translations/ro.po

src/calibre/translations/ru.po

src/calibre/translations/sc.po

src/calibre/translations/si.po

src/calibre/translations/sk.po

src/calibre/translations/sl.po

src/calibre/translations/sq.po

src/calibre/translations/sr.po

src/calibre/translations/sr@latin.po

src/calibre/translations/sv.po

src/calibre/translations/ta.po

src/calibre/translations/te.po

src/calibre/translations/th.po

src/calibre/translations/tr.po

src/calibre/translations/ug.po

src/calibre/translations/uk.po

src/calibre/translations/ur.po

src/calibre/translations/vi.po

src/calibre/translations/wa.po

src/calibre/translations/yi.po

src/calibre/translations/zh_CN.po

src/calibre/translations/zh_HK.po

src/calibre/translations/zh_TW.po

src/calibre/utils/config.py

src/calibre/utils/ipc/simple_worker.py

src/calibre/utils/ipython.py

src/calibre/utils/localization.py

src/calibre/utils/logging.py

src/calibre/utils/podofo/__init__.py

src/calibre/utils/podofo/doc.cpp

src/calibre/utils/terminal.py

src/calibre/web/jsbrowser/browser.py

Show diffs side-by-side

Legend: added

Legend: removed

src/calibre/ebooks/metadata/pdf.py

__copyright__ = '2008, Kovid Goyal <kovid at kovidgoyal.net>'

'''Read meta information from PDF files'''

#import re

import os, subprocess, shutil

import os, subprocess, shutil, re

from functools import partial

from calibre import prints

from calibre.constants import iswindows

from calibre.ptempfile import TemporaryDirectory

from calibre.ebooks.metadata import MetaInformation, string_to_authors, check_isbn

from calibre.ebooks.metadata import (

MetaInformation, string_to_authors, check_isbn, check_doi)

from calibre.utils.ipc.simple_worker import fork_job, WorkerError

#_isbn_pat = re.compile(r'ISBN[: ]*([-0-9Xx]+)')

file, only for src.pdf.'''

os.chdir(outputdir)

pdfinfo, pdftoppm = get_tools()

ans = {}

try:

raw = subprocess.check_output([pdfinfo, '-enc', 'UTF-8', 'src.pdf'])

raw = subprocess.check_output([pdfinfo, '-meta', '-enc', 'UTF-8', 'src.pdf'])

except subprocess.CalledProcessError as e:

prints('pdfinfo errored out with return code: %d'%e.returncode)

return None

# The XMP metadata could be in an encoding other than UTF-8, so split it

# out before trying to decode raw

parts = re.split(br'^Metadata:', raw, 1, flags=re.MULTILINE)

if len(parts) > 1:

raw, ans['xmp_metadata'] = parts

try:

raw = raw.decode('utf-8')

except UnicodeDecodeError:

prints('pdfinfo returned no UTF-8 data')

return None

ans = {}

for line in raw.splitlines():

if u':' not in line:

continue

127

132

if subject:

128

133

mi.tags.insert(0, subject)

129

134

135

if 'xmp_metadata' in info:

136

from calibre.ebooks.metadata.xmp import consolidate_metadata

137

mi = consolidate_metadata(mi, info)

138

139

# Look for recognizable identifiers in the info dict, if they were not

140

# found in the XMP metadata

141

for scheme, check_func in {'doi':check_doi, 'isbn':check_isbn}.iteritems():

142

if scheme not in mi.get_identifiers():

143

for k, v in info.iteritems():

144

if k != 'xmp_metadata':

145

val = check_func(v)

146

if val:

147

mi.set_identifier(scheme, val)

148

break

149

130

150

if cdata:

131

151

mi.cover_data = ('jpeg', cdata)

132

133

152

return mi

134

153

135

154

get_quick_metadata = partial(get_metadata, cover=False)

Older »