~ubuntu-branches/debian/sid/calibre/sid

« back to all changes in this revision

Viewing changes to src/calibre/ebooks/oeb/polish/check/links.py

Committer: Package Import Robot
Author(s): Martin Pitt
Date: 2014-02-27 07:48:06 UTC
mto: This revision was merged to the branch mainline in revision 74.
Revision ID: package-import@ubuntu.com-20140227074806-64wdebb3ptosxhhx

Tags: upstream-1.25.0+dfsg

Import upstream version 1.25.0+dfsg

files added:
manual/templates/epub_cover_template.html

recipes/disinformatico.recipe

recipes/gosc_full.recipe

recipes/icons/gosc_full.png

recipes/les_echos.recipe

resources/images/beautify.png

src/calibre/ebooks/metadata/xmp.py

src/calibre/gui2/tweak_book/diff/highlight.py

src/calibre/gui2/tweak_book/editor/smart

src/calibre/gui2/tweak_book/editor/smart/__init__.py

src/calibre/gui2/tweak_book/editor/smart/html.py

src/calibre/gui2/viewer/gestures.py

files removed:
recipes/icons/kdefamily_pl.png

recipes/kdefamily_pl.recipe

src/calibre/gui2/store/stores/foyles_uk_plugin.py

files modified:
Changelog.yaml

manual/conf.py

manual/conversion.rst

manual/custom.py

manual/diff.rst

manual/edit.rst

manual/epub.py

manual/faq.rst

manual/templates/layout.html

recipes/abc_es.recipe

recipes/ap.recipe

recipes/cosmopolitan_uk.recipe

recipes/cumhuriyet.recipe

recipes/gosc_niedzielny.recipe

recipes/kathemerini.recipe

recipes/mac_world_uk.recipe

recipes/nrc-nl-epub.recipe

recipes/nytimesbook.recipe

recipes/wired_it.recipe

resources/builtin_recipes.xml

resources/builtin_recipes.zip

resources/compiled_coffeescript.zip

resources/ebook-convert-complete.pickle

resources/images.qrc

resources/localization/locales.zip

resources/localization/stats.pickle

resources/quick_start.epub

setup/installer/__init__.py

setup/iso_639/pl.po

setup/iso_639/ru.po

setup/plugins_mirror.py

setup/resources.py

src/calibre/__init__.py

src/calibre/constants.py

src/calibre/customize/builtins.py

src/calibre/db/cache.py

src/calibre/debug.py

src/calibre/devices/kobo/driver.py

src/calibre/ebooks/chardet.py

src/calibre/ebooks/conversion/plugins/epub_output.py

src/calibre/ebooks/conversion/plugins/pdf_output.py

src/calibre/ebooks/html/input.py

src/calibre/ebooks/metadata/__init__.py

src/calibre/ebooks/metadata/meta.py

src/calibre/ebooks/metadata/opf2.py

src/calibre/ebooks/metadata/pdf.py

src/calibre/ebooks/metadata/sources/edelweiss.py

src/calibre/ebooks/mobi/reader/mobi8.py

src/calibre/ebooks/oeb/base.py

src/calibre/ebooks/oeb/display/paged.coffee

src/calibre/ebooks/oeb/parse_utils.py

src/calibre/ebooks/oeb/polish/check/links.py

src/calibre/ebooks/oeb/polish/check/main.py

src/calibre/ebooks/oeb/polish/check/parsing.py

src/calibre/ebooks/oeb/polish/choose.coffee

src/calibre/ebooks/oeb/polish/container.py

src/calibre/ebooks/oeb/polish/css.py

src/calibre/ebooks/oeb/polish/errors.py

src/calibre/ebooks/oeb/polish/font_stats.coffee

src/calibre/ebooks/oeb/polish/parsing.py

src/calibre/ebooks/oeb/polish/preview.coffee

src/calibre/ebooks/oeb/polish/split.py

src/calibre/ebooks/oeb/polish/tests/container.py

src/calibre/ebooks/oeb/polish/tests/parsing.py

src/calibre/ebooks/oeb/polish/toc.py

src/calibre/ebooks/oeb/polish/utils.py

src/calibre/ebooks/oeb/transforms/rasterize.py

src/calibre/ebooks/oeb/transforms/split.py

src/calibre/ebooks/pdf/render/from_html.py

src/calibre/ebooks/pdf/render/graphics.py

src/calibre/ebooks/pdf/render/serialize.py

src/calibre/gui2/__init__.py

src/calibre/gui2/actions/add.py

src/calibre/gui2/actions/copy_to_library.py

src/calibre/gui2/actions/next_match.py

src/calibre/gui2/actions/preferences.py

src/calibre/gui2/actions/restart.py

src/calibre/gui2/actions/similar_books.py

src/calibre/gui2/auto_add.py

src/calibre/gui2/comments_editor.py

src/calibre/gui2/complete2.py

src/calibre/gui2/dialogs/duplicates.py

src/calibre/gui2/dialogs/message_box.py

src/calibre/gui2/dialogs/metadata_bulk.py

src/calibre/gui2/email.py

src/calibre/gui2/init.py

src/calibre/gui2/jobs.py

src/calibre/gui2/layout.py

src/calibre/gui2/preferences/email.ui

src/calibre/gui2/preferences/email_ui.py

src/calibre/gui2/preferences/emailp.py

src/calibre/gui2/preferences/tweaks.py

src/calibre/gui2/preferences/tweaks.ui

src/calibre/gui2/preferences/tweaks_ui.py

src/calibre/gui2/progress_indicator/QProgressIndicator.cpp

src/calibre/gui2/progress_indicator/QProgressIndicator.h

src/calibre/gui2/progress_indicator/QProgressIndicator.sip

src/calibre/gui2/store/stores/amazon_de_plugin.py

src/calibre/gui2/store/stores/amazon_es_plugin.py

src/calibre/gui2/store/stores/amazon_fr_plugin.py

src/calibre/gui2/store/stores/amazon_it_plugin.py

src/calibre/gui2/store/stores/amazon_uk_plugin.py

src/calibre/gui2/store/stores/cdp_plugin.py

src/calibre/gui2/store/stores/mills_boon_uk_plugin.py

src/calibre/gui2/store/stores/publio_plugin.py

src/calibre/gui2/store/stores/woblink_plugin.py

src/calibre/gui2/store/stores/wolnelektury_plugin.py

src/calibre/gui2/toc/location.py

src/calibre/gui2/toc/main.py

src/calibre/gui2/tweak_book/boss.py

src/calibre/gui2/tweak_book/diff/main.py

src/calibre/gui2/tweak_book/diff/view.py

src/calibre/gui2/tweak_book/editor/syntax/base.py

src/calibre/gui2/tweak_book/editor/syntax/html.py

src/calibre/gui2/tweak_book/editor/text.py

src/calibre/gui2/tweak_book/editor/themes.py

src/calibre/gui2/tweak_book/editor/widget.py

src/calibre/gui2/tweak_book/file_list.py

src/calibre/gui2/tweak_book/main.py

src/calibre/gui2/tweak_book/preview.py

src/calibre/gui2/tweak_book/save.py

src/calibre/gui2/tweak_book/ui.py

src/calibre/gui2/tweak_book/undo.py

src/calibre/gui2/viewer/documentview.py

src/calibre/gui2/viewer/main_ui.py

src/calibre/gui2/viewer/toc.py

src/calibre/library/catalogs/epub_mobi.py

src/calibre/library/catalogs/epub_mobi_builder.py

src/calibre/library/cli.py

src/calibre/linux.py

src/calibre/translations/af.po

src/calibre/translations/ar.po

src/calibre/translations/ast.po

src/calibre/translations/az.po

src/calibre/translations/ber.po

src/calibre/translations/bg.po

src/calibre/translations/bn.po

src/calibre/translations/br.po

src/calibre/translations/bs.po

src/calibre/translations/ca.po

src/calibre/translations/calibre.pot

src/calibre/translations/cs.po

src/calibre/translations/cy.po

src/calibre/translations/da.po

src/calibre/translations/de.po

src/calibre/translations/el.po

src/calibre/translations/en_AU.po

src/calibre/translations/en_CA.po

src/calibre/translations/en_GB.po

src/calibre/translations/eo.po

src/calibre/translations/es.po

src/calibre/translations/et.po

src/calibre/translations/eu.po

src/calibre/translations/fa.po

src/calibre/translations/fi.po

src/calibre/translations/fil.po

src/calibre/translations/fo.po

src/calibre/translations/fr.po

src/calibre/translations/fr_CA.po

src/calibre/translations/fur.po

src/calibre/translations/gl.po

src/calibre/translations/gu.po

src/calibre/translations/he.po

src/calibre/translations/hi.po

src/calibre/translations/him.po

src/calibre/translations/hr.po

src/calibre/translations/hu.po

src/calibre/translations/id.po

src/calibre/translations/is.po

src/calibre/translations/it.po

src/calibre/translations/ja.po

src/calibre/translations/jv.po

src/calibre/translations/ka.po

src/calibre/translations/kn.po

src/calibre/translations/ko.po

src/calibre/translations/ku.po

src/calibre/translations/lt.po

src/calibre/translations/ltg.po

src/calibre/translations/lv.po

src/calibre/translations/mk.po

src/calibre/translations/ml.po

src/calibre/translations/mn.po

src/calibre/translations/mr.po

src/calibre/translations/ms.po

src/calibre/translations/my.po

src/calibre/translations/nb.po

src/calibre/translations/nds.po

src/calibre/translations/nl.po

src/calibre/translations/nn.po

src/calibre/translations/oc.po

src/calibre/translations/pa.po

src/calibre/translations/pl.po

src/calibre/translations/pt.po

src/calibre/translations/pt_BR.po

src/calibre/translations/ro.po

src/calibre/translations/ru.po

src/calibre/translations/sc.po

src/calibre/translations/si.po

src/calibre/translations/sk.po

src/calibre/translations/sl.po

src/calibre/translations/sq.po

src/calibre/translations/sr.po

src/calibre/translations/sr@latin.po

src/calibre/translations/sv.po

src/calibre/translations/ta.po

src/calibre/translations/te.po

src/calibre/translations/th.po

src/calibre/translations/tr.po

src/calibre/translations/ug.po

src/calibre/translations/uk.po

src/calibre/translations/ur.po

src/calibre/translations/vi.po

src/calibre/translations/wa.po

src/calibre/translations/yi.po

src/calibre/translations/zh_CN.po

src/calibre/translations/zh_HK.po

src/calibre/translations/zh_TW.po

src/calibre/utils/config.py

src/calibre/utils/ipc/simple_worker.py

src/calibre/utils/ipython.py

src/calibre/utils/localization.py

src/calibre/utils/logging.py

src/calibre/utils/podofo/__init__.py

src/calibre/utils/podofo/doc.cpp

src/calibre/utils/terminal.py

src/calibre/web/jsbrowser/browser.py

Show diffs side-by-side

added added

removed removed

src/calibre/ebooks/oeb/polish/check/links.py

__license__ = 'GPL v3'

__copyright__ = '2013, Kovid Goyal <kovid at kovidgoyal.net>'

import os

from collections import defaultdict

from urlparse import urlparse

from calibre.ebooks.oeb.base import OEB_DOCS, OEB_STYLES

from calibre.ebooks.oeb.polish.container import OEB_FONTS

from calibre.ebooks.oeb.polish.utils import guess_type

from calibre.ebooks.oeb.polish.utils import guess_type, actual_case_for_name, corrected_case_for_name

from calibre.ebooks.oeb.polish.check.base import BaseError, WARN, INFO

class BadLink(BaseError):

' either fix, or remove the link.')

level = WARN

class CaseMismatch(BadLink):
    ''' A link whose case does not agree with the case of the file it points
    to. Calling the error with a container rewrites the offending link so
    that it uses the corrected name. '''

    def __init__(self, href, corrected_name, name, lnum, col):
        # href: the link text as written; corrected_name: the name of the
        # file with its actual case; name/lnum/col: where the link was found.
        title = _('The linked to resource {0} does not exist').format(href)
        BadLink.__init__(self, title, name, line=lnum, col=col)
        self.href = href
        self.corrected_name = corrected_name
        help_template = _('The case of the link {0} and the case of the actual file it points to {1}'
                          ' do not agree. You should change either the case of the link or rename the file.')
        self.HELP = help_template.format(href, corrected_name)
        self.INDIVIDUAL_FIX = _('Change the case of the link to match the actual file')

    def __call__(self, container):
        ''' Replace every occurrence of the mismatched link in the file
        self.name (presumably set by the base class constructor -- confirm)
        and return True if at least one link was actually changed. '''
        # Build the replacement href from the corrected name, carrying over
        # any fragment present on the original link.
        fragment = urlparse(self.href).fragment
        fixed_href = container.name_to_href(self.corrected_name, self.name)
        if fragment:
            fixed_href = fixed_href + '#' + fragment
        stale_href = self.href

        class CaseFixer(object):
            # Records whether any URL passed through was rewritten
            replaced = False

            def __call__(self, url):
                if url == stale_href:
                    self.replaced = True
                    return fixed_href
                # Leave every other link untouched
                return url

        fixer = CaseFixer()
        container.replace_links(self.name, fixer)
        return fixer.replaced

class BadDestinationType(BaseError):
    ''' Warning reported for a link that points to a file which is not a text
    (HTML) document. '''

    level = WARN

    def __init__(self, link_source, link_dest, link_elem):
        # link_source: name of the file containing the link; link_dest: name
        # of the file the link points to; link_elem: the element carrying the
        # href attribute (its sourceline is used as the error line).
        href = link_elem.get('href')
        BaseError.__init__(self, _('Link points to a file that is not a text document'), link_source, line=link_elem.sourceline)
        self.bad_href = href
        help_template = _('The link "{0}" points to a file <i>{1}</i> that is not a text (HTML) document.'
                          ' Many ebook readers will be unable to follow such a link. You should'
                          ' either remove the link or change it to point to a text document.'
                          ' For example, if it points to an image, you can create small wrapper'
                          ' document that contains the image and change the link to point to that.')
        self.HELP = help_template.format(href, link_dest)

class FileLink(BadLink):

HELP = _('This link uses the file:// URL scheme. This does not work with many ebook readers.'

125

' The recommended mimetype for files with the extension "{2}" is {3}.'

126

' You should change either the file extension or the mimetype in the OPF.').format(

127

name, opf_mt, ext, ext_mt)

self.INDIVIDUAL_FIX = _('Change the mimetype for this file in the OPF to %s') % ext_mt

128

if opf_mt in OEB_DOCS and name in {n for n, l in container.spine_names}:

129

self.INDIVIDUAL_FIX = _('Change the file extension to .xhtml')

130

self.change_ext_to = 'xhtml'

131

else:

132

self.INDIVIDUAL_FIX = _('Change the mimetype for this file in the OPF to %s') % ext_mt

133

self.change_ext_to = None

134

135

def __call__(self, container):

136

changed = False

for item in container.opf_xpath('//opf:manifest/opf:item[@href and @media-type="%s"]' % self.opf_mt):

name = container.href_to_name(item.get('href'), container.opf_name)

if name == self.file_name:

changed = True

item.set('media-type', self.ext_mt)

container.mime_map[name] = self.ext_mt

if changed:

container.dirty(container.opf_name)

137

if self.change_ext_to is not None:

138

from calibre.ebooks.oeb.polish.replace import rename_files

139

new_name = self.file_name.rpartition('.')[0] + '.' + self.change_ext_to

140

c = 0

141

while container.has_name(new_name):

142

c += 1

143

new_name = self.file_name.rpartition('.')[0] + ('%d.' % c) + self.change_ext_to

144

rename_files(container, {self.file_name:new_name})

145

changed = True

146

else:

147

for item in container.opf_xpath('//opf:manifest/opf:item[@href and @media-type="%s"]' % self.opf_mt):

148

name = container.href_to_name(item.get('href'), container.opf_name)

149

if name == self.file_name:

150

changed = True

151

item.set('media-type', self.ext_mt)

152

container.mime_map[name] = self.ext_mt

153

if changed:

154

container.dirty(container.opf_name)

155

return changed

156

157

def check_mimetypes(container):

107

165

a(MimetypeMismatch(container, name, mt, gt))

108

166

return errors

109

167

168

def check_link_destinations(container):
    ''' Return a list of BadDestinationType errors, one for each <a href>
    element in a text document whose target is present in the container's
    mime_map with a mimetype that is not in OEB_DOCS. '''
    errors = []
    for name, mt in container.mime_map.iteritems():
        # Only text documents are scanned for links
        if mt not in OEB_DOCS:
            continue
        for anchor in container.parsed(name).xpath('//*[local-name()="a" and @href]'):
            target = container.href_to_name(anchor.get('href'), name)
            # Links that do not resolve to a name, or resolve to a name the
            # container does not know about, are not reported here.
            if not target or target not in container.mime_map:
                continue
            if container.mime_map[target] not in OEB_DOCS:
                errors.append(BadDestinationType(name, target, anchor))
    return errors

177

110

178

def check_links(container):

111

179

links_map = defaultdict(set)

112

180

xml_types = {guess_type('a.opf'), guess_type('a.ncx')}

128

196

if tname in container.mime_map:

129

197

links_map[name].add(tname)

130

198

else:

131

a(BadLink(_('The linked resource %s is a directory') % fl(href), name, lnum, col))

199

# Filesystem says the file exists, but it is not in

200

# the mime_map, so either there is a case mismatch

201

# or the link is a directory

202

apath = container.name_to_abspath(tname)

203

if os.path.isdir(apath):

204

a(BadLink(_('The linked resource %s is a directory') % fl(href), name, lnum, col))

205

else:

206

a(CaseMismatch(href, actual_case_for_name(container, tname), name, lnum, col))

132

207

else:

133

a(BadLink(_('The linked resource %s does not exist') % fl(href), name, lnum, col))

208

cname = corrected_case_for_name(container, tname)

209

if cname is not None:

210

a(CaseMismatch(href, cname, name, lnum, col))

211

else:

212

a(BadLink(_('The linked resource %s does not exist') % fl(href), name, lnum, col))

134

213

else:

135

214

purl = urlparse(href)

136

215

if purl.scheme == 'file':

Older »