~ubuntu-branches/debian/sid/calibre/sid

« back to all changes in this revision

Viewing changes to src/calibre/ebooks/oeb/polish/toc.py

Committer: Package Import Robot
Author(s): Martin Pitt
Date: 2014-02-27 07:48:06 UTC
mto: This revision was merged to the branch mainline in revision 74.
Revision ID: package-import@ubuntu.com-20140227074806-64wdebb3ptosxhhx

Tags: upstream-1.25.0+dfsg

Import upstream version 1.25.0+dfsg

files added:
manual/templates/epub_cover_template.html

recipes/disinformatico.recipe

recipes/gosc_full.recipe

recipes/icons/gosc_full.png

recipes/les_echos.recipe

resources/images/beautify.png

src/calibre/ebooks/metadata/xmp.py

src/calibre/gui2/tweak_book/diff/highlight.py

src/calibre/gui2/tweak_book/editor/smart

src/calibre/gui2/tweak_book/editor/smart/__init__.py

src/calibre/gui2/tweak_book/editor/smart/html.py

src/calibre/gui2/viewer/gestures.py

files removed:
recipes/icons/kdefamily_pl.png

recipes/kdefamily_pl.recipe

src/calibre/gui2/store/stores/foyles_uk_plugin.py

files modified:
Changelog.yaml

manual/conf.py

manual/conversion.rst

manual/custom.py

manual/diff.rst

manual/edit.rst

manual/epub.py

manual/faq.rst

manual/templates/layout.html

recipes/abc_es.recipe

recipes/ap.recipe

recipes/cosmopolitan_uk.recipe

recipes/cumhuriyet.recipe

recipes/gosc_niedzielny.recipe

recipes/kathemerini.recipe

recipes/mac_world_uk.recipe

recipes/nrc-nl-epub.recipe

recipes/nytimesbook.recipe

recipes/wired_it.recipe

resources/builtin_recipes.xml

resources/builtin_recipes.zip

resources/compiled_coffeescript.zip

resources/ebook-convert-complete.pickle

resources/images.qrc

resources/localization/locales.zip

resources/localization/stats.pickle

resources/quick_start.epub

setup/installer/__init__.py

setup/iso_639/pl.po

setup/iso_639/ru.po

setup/plugins_mirror.py

setup/resources.py

src/calibre/__init__.py

src/calibre/constants.py

src/calibre/customize/builtins.py

src/calibre/db/cache.py

src/calibre/debug.py

src/calibre/devices/kobo/driver.py

src/calibre/ebooks/chardet.py

src/calibre/ebooks/conversion/plugins/epub_output.py

src/calibre/ebooks/conversion/plugins/pdf_output.py

src/calibre/ebooks/html/input.py

src/calibre/ebooks/metadata/__init__.py

src/calibre/ebooks/metadata/meta.py

src/calibre/ebooks/metadata/opf2.py

src/calibre/ebooks/metadata/pdf.py

src/calibre/ebooks/metadata/sources/edelweiss.py

src/calibre/ebooks/mobi/reader/mobi8.py

src/calibre/ebooks/oeb/base.py

src/calibre/ebooks/oeb/display/paged.coffee

src/calibre/ebooks/oeb/parse_utils.py

src/calibre/ebooks/oeb/polish/check/links.py

src/calibre/ebooks/oeb/polish/check/main.py

src/calibre/ebooks/oeb/polish/check/parsing.py

src/calibre/ebooks/oeb/polish/choose.coffee

src/calibre/ebooks/oeb/polish/container.py

src/calibre/ebooks/oeb/polish/css.py

src/calibre/ebooks/oeb/polish/errors.py

src/calibre/ebooks/oeb/polish/font_stats.coffee

src/calibre/ebooks/oeb/polish/parsing.py

src/calibre/ebooks/oeb/polish/preview.coffee

src/calibre/ebooks/oeb/polish/split.py

src/calibre/ebooks/oeb/polish/tests/container.py

src/calibre/ebooks/oeb/polish/tests/parsing.py

src/calibre/ebooks/oeb/polish/toc.py

src/calibre/ebooks/oeb/polish/utils.py

src/calibre/ebooks/oeb/transforms/rasterize.py

src/calibre/ebooks/oeb/transforms/split.py

src/calibre/ebooks/pdf/render/from_html.py

src/calibre/ebooks/pdf/render/graphics.py

src/calibre/ebooks/pdf/render/serialize.py

src/calibre/gui2/__init__.py

src/calibre/gui2/actions/add.py

src/calibre/gui2/actions/copy_to_library.py

src/calibre/gui2/actions/next_match.py

src/calibre/gui2/actions/preferences.py

src/calibre/gui2/actions/restart.py

src/calibre/gui2/actions/similar_books.py

src/calibre/gui2/auto_add.py

src/calibre/gui2/comments_editor.py

src/calibre/gui2/complete2.py

src/calibre/gui2/dialogs/duplicates.py

src/calibre/gui2/dialogs/message_box.py

src/calibre/gui2/dialogs/metadata_bulk.py

src/calibre/gui2/email.py

src/calibre/gui2/init.py

src/calibre/gui2/jobs.py

src/calibre/gui2/layout.py

src/calibre/gui2/preferences/email.ui

src/calibre/gui2/preferences/email_ui.py

src/calibre/gui2/preferences/emailp.py

src/calibre/gui2/preferences/tweaks.py

src/calibre/gui2/preferences/tweaks.ui

src/calibre/gui2/preferences/tweaks_ui.py

src/calibre/gui2/progress_indicator/QProgressIndicator.cpp

src/calibre/gui2/progress_indicator/QProgressIndicator.h

src/calibre/gui2/progress_indicator/QProgressIndicator.sip

src/calibre/gui2/store/stores/amazon_de_plugin.py

src/calibre/gui2/store/stores/amazon_es_plugin.py

src/calibre/gui2/store/stores/amazon_fr_plugin.py

src/calibre/gui2/store/stores/amazon_it_plugin.py

src/calibre/gui2/store/stores/amazon_uk_plugin.py

src/calibre/gui2/store/stores/cdp_plugin.py

src/calibre/gui2/store/stores/mills_boon_uk_plugin.py

src/calibre/gui2/store/stores/publio_plugin.py

src/calibre/gui2/store/stores/woblink_plugin.py

src/calibre/gui2/store/stores/wolnelektury_plugin.py

src/calibre/gui2/toc/location.py

src/calibre/gui2/toc/main.py

src/calibre/gui2/tweak_book/boss.py

src/calibre/gui2/tweak_book/diff/main.py

src/calibre/gui2/tweak_book/diff/view.py

src/calibre/gui2/tweak_book/editor/syntax/base.py

src/calibre/gui2/tweak_book/editor/syntax/html.py

src/calibre/gui2/tweak_book/editor/text.py

src/calibre/gui2/tweak_book/editor/themes.py

src/calibre/gui2/tweak_book/editor/widget.py

src/calibre/gui2/tweak_book/file_list.py

src/calibre/gui2/tweak_book/main.py

src/calibre/gui2/tweak_book/preview.py

src/calibre/gui2/tweak_book/save.py

src/calibre/gui2/tweak_book/ui.py

src/calibre/gui2/tweak_book/undo.py

src/calibre/gui2/viewer/documentview.py

src/calibre/gui2/viewer/main_ui.py

src/calibre/gui2/viewer/toc.py

src/calibre/library/catalogs/epub_mobi.py

src/calibre/library/catalogs/epub_mobi_builder.py

src/calibre/library/cli.py

src/calibre/linux.py

src/calibre/translations/af.po

src/calibre/translations/ar.po

src/calibre/translations/ast.po

src/calibre/translations/az.po

src/calibre/translations/ber.po

src/calibre/translations/bg.po

src/calibre/translations/bn.po

src/calibre/translations/br.po

src/calibre/translations/bs.po

src/calibre/translations/ca.po

src/calibre/translations/calibre.pot

src/calibre/translations/cs.po

src/calibre/translations/cy.po

src/calibre/translations/da.po

src/calibre/translations/de.po

src/calibre/translations/el.po

src/calibre/translations/en_AU.po

src/calibre/translations/en_CA.po

src/calibre/translations/en_GB.po

src/calibre/translations/eo.po

src/calibre/translations/es.po

src/calibre/translations/et.po

src/calibre/translations/eu.po

src/calibre/translations/fa.po

src/calibre/translations/fi.po

src/calibre/translations/fil.po

src/calibre/translations/fo.po

src/calibre/translations/fr.po

src/calibre/translations/fr_CA.po

src/calibre/translations/fur.po

src/calibre/translations/gl.po

src/calibre/translations/gu.po

src/calibre/translations/he.po

src/calibre/translations/hi.po

src/calibre/translations/him.po

src/calibre/translations/hr.po

src/calibre/translations/hu.po

src/calibre/translations/id.po

src/calibre/translations/is.po

src/calibre/translations/it.po

src/calibre/translations/ja.po

src/calibre/translations/jv.po

src/calibre/translations/ka.po

src/calibre/translations/kn.po

src/calibre/translations/ko.po

src/calibre/translations/ku.po

src/calibre/translations/lt.po

src/calibre/translations/ltg.po

src/calibre/translations/lv.po

src/calibre/translations/mk.po

src/calibre/translations/ml.po

src/calibre/translations/mn.po

src/calibre/translations/mr.po

src/calibre/translations/ms.po

src/calibre/translations/my.po

src/calibre/translations/nb.po

src/calibre/translations/nds.po

src/calibre/translations/nl.po

src/calibre/translations/nn.po

src/calibre/translations/oc.po

src/calibre/translations/pa.po

src/calibre/translations/pl.po

src/calibre/translations/pt.po

src/calibre/translations/pt_BR.po

src/calibre/translations/ro.po

src/calibre/translations/ru.po

src/calibre/translations/sc.po

src/calibre/translations/si.po

src/calibre/translations/sk.po

src/calibre/translations/sl.po

src/calibre/translations/sq.po

src/calibre/translations/sr.po

src/calibre/translations/sr@latin.po

src/calibre/translations/sv.po

src/calibre/translations/ta.po

src/calibre/translations/te.po

src/calibre/translations/th.po

src/calibre/translations/tr.po

src/calibre/translations/ug.po

src/calibre/translations/uk.po

src/calibre/translations/ur.po

src/calibre/translations/vi.po

src/calibre/translations/wa.po

src/calibre/translations/yi.po

src/calibre/translations/zh_CN.po

src/calibre/translations/zh_HK.po

src/calibre/translations/zh_TW.po

src/calibre/utils/config.py

src/calibre/utils/ipc/simple_worker.py

src/calibre/utils/ipython.py

src/calibre/utils/localization.py

src/calibre/utils/logging.py

src/calibre/utils/podofo/__init__.py

src/calibre/utils/podofo/doc.cpp

src/calibre/utils/terminal.py

src/calibre/web/jsbrowser/browser.py

Show diffs side-by-side

added added

removed removed

src/calibre/ebooks/oeb/polish/toc.py

import re

from urlparse import urlparse

from collections import deque, Counter, OrderedDict

from collections import Counter, OrderedDict

from functools import partial

from operator import itemgetter

from lxml import etree

from lxml.builder import ElementMaker

from calibre import __version__

from calibre.ebooks.oeb.base import XPath, uuid_id, xml2text, NCX, NCX_NS, XML, XHTML

from calibre.ebooks.oeb.base import XPath, uuid_id, xml2text, NCX, NCX_NS, XML, XHTML, XHTML_NS, serialize

from calibre.ebooks.oeb.polish.errors import MalformedMarkup

from calibre.ebooks.oeb.polish.utils import guess_type

from calibre.ebooks.oeb.polish.pretty import pretty_html_tree

from calibre.utils.localization import get_lang, canonicalize_lang, lang_as_iso639_1

ns = etree.FunctionNamespace('calibre_xpath_extensions')

347

350

toc.add(text, name)

348

351

return toc

349

352

350

def node_from_loc(root, locs, totals=None):
    """Return the element reached by following ``locs`` down from ``<body>``.

    Starting at the first element whose local name is ``body``, each entry
    of ``locs`` is used as an index into the current node's element
    children (comments and processing instructions are excluded by
    ``iterchildren(etree.Element)``).

    :param root: Parsed document that supports ``xpath()``.
    :param locs: Sequence of child indices, one per level of descent.
    :param totals: Optional sequence, parallel to ``locs``, giving the
        number of element children expected at each level. When supplied,
        any mismatch raises :class:`MalformedMarkup`.
    :return: The node found at the end of the path.
    """
    node = root.xpath('//*[local-name()="body"]')[0]
    for i, loc in enumerate(locs):
        children = tuple(node.iterchildren(etree.Element))
        # A differing child count means this tree does not have the shape
        # the caller computed its location against.
        if totals is not None and totals[i] != len(children):
            raise MalformedMarkup()
        node = children[loc]
    return node

359

361

360

def add_id(container, name, loc, totals=None):
    """Ensure the node at ``loc`` inside file ``name`` has an id; return it.

    The node is located with :func:`node_from_loc`. If that raises
    :class:`MalformedMarkup`, the raw file is re-parsed with
    ``force_html5_parse=True`` and the lookup is retried once; on success
    the re-parsed tree replaces the container's copy of the file.

    :param container: Book container providing ``parsed``, ``raw_data``,
        ``parse_xhtml``, ``replace`` and ``commit_item``.
    :param name: Name of the file inside the container.
    :param loc: Sequence of child indices passed to ``node_from_loc``.
    :param totals: Optional expected child counts passed to
        ``node_from_loc``.
    :return: The value of the node's ``id`` attribute.
    :raises MalformedMarkup: If the node still cannot be located after the
        HTML 5 re-parse.
    """
    root = container.parsed(name)
    try:
        node = node_from_loc(root, loc, totals=totals)
    except MalformedMarkup:
        # The webkit HTML parser and the container parser have yielded
        # different node counts, this can happen if the file is valid XML
        # but contains constructs like nested <p> tags. So force parse it
        # with the HTML 5 parser and try again.
        raw = container.raw_data(name)
        root = container.parse_xhtml(raw, fname=name, force_html5_parse=True)
        try:
            node = node_from_loc(root, loc, totals=totals)
        except MalformedMarkup:
            raise MalformedMarkup(_('The file %s has malformed markup. Try running the Fix HTML tool'
                                    ' before editing.') % name)
        # Only reached when the retry succeeded: keep the re-parsed tree.
        container.replace(name, root)

    # Keep an existing id if there is one, otherwise assign a fresh one.
    node.set('id', node.get('id', uuid_id()))
    container.commit_item(name, keep_parsed=True)
    return node.get('id')

457

474

commit_toc(container, toc)

458

475

return True

459

476

return False

477

478

def find_inline_toc(container):
    """Return the name of the spine file holding a generated inline ToC.

    A file matches when its parsed tree contains a ``body`` element whose
    ``id`` attribute is ``calibre_generated_inline_toc``.

    :param container: Object exposing ``spine_names`` (an iterable of
        ``(name, linear)`` pairs) and ``parsed(name)``.
    :return: The first matching file name in spine order, or ``None`` when
        no spine file matches.
    """
    for name, _linear in container.spine_names:
        if container.parsed(name).xpath('//*[local-name()="body" and @id="calibre_generated_inline_toc"]'):
            return name
    return None

482

483

def create_inline_toc(container, title=None):
    """Build an XHTML Table of Contents file from the book's ToC.

    The ToC returned by ``get_toc(container)`` is rendered as nested
    ``<ul>``/``<li>`` lists inside a ``<body>`` whose id is
    ``calibre_generated_inline_toc``. If :func:`find_inline_toc` locates a
    previously generated file it is overwritten; otherwise a new file
    (``toc.xhtml``, or ``tocN.xhtml`` for the first unused N) is added
    with ``spine_index=0``.

    :param container: Book container to read the ToC from and write to.
    :param title: Heading and ``<title>`` text; defaults to the translated
        string 'Table of Contents'.
    :return: Name of the file written, or ``None`` if the ToC is empty.
    """
    title = title or _('Table of Contents')
    toc = get_toc(container)
    if len(toc) == 0:
        return None
    toc_name = find_inline_toc(container)

    def process_node(html_parent, toc_node, level=1, indent=' '):
        # Emit one <li><a/></li> for toc_node, then recurse into its
        # children inside a nested <ul>. The text/tail assignments only
        # control whitespace in the serialized markup.
        li = html_parent.makeelement(XHTML('li'))
        li.tail = '\n' + (indent * level)
        html_parent.append(li)
        name, frag = toc_node.dest, toc_node.frag
        href = '#'
        if name:
            href = container.name_to_href(name, toc_name)
            if frag:
                href += '#' + frag
        a = li.makeelement(XHTML('a'), href=href)
        a.text = toc_node.title
        li.append(a)
        if len(toc_node) > 0:
            parent = li.makeelement(XHTML('ul'))
            li.append(parent)
            a.tail = '\n\n' + (indent * (level + 2))
            parent.text = '\n' + (indent * (level + 3))
            parent.tail = '\n\n' + (indent * (level + 1))
            for child in toc_node:
                process_node(parent, child, level + 3)
            parent[-1].tail = '\n' + (indent * (level + 2))

    E = ElementMaker(namespace=XHTML_NS, nsmap={None: XHTML_NS})
    html = E.html(
        E.head(
            E.title(title),
            E.style('''
                li { list-style-type: none; padding-left: 2em; margin-left: 0}
                a { text-decoration: none }
                a:hover { color: red }''', type='text/css'),
        ),
        E.body(
            E.h2(title),
            E.ul(),
            id="calibre_generated_inline_toc",
        )
    )

    name = toc_name
    # html[1] is <body>; html[1][1] is the top-level <ul> created above.
    for child in toc:
        process_node(html[1][1], child)
    pretty_html_tree(container, html)
    raw = serialize(html, 'text/html')
    if name is None:
        # No previously generated ToC: pick the first unused tocN.xhtml.
        name, c = 'toc.xhtml', 0
        while container.has_name(name):
            c += 1
            name = 'toc%d.xhtml' % c
        container.add_file(name, raw, spine_index=0)
    else:
        with container.open(name, 'wb') as f:
            f.write(raw)
    return name

544

Older »