~ubuntu-branches/ubuntu/karmic/calibre/karmic-updates

« back to all changes in this revision

Viewing changes to src/calibre/web/feeds/recipes/recipe_zaobao.py

  • Committer: Bazaar Package Importer
  • Author(s): Martin Pitt
  • Date: 2009-04-05 18:42:16 UTC
  • mfrom: (1.1.7 sid)
  • Revision ID: james.westby@ubuntu.com-20090405184216-cyb0x4edrwjcaw33
Tags: 0.5.9+dfsg-1
* New upstream release. (Closes: #525339)
* manpages-installation.patch: Encode generated manpages as UTF-8, to avoid
  UnicodeDecodeErrors when writing them out to files.
* debian/control: Demote calibre dependency of calibre-bin to Recommends:,
  which is sufficient and avoids a circular dependency. (Closes: #522059)
* debian/control: Drop build dependency help2man, current version does not
  need it any more.
* debian/control: Drop versioned build dependency on python-mechanize,
  current sid version is enough.
* debian/rules: Copy "setup.py install" command from cdbs'
  python-distutils.mk, since the current version broke this. This is a
  hackish workaround until #525436 gets fixed.
* debian/rules: Drop using $(wildcard ), use `ls`; the former does not work
  any more.

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
#!/usr/bin/env  python
 
2
 
 
3
__license__   = 'GPL v3'
 
4
__copyright__ = '2009, Pu Bo <pubo at pubolab.com>'
 
5
'''
 
6
zaobao.com
 
7
'''
 
8
import time, os, traceback, sys
 
9
from calibre.web.feeds.news import BasicNewsRecipe
 
10
from calibre.web.feeds import feeds_from_index, Feed, Article
 
11
from BeautifulSoup import Tag
 
12
 
 
13
class ZAOBAO(BasicNewsRecipe):
    """Fetch news from zaobao.com (Lianhe Zaobao).

    In addition to the regular RSS feeds, this recipe scrapes the static
    photo-news index pages listed in ``INDEXES`` and appends them as extra
    feeds.  It also works around feeds whose GBK text was not decoded
    correctly by the upstream feed parser (see ``parse_feeds``).
    """

    title          = u'\u8054\u5408\u65e9\u62a5\u7f51 zaobao.com'
    __author__     = 'Pu Bo'
    description    = 'News from zaobao.com'
    no_stylesheets = True
    recursions     = 1
    language = _('Chinese')
    # Site is served as GBK; used below to repair mis-decoded feed text.
    encoding     = 'gbk'
#    multithreaded_fetch = True

    keep_only_tags    = [
        dict(name='table', attrs={'cellpadding':'9'}),
        dict(name='table', attrs={'class':'cont'}),
        dict(name='div', attrs={'id':'content'}),
        dict(name='span', attrs={'class':'page'}),
    ]

    remove_tags    = [
        dict(name='table', attrs={'cellspacing':'9'}),
    ]

    extra_css      = '\
            @font-face {font-family: "serif1";src:url(res:///opt/sony/ebook/FONT/tt0011m_.ttf)}\n\
            body{font-family: serif1, serif}\n\
            .article_description{font-family: serif1, serif}\n\
            p{font-family: serif1, serif}\n\
            h1 {font-weight: bold; font-size: large;}\n\
            h2 {font-size: large;}\n\
            .title {font-size: large;}\n\
            .article {font-size:medium}\n\
            .navbar {font-size: small}\n\
            .feed{font-size: medium}\n\
                        .small{font-size: small; padding-right: 8%}\n'

    # Static (non-RSS) index pages scraped in parse_feeds(): (title, url).
    INDEXES                = [
                       (u'\u65b0\u95fb\u56fe\u7247', u'http://www.zaobao.com/photoweb/photoweb_idx.shtml')
                    ]
    # Cap on how many links to take from each index page.
    MAX_ITEMS_IN_INDEX = 10

    # Site name in Chinese; doubles as a sentinel: a correctly decoded feed
    # description must contain this string.
    DESC_SENSE     = u'\u8054\u5408\u65e9\u62a5\u7f51'

    feeds          = [
                      (u'\u5373\u65f6\u62a5\u9053', u'http://realtime.zaobao.com/news.xml'),
                      (u'\u4e2d\u56fd\u65b0\u95fb', u'http://www.zaobao.com/zg/zg.xml'),
                      (u'\u56fd\u9645\u65b0\u95fb', u'http://www.zaobao.com/gj/gj.xml'),
                      (u'\u4e16\u754c\u62a5\u520a\u6587\u8403', u'http://www.zaobao.com/wencui/wencui.xml'),
                      (u'\u4e1c\u5357\u4e9a\u65b0\u95fb', u'http://www.zaobao.com/yx/yx.xml'),
                      (u'\u65b0\u52a0\u5761\u65b0\u95fb', u'http://www.zaobao.com/sp/sp.xml'),
                      (u'\u4eca\u65e5\u89c2\u70b9', u'http://www.zaobao.com/yl/yl.xml'),
                      (u'\u4e2d\u56fd\u8d22\u7ecf', u'http://www.zaobao.com/cz/cz.xml'),
                      (u'\u72ee\u57ce\u8d22\u7ecf', u'http://www.zaobao.com/cs/cs.xml'),
                      (u'\u5168\u7403\u8d22\u7ecf', u'http://www.zaobao.com/cg/cg.xml'),
                      (u'\u65e9\u62a5\u4f53\u80b2', u'http://www.zaobao.com/ty/ty.xml'),
                      (u'\u65e9\u62a5\u526f\u520a', u'http://www.zaobao.com/fk/fk.xml'),
                    ]

    def postprocess_html(self, soup, first):
        """Flatten table markup: rename table/tr/td tags to div so the
        keep_only_tags table containers render as plain blocks."""
        for tag in soup.findAll(name=['table', 'tr', 'td']):
            tag.name = 'div'
        return soup

    def parse_feeds(self):
        """Parse the RSS feeds, append feeds scraped from ``INDEXES``,
        then repair any feed/article text that was not decoded from
        ``self.encoding`` (GBK) correctly.

        Returns the list of parsed Feed objects.
        """
        self.log_debug(_('ZAOBAO overrided parse_feeds()'))
        parsed_feeds = BasicNewsRecipe.parse_feeds(self)

        # Scrape each static index page and append it as an extra feed.
        for id, obj in enumerate(self.INDEXES):
            title, url = obj
            articles = []
            soup = self.index_to_soup(url)

            for i, item in enumerate(soup.findAll('li')):
                if i >= self.MAX_ITEMS_IN_INDEX:
                    break
                a = item.find('a')
                # has_key() checks tag attributes in BeautifulSoup 3
                # ('in' would search the tag's contents instead).
                if a and a.has_key('href'):
                    a_url = a['href']
                    a_title = self.tag_to_string(a)
                    date = ''
                    description = ''
                    self.log_debug(_('adding %s at %s')%(a_title,a_url))
                    articles.append({
                                    'title':a_title,
                                    'date':date,
                                    'url':a_url,
                                    'description':description
                                    })

            pfeeds = feeds_from_index([(title, articles)], oldest_article=self.oldest_article,
                                     max_articles_per_feed=self.max_articles_per_feed)

            self.log_debug(_('adding %s to feed')%(title))
            for feed in pfeeds:
                self.log_debug(_('adding feed: %s')%(feed.title))
                feed.description = self.DESC_SENSE
                parsed_feeds.append(feed)
                for a, article in enumerate(feed):
                    self.log_debug(_('added article %s from %s')%(article.title, article.url))
                self.log_debug(_('added feed %s')%(feed.title))

        for i, feed in enumerate(parsed_feeds):
            # Work around a strange problem: sometimes the XML encoding is
            # not applied correctly by parse().
            weird_encoding_detected = False
            # BUGFIX: test feed.description for truthiness BEFORE calling
            # methods on it — the original called .find() in the elif
            # condition first, raising AttributeError on a None description.
            if feed.description and self.encoding and not isinstance(feed.description, unicode):
                self.log_debug(_('Feed %s is not encoded correctly, manually replace it')%(feed.title))
                feed.description = feed.description.decode(self.encoding, 'replace')
            elif feed.description and self.encoding and feed.description.find(self.DESC_SENSE) == -1:
                # Description decoded with the wrong codec: round-trip it
                # through cp1252 to recover the raw bytes, then decode as GBK.
                self.log_debug(_('Feed %s is weired encoded, manually redo all')%(feed.title))
                feed.description = feed.description.encode('cp1252', 'replace').decode(self.encoding, 'replace')
                weird_encoding_detected = True

            for a, article in enumerate(feed):
                # BUGFIX: guard against a None/empty title before decoding,
                # matching the guards on summary and text_summary below.
                if article.title and self.encoding and not isinstance(article.title, unicode):
                    article.title = article.title.decode(self.encoding, 'replace')
                if not isinstance(article.summary, unicode) and self.encoding and article.summary:
                    article.summary = article.summary.decode(self.encoding, 'replace')
                    article.text_summary = article.summary
                if not isinstance(article.text_summary, unicode) and self.encoding and article.text_summary:
                    article.text_summary = article.text_summary.decode(self.encoding, 'replace')
                    article.summary = article.text_summary
                if weird_encoding_detected:
                    if article.title:
                        article.title = article.title.encode('cp1252', 'replace').decode(self.encoding, 'replace')
                    if article.summary:
                        article.summary = article.summary.encode('cp1252', 'replace').decode(self.encoding, 'replace')
                    if article.text_summary:
                        article.text_summary = article.text_summary.encode('cp1252', 'replace').decode(self.encoding, 'replace')

            # BUGFIX: remove empty articles in a separate pass over a
            # snapshot.  The original deleted from feed.articles while
            # enumerating the feed, which skips the element following
            # each removal.
            for article in list(feed.articles):
                if article.title == "Untitled article":
                    self.log_debug(_('Removing empty article %s from %s')%(article.title, article.url))
                    feed.articles.remove(article)
        return parsed_feeds

    def get_browser(self):
        """Return the recipe browser with caching disabled, so the
        frequently-updated realtime feed is always fetched fresh."""
        br = BasicNewsRecipe.get_browser()
        br.addheaders.append(('Pragma', 'no-cache'))
        return br
 
 
b'\\ No newline at end of file'