9
9
class DeStandaard(BasicNewsRecipe):
    """News recipe for the Belgian newspaper De Standaard.

    Articles are discovered through a single FeedBurner feed. Each article
    is downloaded from its print-friendly page (see ``print_version``) and
    trimmed down to the ``div`` elements selected by ``keep_only_tags``.
    """

    title = u'De Standaard'
    __author__ = u'Darko Miletic'
    description = u'News from Belgium'
    max_articles_per_feed = 100
    no_stylesheets = True
    # The feed only links to articles, so the full page is fetched.
    use_embedded_content = False

    # Keep only the article containers. An earlier assignment in this file
    # selected id '_parts_midContainer_div'; it was overridden by this one,
    # so only the effective value is retained.
    keep_only_tags = [dict(name='div', attrs={'id': ['intro', 'continued']})]

    remove_tags_after = dict(name='h3', attrs={'title': 'Binnenland'})

    # NOTE(review): these entries had lost their enclosing list; they are
    # presumably the recipe's ``remove_tags`` -- confirm against the
    # upstream recipe before relying on them.
    remove_tags = [
        dict(name='h3', attrs={'title': 'Binnenland'}),
        dict(name='p', attrs={'class': 'by'}),
        dict(name='div', attrs={'class': 'articlesright'}),
        dict(name='a', attrs={'class': 'help'}),
        dict(name='a', attrs={'class': 'archive'}),
        dict(name='a', attrs={'class': 'print'}),
        dict(name='a', attrs={'class': 'email'}),
    ]

    feeds = [
        (u'De Standaard Online', u'http://feeds.feedburner.com/dso-front'),
    ]

    def get_article_url(self, article):
        """Return the article's ``guid`` entry, or ``None`` if it has none.

        The ``guid`` is used instead of the feed's link field; presumably
        the link points at a FeedBurner redirect -- TODO confirm.
        """
        return article.get('guid', None)

    def print_version(self, url):
        """Return *url* rewritten to point at the print-friendly page.

        ``/Detail.aspx?`` is replaced by ``/PrintArtikel.aspx?``; a URL that
        does not contain that path segment is returned unchanged.
        """
        return url.replace('/Detail.aspx?', '/PrintArtikel.aspx?')