~ubuntu-branches/ubuntu/natty/miro/natty

Viewing changes to lib/feed.py

Committer: Bazaar Package Importer
Author(s): Bryce Harrington
Date: 2011-01-22 02:46:33 UTC
mfrom: (1.4.10 upstream) (1.7.5 experimental)
Revision ID: james.westby@ubuntu.com-20110122024633-kjme8u93y2il5nmf

Tags: 3.5.1-1ubuntu1

* Merge from debian.  Remaining ubuntu changes:
  - Use python 2.7 instead of python 2.6
  - Relax dependency on python-dbus to >= 0.83.0

files added:
.pc/100_catch_keyerror_in_update_items.patch/lib

.pc/100_catch_keyerror_in_update_items.patch/lib/frontends

.pc/100_catch_keyerror_in_update_items.patch/lib/frontends/widgets

.pc/100_catch_keyerror_in_update_items.patch/lib/frontends/widgets/itemlist.py

.pc/10_movies_dir.patch/linux

.pc/10_movies_dir.patch/linux/plat

.pc/10_movies_dir.patch/linux/plat/config.py

.pc/50_miro_debug_fix.patch/linux

.pc/50_miro_debug_fix.patch/linux/setup.py

.pc/debian-changes-3.5.1-1

.pc/debian-changes-3.5.1-1/lib

.pc/debian-changes-3.5.1-1/lib/frontends

.pc/debian-changes-3.5.1-1/lib/frontends/widgets

.pc/debian-changes-3.5.1-1/lib/frontends/widgets/gtk

.pc/debian-changes-3.5.1-1/lib/frontends/widgets/gtk/webkitgtkhacks.c

debian/patches/debian-changes-3.5.1-1

lib/__init__.py

lib/app.py

lib/appconfig.py

lib/autodiscover.py

lib/autodler.py

lib/autoupdate.py

lib/clock.py

lib/commandline.py

lib/config.py

lib/controller.py

lib/convert20database.py

lib/crashreport.py

lib/database.py

lib/databasehelper.py

lib/databaselog.py

lib/databasesanity.py

lib/databaseupgrade.py

lib/datastructures.py

lib/dbupgradeprogress.py

lib/debugutil.py

lib/dialogs.py

lib/displaytext.py

lib/dl_daemon

lib/dl_daemon/Democracy_Downloader.py

lib/dl_daemon/__init__.py

lib/dl_daemon/command.py

lib/dl_daemon/daemon.py

lib/dl_daemon/download.py

lib/dl_daemon/private

lib/dl_daemon/private/__init__.py

lib/dl_daemon/private/config.py

lib/dl_daemon/private/httpauth.py

lib/dl_daemon/private/resources.py

lib/download_utils.py

lib/downloader.py

lib/eventloop.py

lib/fasttypes.c

lib/feed.py

lib/feedparser.py

lib/feedparserutil.py

lib/feedupdate.py

lib/filetypes.py

lib/fileutil.py

lib/flashscraper.py

lib/folder.py

lib/frontends

lib/frontends/__init__.py

lib/frontends/cli

lib/frontends/cli/README

lib/frontends/cli/__init__.py

lib/frontends/cli/application.py

lib/frontends/cli/clidialog.py

lib/frontends/cli/events.py

lib/frontends/cli/interpreter.py

lib/frontends/cli/util.py

lib/frontends/shell

lib/frontends/shell/__init__.py

lib/frontends/shell/application.py

lib/frontends/widgets

lib/frontends/widgets/__init__.py

lib/frontends/widgets/addtoplaylistdialog.py

lib/frontends/widgets/application.py

lib/frontends/widgets/browser.py

lib/frontends/widgets/cellpack.py

lib/frontends/widgets/crashdialog.py

lib/frontends/widgets/diagnostics.py

lib/frontends/widgets/dialogs.py

lib/frontends/widgets/dialogwidgets.py

lib/frontends/widgets/displays.py

lib/frontends/widgets/downloadscontroller.py

lib/frontends/widgets/feedcontroller.py

lib/frontends/widgets/feedsettingspanel.py

lib/frontends/widgets/firsttimedialog.py

lib/frontends/widgets/gtk

lib/frontends/widgets/gtk/__init__.py

lib/frontends/widgets/gtk/audio.py

lib/frontends/widgets/gtk/base.py

lib/frontends/widgets/gtk/const.py

lib/frontends/widgets/gtk/controls.py

lib/frontends/widgets/gtk/customcontrols.py

lib/frontends/widgets/gtk/drawing.py

lib/frontends/widgets/gtk/fontsize.py

lib/frontends/widgets/gtk/keymap.py

lib/frontends/widgets/gtk/layout.py

lib/frontends/widgets/gtk/layoutmanager.py

lib/frontends/widgets/gtk/persistentwindow.py

lib/frontends/widgets/gtk/preferenceswindow.py

lib/frontends/widgets/gtk/pygtkhacks.pyx

lib/frontends/widgets/gtk/searchentry.py

lib/frontends/widgets/gtk/simple.py

lib/frontends/widgets/gtk/sniffer.py

lib/frontends/widgets/gtk/tableview.py

lib/frontends/widgets/gtk/textlayout.py

lib/frontends/widgets/gtk/threads.py

lib/frontends/widgets/gtk/timer.py

lib/frontends/widgets/gtk/trayicon.py

lib/frontends/widgets/gtk/video.py

lib/frontends/widgets/gtk/weakconnect.py

lib/frontends/widgets/gtk/webkitgtkhacks.c

lib/frontends/widgets/gtk/webkitgtkhacks.pyx

lib/frontends/widgets/gtk/widgets.py

lib/frontends/widgets/gtk/widgetset.py

lib/frontends/widgets/gtk/window.py

lib/frontends/widgets/gtk/wrappermap.py

lib/frontends/widgets/gtk/xpcom

lib/frontends/widgets/gtk/xpcom/HttpObserver.cc

lib/frontends/widgets/gtk/xpcom/HttpObserver.h

lib/frontends/widgets/imagebutton.py

lib/frontends/widgets/imagepool.py

lib/frontends/widgets/itemcontextmenu.py

lib/frontends/widgets/itemedit.py

lib/frontends/widgets/itemlist.py

lib/frontends/widgets/itemlistcontroller.py

lib/frontends/widgets/itemlistwidgets.py

lib/frontends/widgets/linkhandler.py

lib/frontends/widgets/menus.py

lib/frontends/widgets/newfeed.py

lib/frontends/widgets/newfolder.py

lib/frontends/widgets/newsearchfeed.py

lib/frontends/widgets/playback.py

lib/frontends/widgets/playlist.py

lib/frontends/widgets/prefpanel.py

lib/frontends/widgets/quitconfirmation.py

lib/frontends/widgets/removefeeds.py

lib/frontends/widgets/rundialog.py

lib/frontends/widgets/search.py

lib/frontends/widgets/searchbox.py

lib/frontends/widgets/segmented.py

lib/frontends/widgets/separator.py

lib/frontends/widgets/statictabs.py

lib/frontends/widgets/style.py

lib/frontends/widgets/tablist.py

lib/frontends/widgets/tablistmanager.py

lib/frontends/widgets/util.py

lib/frontends/widgets/videobox.py

lib/frontends/widgets/videoconversionscontroller.py

lib/frontends/widgets/watchedfolders.py

lib/frontends/widgets/widgetconst.py

lib/frontends/widgets/widgetutil.py

lib/frontends/widgets/window.py

lib/frontendstate.py

lib/gtcache.py

lib/guide.py

lib/httpauth.py

lib/httpauthtools.py

lib/httpclient.py

lib/iconcache.py

lib/iso639.py

lib/item.py

lib/messagehandler.py

lib/messages.py

lib/models.py

lib/moviedata.py

lib/net.py

lib/opml.py

lib/player.py

lib/playlist.py

lib/prefs.py

lib/schema.py

lib/schemav79.py

lib/search.py

lib/searchengines.py

lib/signals.py

lib/singleclick.py

lib/startup.py

lib/storedatabase.py

lib/subscription.py

lib/tabs.py

lib/test

lib/test/__init__.py

lib/test/conversionstest.py

lib/test/databasesanitytest.py

lib/test/databasetest.py

lib/test/datastructurestest.py

lib/test/downloadertest.py

lib/test/feedparsertest.py

lib/test/feedtest.py

lib/test/filetypestest.py

lib/test/flashscrapertest.py

lib/test/framework.py

lib/test/gtcachetest.py

lib/test/httpclienttest.py

lib/test/httpdownloadertest.py

lib/test/iconcachetest.py

lib/test/itemtest.py

lib/test/messagetest.py

lib/test/networktest.py

lib/test/opmltest.py

lib/test/parseurltest.py

lib/test/playlisttest.py

lib/test/schedulertest.py

lib/test/schematest.py

lib/test/signalstest.py

lib/test/sparkletest.py

lib/test/storedatabasetest.py

lib/test/strippertest.py

lib/test/subscriptiontest.py

lib/test/testhttpserver.py

lib/test/unicodetest.py

lib/test/utiltest.py

lib/test/xhtmltest.py

lib/theme.py

lib/trapcall.py

lib/u3info.py

lib/util.py

lib/videoconversion.py

lib/xhtmltools.py

linux

linux/Makefile

linux/README

linux/helperscripts

linux/helperscripts/README

linux/helperscripts/fedora_12.sh

linux/helperscripts/fedora_13.sh

linux/helperscripts/ubuntu_karmic_9_10.sh

linux/helperscripts/ubuntu_lucid_10_4.sh

linux/helperscripts/ubuntu_maverick_10_10.sh

linux/icons

linux/icons/hicolor

linux/icons/hicolor/128x128

linux/icons/hicolor/128x128/apps

linux/icons/hicolor/128x128/apps/miro.png

linux/icons/hicolor/24x24

linux/icons/hicolor/24x24/apps

linux/icons/hicolor/24x24/apps/miro.png

linux/icons/hicolor/48x48

linux/icons/hicolor/48x48/apps

linux/icons/hicolor/48x48/apps/miro.png

linux/icons/hicolor/72x72

linux/icons/hicolor/72x72/apps

linux/icons/hicolor/72x72/apps/miro.png

linux/miro.1

linux/miro.desktop

linux/miro.real

linux/miro.xml

linux/miro.xpm

linux/plat

linux/plat/__init__.py

linux/plat/clconverter.py

linux/plat/config.py

linux/plat/frontends

linux/plat/frontends/__init__.py

linux/plat/frontends/widgets

linux/plat/frontends/widgets/__init__.py

linux/plat/frontends/widgets/application.py

linux/plat/frontends/widgets/mediakeys.py

linux/plat/frontends/widgets/prefpanelset.py

linux/plat/frontends/widgets/threads.py

linux/plat/frontends/widgets/timer.py

linux/plat/frontends/widgets/webkitbrowser.py

linux/plat/frontends/widgets/widgetset.py

linux/plat/onetime.py

linux/plat/options.py

linux/plat/renderers

linux/plat/renderers/__init__.py

linux/plat/renderers/gst_extractor.py

linux/plat/renderers/gstreamerrenderer.py

linux/plat/resources.py

linux/plat/screensaver.py

linux/plat/upgrade.py

linux/plat/utils.py

linux/plat/xlibhelper.pyx

linux/pylintrc

linux/run.sh

linux/setup.py

osx/Info.plist

osx/Miro.icns

osx/Miro.py

osx/README

osx/Resources-DMG

osx/Resources-DMG/background.tiff

osx/Resources-DMG/dmg-ds-store

osx/Resources-Widgets

osx/Resources-Widgets/Credits.html

osx/Resources-Widgets/MainMenu.nib

osx/Resources-Widgets/MainMenu.nib/classes.nib

osx/Resources-Widgets/MainMenu.nib/info.nib

osx/Resources-Widgets/MainMenu.nib/objects.nib

osx/Resources-Widgets/OverlayPalette.nib

osx/Resources-Widgets/OverlayPalette.nib/designable.nib

osx/Resources-Widgets/OverlayPalette.nib/keyedobjects.nib

osx/Resources-Widgets/dock_badge_1_2.png

osx/Resources-Widgets/dock_badge_3.png

osx/Resources-Widgets/dock_badge_4.png

osx/Resources-Widgets/dock_badge_5.png

osx/Resources-Widgets/fs-button-enterfullscreen-alt.png

osx/Resources-Widgets/fs-button-enterfullscreen.png

osx/Resources-Widgets/fs-button-exitfullscreen-alt.png

osx/Resources-Widgets/fs-button-exitfullscreen.png

osx/Resources-Widgets/fs-button-next-alt.png

osx/Resources-Widgets/fs-button-next.png

osx/Resources-Widgets/fs-button-pause-alt.png

osx/Resources-Widgets/fs-button-pause.png

osx/Resources-Widgets/fs-button-play-alt.png

osx/Resources-Widgets/fs-button-play.png

osx/Resources-Widgets/fs-button-previous-alt.png

osx/Resources-Widgets/fs-button-previous.png

osx/Resources-Widgets/fs-button-seekback-alt.png

osx/Resources-Widgets/fs-button-seekback.png

osx/Resources-Widgets/fs-button-seekforward-alt.png

osx/Resources-Widgets/fs-button-seekforward.png

osx/Resources-Widgets/fs-button-stop-alt.png

osx/Resources-Widgets/fs-button-stop.png

osx/Resources-Widgets/fs-button-subtitles-alt.png

osx/Resources-Widgets/fs-button-subtitles.png

osx/Resources-Widgets/fs-progress-slider.png

osx/Resources-Widgets/fs-track-progress.png

osx/Resources-Widgets/fs-volume-slider.png

osx/Resources-Widgets/pref_item_conversions.png

osx/Resources-Widgets/pref_item_disk_space.png

osx/Resources-Widgets/pref_item_downloads.png

osx/Resources-Widgets/pref_item_feeds.png

osx/Resources-Widgets/pref_item_folders.png

osx/Resources-Widgets/pref_item_general.png

osx/Resources-Widgets/pref_item_playback.png

osx/Resources-Widgets/search_popup_triangle.png

osx/Resources-Widgets/warmup.mov

osx/binary_kit_version

osx/build.sh

osx/modules

osx/modules/_growl.c

osx/modules/_growlImage.m

osx/modules/idletime.c

osx/modules/keychain.c

osx/modules/qtcomp.c

osx/plat

osx/plat/__init__.py

osx/plat/bundle.py

osx/plat/config.py

osx/plat/filenames.py

osx/plat/frontends

osx/plat/frontends/__init__.py

osx/plat/frontends/widgets

osx/plat/frontends/widgets/__init__.py

osx/plat/frontends/widgets/application.py

osx/plat/frontends/widgets/audio.py

osx/plat/frontends/widgets/base.py

osx/plat/frontends/widgets/browser.py

osx/plat/frontends/widgets/const.py

osx/plat/frontends/widgets/control.py

osx/plat/frontends/widgets/customcontrol.py

osx/plat/frontends/widgets/drawing.py

osx/plat/frontends/widgets/drawingwidgets.py

osx/plat/frontends/widgets/helpers.py

osx/plat/frontends/widgets/layout.py

osx/plat/frontends/widgets/layoutmanager.py

osx/plat/frontends/widgets/mediatypes.py

osx/plat/frontends/widgets/osxmenus.py

osx/plat/frontends/widgets/overlay.py

osx/plat/frontends/widgets/prefpanelset.py

osx/plat/frontends/widgets/quicktime.py

osx/plat/frontends/widgets/rect.py

osx/plat/frontends/widgets/simple.py

osx/plat/frontends/widgets/sniffer.py

osx/plat/frontends/widgets/sparkleupdater.py

osx/plat/frontends/widgets/tablemodel.py

osx/plat/frontends/widgets/tableview.py

osx/plat/frontends/widgets/threads.py

osx/plat/frontends/widgets/timer.py

osx/plat/frontends/widgets/video.py

osx/plat/frontends/widgets/viewport.py

osx/plat/frontends/widgets/widgetset.py

osx/plat/frontends/widgets/window.py

osx/plat/frontends/widgets/wrappermap.py

osx/plat/growl.py

osx/plat/migrateappname.py

osx/plat/resources.py

osx/plat/script_codes.py

osx/plat/utils.py

osx/qt_extractor.py

osx/run.sh

osx/setup.py

osx/setup_binarykit.sh

osx/setup_sandbox.sh

resources/conversions

resources/conversions/android.conv

resources/conversions/apple.conv

resources/conversions/others.conv

resources/images/clear-image.png

resources/images/fullscreen_enter.png

resources/images/fullscreen_exit.png

resources/images/icon-conversions.png

resources/images/icon-conversions_large.png

resources/images/pref-tab-conversions.png

resources/locale/hy.mo

resources/locale/hy.po

resources/locale/kw.mo

resources/locale/kw.po

resources/testdata/httpserver

resources/testdata/httpserver/foo.txt

resources/testdata/httpserver/linux-screen.jpg

resources/testdata/httpserver/redirect.html

resources/testdata/httpserver/test with spaces.txt

resources/testdata/httpserver/test.txt

windows

windows/Miro.ico

windows/Miro.nsi

windows/Miro.py

windows/Miro_Downloader.py

windows/README

windows/binary_kit_version

windows/clean.sh

windows/get_requirements.sh

windows/icons

windows/icons/hicolor

windows/icons/hicolor/128x128

windows/icons/hicolor/128x128/apps

windows/icons/hicolor/128x128/apps/miro.png

windows/miro-install-generic.bmp

windows/miro-install-image.bmp

windows/miro-installer-generic.ico

windows/miro-installer.ico

windows/mirotest.py

windows/moviedata_util.py

windows/overrides

windows/overrides/site.py

windows/plat

windows/plat/__init__.py

windows/plat/clipboard.py

windows/plat/commandline.py

windows/plat/config.py

windows/plat/fontinfo.py

windows/plat/frontends

windows/plat/frontends/__init__.py

windows/plat/frontends/widgets

windows/plat/frontends/widgets/XULRunnerBrowser

windows/plat/frontends/widgets/XULRunnerBrowser/FixFocus.cpp

windows/plat/frontends/widgets/XULRunnerBrowser/FixFocus.h

windows/plat/frontends/widgets/XULRunnerBrowser/Init.cpp

windows/plat/frontends/widgets/XULRunnerBrowser/Init.h

windows/plat/frontends/widgets/XULRunnerBrowser/MiroBrowserEmbed.cpp

windows/plat/frontends/widgets/XULRunnerBrowser/MiroBrowserEmbed.h

windows/plat/frontends/widgets/XULRunnerBrowser/MiroWindowCreator.cpp

windows/plat/frontends/widgets/XULRunnerBrowser/MiroWindowCreator.h

windows/plat/frontends/widgets/XULRunnerBrowser/xulrunnerbrowser.pyx

windows/plat/frontends/widgets/__init__.py

windows/plat/frontends/widgets/application.py

windows/plat/frontends/widgets/browser.py

windows/plat/frontends/widgets/flash.py

windows/plat/frontends/widgets/prefpanelset.py

windows/plat/frontends/widgets/threads.py

windows/plat/frontends/widgets/timer.py

windows/plat/frontends/widgets/update.py

windows/plat/frontends/widgets/widgetset.py

windows/plat/migrateappname.py

windows/plat/options.py

windows/plat/pipeipc.py

windows/plat/prelogger.py

windows/plat/proxyfind.py

windows/plat/pyxpcomcalls.py

windows/plat/renderers

windows/plat/renderers/__init__.py

windows/plat/renderers/vlc.py

windows/plat/resources.py

windows/plat/screensaver.py

windows/plat/specialfolders.py

windows/plat/utils.py

windows/plat/xulhelper.py

windows/run.sh

windows/setup.py

windows/setup_binarykit.sh

windows/test.sh

windows/zugo-silent.exe

files removed:
.pc/100_catch_keyerror_in_update_items.patch/portable

.pc/100_catch_keyerror_in_update_items.patch/portable/frontends

.pc/100_catch_keyerror_in_update_items.patch/portable/frontends/widgets

.pc/100_catch_keyerror_in_update_items.patch/portable/frontends/widgets/itemlist.py

.pc/101_player_undefined_elapsed_time.patch

.pc/101_player_undefined_elapsed_time.patch/portable

.pc/101_player_undefined_elapsed_time.patch/portable/player.py

.pc/10_movies_dir.patch/platform

.pc/10_movies_dir.patch/platform/gtk-x11

.pc/10_movies_dir.patch/platform/gtk-x11/plat

.pc/10_movies_dir.patch/platform/gtk-x11/plat/config.py

.pc/10_movies_dir.patch/platform/gtk-x11/plat/upgrade.py

.pc/20_no_autoupdate.patch

.pc/20_no_autoupdate.patch/portable

.pc/20_no_autoupdate.patch/portable/startup.py

.pc/50_miro_debug_fix.patch/platform

.pc/50_miro_debug_fix.patch/platform/gtk-x11

.pc/50_miro_debug_fix.patch/platform/gtk-x11/setup.py

debian/patches/101_player_undefined_elapsed_time.patch

debian/patches/20_no_autoupdate.patch

notes

notes/vlc-packages.mak

platform

platform/gtk-x11

platform/gtk-x11/Makefile

platform/gtk-x11/README

platform/gtk-x11/icons

platform/gtk-x11/icons/hicolor

platform/gtk-x11/icons/hicolor/128x128

platform/gtk-x11/icons/hicolor/128x128/apps

platform/gtk-x11/icons/hicolor/128x128/apps/miro.png

platform/gtk-x11/icons/hicolor/24x24

platform/gtk-x11/icons/hicolor/24x24/apps

platform/gtk-x11/icons/hicolor/24x24/apps/miro.png

platform/gtk-x11/icons/hicolor/48x48

platform/gtk-x11/icons/hicolor/48x48/apps

platform/gtk-x11/icons/hicolor/48x48/apps/miro.png

platform/gtk-x11/icons/hicolor/72x72

platform/gtk-x11/icons/hicolor/72x72/apps

platform/gtk-x11/icons/hicolor/72x72/apps/miro.png

platform/gtk-x11/miro.1

platform/gtk-x11/miro.desktop

platform/gtk-x11/miro.real

platform/gtk-x11/miro.xml

platform/gtk-x11/miro.xpm

platform/gtk-x11/plat

platform/gtk-x11/plat/__init__.py

platform/gtk-x11/plat/config.py

platform/gtk-x11/plat/frontends

platform/gtk-x11/plat/frontends/__init__.py

platform/gtk-x11/plat/frontends/widgets

platform/gtk-x11/plat/frontends/widgets/__init__.py

platform/gtk-x11/plat/frontends/widgets/application.py

platform/gtk-x11/plat/frontends/widgets/mediakeys.py

platform/gtk-x11/plat/frontends/widgets/prefpanelset.py

platform/gtk-x11/plat/frontends/widgets/threads.py

platform/gtk-x11/plat/frontends/widgets/timer.py

platform/gtk-x11/plat/frontends/widgets/webkitbrowser.py

platform/gtk-x11/plat/frontends/widgets/widgetset.py

platform/gtk-x11/plat/idletime.py

platform/gtk-x11/plat/onetime.py

platform/gtk-x11/plat/options.py

platform/gtk-x11/plat/renderers

platform/gtk-x11/plat/renderers/__init__.py

platform/gtk-x11/plat/renderers/gst_extractor.py

platform/gtk-x11/plat/renderers/gstreamerrenderer.py

platform/gtk-x11/plat/resources.py

platform/gtk-x11/plat/screensaver.py

platform/gtk-x11/plat/upgrade.py

platform/gtk-x11/plat/utils.py

platform/gtk-x11/plat/xlibhelper.pyx

platform/gtk-x11/pylintrc

platform/gtk-x11/run.sh

platform/gtk-x11/setup.py

platform/osx

platform/osx/Info.plist

platform/osx/Miro.icns

platform/osx/Miro.py

platform/osx/README

platform/osx/Resources-DMG

platform/osx/Resources-DMG/background.tiff

platform/osx/Resources-DMG/dmg-ds-store

platform/osx/Resources-Widgets

platform/osx/Resources-Widgets/Credits.html

platform/osx/Resources-Widgets/MainMenu.nib

platform/osx/Resources-Widgets/MainMenu.nib/classes.nib

platform/osx/Resources-Widgets/MainMenu.nib/info.nib

platform/osx/Resources-Widgets/MainMenu.nib/objects.nib

platform/osx/Resources-Widgets/OverlayPalette.nib

platform/osx/Resources-Widgets/OverlayPalette.nib/designable.nib

platform/osx/Resources-Widgets/OverlayPalette.nib/keyedobjects.nib

platform/osx/Resources-Widgets/dock_badge_1_2.png

platform/osx/Resources-Widgets/dock_badge_3.png

platform/osx/Resources-Widgets/dock_badge_4.png

platform/osx/Resources-Widgets/dock_badge_5.png

platform/osx/Resources-Widgets/fs-button-enterfullscreen-alt.png

platform/osx/Resources-Widgets/fs-button-enterfullscreen.png

platform/osx/Resources-Widgets/fs-button-exitfullscreen-alt.png

platform/osx/Resources-Widgets/fs-button-exitfullscreen.png

platform/osx/Resources-Widgets/fs-button-next-alt.png

platform/osx/Resources-Widgets/fs-button-next.png

platform/osx/Resources-Widgets/fs-button-pause-alt.png

platform/osx/Resources-Widgets/fs-button-pause.png

platform/osx/Resources-Widgets/fs-button-play-alt.png

platform/osx/Resources-Widgets/fs-button-play.png

platform/osx/Resources-Widgets/fs-button-previous-alt.png

platform/osx/Resources-Widgets/fs-button-previous.png

platform/osx/Resources-Widgets/fs-button-seekback-alt.png

platform/osx/Resources-Widgets/fs-button-seekback.png

platform/osx/Resources-Widgets/fs-button-seekforward-alt.png

platform/osx/Resources-Widgets/fs-button-seekforward.png

platform/osx/Resources-Widgets/fs-button-stop-alt.png

platform/osx/Resources-Widgets/fs-button-stop.png

platform/osx/Resources-Widgets/fs-button-subtitles-alt.png

platform/osx/Resources-Widgets/fs-button-subtitles.png

platform/osx/Resources-Widgets/fs-progress-slider.png

platform/osx/Resources-Widgets/fs-track-progress.png

platform/osx/Resources-Widgets/fs-volume-slider.png

platform/osx/Resources-Widgets/pref_item_disk_space.png

platform/osx/Resources-Widgets/pref_item_downloads.png

platform/osx/Resources-Widgets/pref_item_feeds.png

platform/osx/Resources-Widgets/pref_item_folders.png

platform/osx/Resources-Widgets/pref_item_general.png

platform/osx/Resources-Widgets/pref_item_playback.png

platform/osx/Resources-Widgets/search_popup_triangle.png

platform/osx/Resources-Widgets/warmup.mov

platform/osx/binary_kit_version

platform/osx/build.sh

platform/osx/modules

platform/osx/modules/_growl.c

platform/osx/modules/_growlImage.m

platform/osx/modules/idletime.c

platform/osx/modules/keychain.c

platform/osx/modules/qtcomp.c

platform/osx/modules/shading.m

platform/osx/patch_objc_module.sh

platform/osx/plat

platform/osx/plat/__init__.py

platform/osx/plat/bundle.py

platform/osx/plat/config.py

platform/osx/plat/filenames.py

platform/osx/plat/frontends

platform/osx/plat/frontends/__init__.py

platform/osx/plat/frontends/widgets

platform/osx/plat/frontends/widgets/__init__.py

platform/osx/plat/frontends/widgets/application.py

platform/osx/plat/frontends/widgets/audio.py

platform/osx/plat/frontends/widgets/base.py

platform/osx/plat/frontends/widgets/browser.py

platform/osx/plat/frontends/widgets/const.py

platform/osx/plat/frontends/widgets/control.py

platform/osx/plat/frontends/widgets/customcontrol.py

platform/osx/plat/frontends/widgets/drawing.py

platform/osx/plat/frontends/widgets/drawingwidgets.py

platform/osx/plat/frontends/widgets/helpers.py

platform/osx/plat/frontends/widgets/layout.py

platform/osx/plat/frontends/widgets/layoutmanager.py

platform/osx/plat/frontends/widgets/mediatypes.py

platform/osx/plat/frontends/widgets/osxmenus.py

platform/osx/plat/frontends/widgets/overlay.py

platform/osx/plat/frontends/widgets/prefpanelset.py

platform/osx/plat/frontends/widgets/quicktime.py

platform/osx/plat/frontends/widgets/rect.py

platform/osx/plat/frontends/widgets/simple.py

platform/osx/plat/frontends/widgets/sniffer.py

platform/osx/plat/frontends/widgets/sparkleupdater.py

platform/osx/plat/frontends/widgets/tablemodel.py

platform/osx/plat/frontends/widgets/tableview.py

platform/osx/plat/frontends/widgets/threads.py

platform/osx/plat/frontends/widgets/timer.py

platform/osx/plat/frontends/widgets/video.py

platform/osx/plat/frontends/widgets/viewport.py

platform/osx/plat/frontends/widgets/widgetset.py

platform/osx/plat/frontends/widgets/window.py

platform/osx/plat/frontends/widgets/wrappermap.py

platform/osx/plat/growl.py

platform/osx/plat/migrateappname.py

platform/osx/plat/resources.py

platform/osx/plat/script_codes.py

platform/osx/plat/utils.py

platform/osx/qt_extractor.py

platform/osx/run.sh

platform/osx/setup.py

platform/osx/setup_binarykit.sh

platform/osx/setup_sandbox.sh

platform/osx/setup_sandbox_10.4.sh

platform/osx/test

platform/osx/test/setup-unittests.py

platform/osx/test/unittests.py

platform/osx/test/unittests.sh

platform/windows-xul

platform/windows-xul/Miro.ico

platform/windows-xul/Miro.nsi

platform/windows-xul/Miro.py

platform/windows-xul/Miro_Downloader.py

platform/windows-xul/README

platform/windows-xul/binary_kit_version

platform/windows-xul/clean.sh

platform/windows-xul/icons

platform/windows-xul/icons/hicolor

platform/windows-xul/icons/hicolor/128x128

platform/windows-xul/icons/hicolor/128x128/apps

platform/windows-xul/icons/hicolor/128x128/apps/miro.png

platform/windows-xul/miro-install-generic.bmp

platform/windows-xul/miro-install-image.bmp

platform/windows-xul/miro-installer-generic.ico

platform/windows-xul/miro-installer.ico

platform/windows-xul/mirotest.py

platform/windows-xul/moviedata_util.py

platform/windows-xul/overrides

platform/windows-xul/overrides/site.py

platform/windows-xul/plat

platform/windows-xul/plat/__init__.py

platform/windows-xul/plat/clipboard.py

platform/windows-xul/plat/commandline.py

platform/windows-xul/plat/config.py

platform/windows-xul/plat/frontends

platform/windows-xul/plat/frontends/__init__.py

platform/windows-xul/plat/frontends/widgets

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/FixFocus.cpp

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/FixFocus.h

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/Init.cpp

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/Init.h

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/MiroBrowserEmbed.cpp

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/MiroBrowserEmbed.h

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/MiroWindowCreator.cpp

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/MiroWindowCreator.h

platform/windows-xul/plat/frontends/widgets/XULRunnerBrowser/xulrunnerbrowser.pyx

platform/windows-xul/plat/frontends/widgets/__init__.py

platform/windows-xul/plat/frontends/widgets/application.py

platform/windows-xul/plat/frontends/widgets/browser.py

platform/windows-xul/plat/frontends/widgets/flash.py

platform/windows-xul/plat/frontends/widgets/prefpanelset.py

platform/windows-xul/plat/frontends/widgets/threads.py

platform/windows-xul/plat/frontends/widgets/timer.py

platform/windows-xul/plat/frontends/widgets/update.py

platform/windows-xul/plat/frontends/widgets/widgetset.py

platform/windows-xul/plat/idletime.py

platform/windows-xul/plat/migrateappname.py

platform/windows-xul/plat/miro_urlparse.py

platform/windows-xul/plat/options.py

platform/windows-xul/plat/pipeipc.py

platform/windows-xul/plat/prelogger.py

platform/windows-xul/plat/proxyfind.py

platform/windows-xul/plat/pyxpcomcalls.py

platform/windows-xul/plat/renderers

platform/windows-xul/plat/renderers/__init__.py

platform/windows-xul/plat/renderers/vlc.py

platform/windows-xul/plat/resources.py

platform/windows-xul/plat/screensaver.py

platform/windows-xul/plat/specialfolders.py

platform/windows-xul/plat/utils.py

platform/windows-xul/plat/xulhelper.py

platform/windows-xul/run.sh

platform/windows-xul/setup.py

platform/windows-xul/setup_binarykit.sh

platform/windows-xul/test.sh

portable

portable/__init__.py

portable/adscraper.py

portable/app.py

portable/appconfig.py

portable/autodiscover.py

portable/autodler.py

portable/autoupdate.py

portable/clock.py

portable/commandline.py

portable/config.py

portable/controller.py

portable/convert20database.py

portable/database.py

portable/databasehelper.py

portable/databaselog.py

portable/databasesanity.py

portable/databaseupgrade.py

portable/datastructures.py

portable/dbupgradeprogress.py

portable/dialogs.py

portable/displaytext.py

portable/dl_daemon

portable/dl_daemon/Democracy_Downloader.py

portable/dl_daemon/__init__.py

portable/dl_daemon/command.py

portable/dl_daemon/daemon.py

portable/dl_daemon/download.py

portable/dl_daemon/private

portable/dl_daemon/private/__init__.py

portable/dl_daemon/private/config.py

portable/dl_daemon/private/httpauth.py

portable/dl_daemon/private/resources.py

portable/download_utils.py

portable/downloader.py

portable/eventloop.py

portable/fasttypes.c

portable/feed.py

portable/feedparser.py

portable/feedparserutil.py

portable/feedupdate.py

portable/filetypes.py

portable/fileutil.py

portable/flashscraper.py

portable/folder.py

portable/frontends

portable/frontends/__init__.py

portable/frontends/cli

portable/frontends/cli/README

portable/frontends/cli/__init__.py

portable/frontends/cli/application.py

portable/frontends/cli/clidialog.py

portable/frontends/cli/events.py

portable/frontends/cli/interpreter.py

portable/frontends/cli/util.py

portable/frontends/shell

portable/frontends/shell/__init__.py

portable/frontends/shell/application.py

portable/frontends/widgets

portable/frontends/widgets/__init__.py

portable/frontends/widgets/addtoplaylistdialog.py

portable/frontends/widgets/application.py

portable/frontends/widgets/browser.py

portable/frontends/widgets/cellpack.py

portable/frontends/widgets/crashdialog.py

portable/frontends/widgets/diagnostics.py

portable/frontends/widgets/dialogs.py

portable/frontends/widgets/dialogwidgets.py

portable/frontends/widgets/displays.py

portable/frontends/widgets/downloadscontroller.py

portable/frontends/widgets/feedcontroller.py

portable/frontends/widgets/feedsettingspanel.py

portable/frontends/widgets/firsttimedialog.py

portable/frontends/widgets/gtk

portable/frontends/widgets/gtk/__init__.py

portable/frontends/widgets/gtk/audio.py

portable/frontends/widgets/gtk/base.py

portable/frontends/widgets/gtk/const.py

portable/frontends/widgets/gtk/controls.py

portable/frontends/widgets/gtk/customcontrols.py

portable/frontends/widgets/gtk/drawing.py

portable/frontends/widgets/gtk/fontsize.py

portable/frontends/widgets/gtk/keymap.py

portable/frontends/widgets/gtk/layout.py

portable/frontends/widgets/gtk/layoutmanager.py

portable/frontends/widgets/gtk/persistentwindow.py

portable/frontends/widgets/gtk/preferenceswindow.py

portable/frontends/widgets/gtk/pygtkhacks.pyx

portable/frontends/widgets/gtk/searchentry.py

portable/frontends/widgets/gtk/simple.py

portable/frontends/widgets/gtk/sniffer.py

portable/frontends/widgets/gtk/tableview.py

portable/frontends/widgets/gtk/textlayout.py

portable/frontends/widgets/gtk/threads.py

portable/frontends/widgets/gtk/timer.py

portable/frontends/widgets/gtk/trayicon.py

portable/frontends/widgets/gtk/video.py

portable/frontends/widgets/gtk/weakconnect.py

portable/frontends/widgets/gtk/widgets.py

portable/frontends/widgets/gtk/widgetset.py

portable/frontends/widgets/gtk/window.py

portable/frontends/widgets/gtk/wrappermap.py

portable/frontends/widgets/gtk/xpcom

portable/frontends/widgets/gtk/xpcom/HttpObserver.cc

portable/frontends/widgets/gtk/xpcom/HttpObserver.h

portable/frontends/widgets/imagebutton.py

portable/frontends/widgets/imagepool.py

portable/frontends/widgets/itemcontextmenu.py

portable/frontends/widgets/itemedit.py

portable/frontends/widgets/itemlist.py

portable/frontends/widgets/itemlistcontroller.py

portable/frontends/widgets/itemlistwidgets.py

portable/frontends/widgets/linkhandler.py

portable/frontends/widgets/menus.py

portable/frontends/widgets/newfeed.py

portable/frontends/widgets/newfolder.py

portable/frontends/widgets/newsearchfeed.py

portable/frontends/widgets/playback.py

portable/frontends/widgets/playlist.py

portable/frontends/widgets/prefpanel.py

portable/frontends/widgets/quitwhiledownloading.py

portable/frontends/widgets/removefeeds.py

portable/frontends/widgets/rundialog.py

portable/frontends/widgets/search.py

portable/frontends/widgets/searchbox.py

portable/frontends/widgets/segmented.py

portable/frontends/widgets/separator.py

portable/frontends/widgets/statictabs.py

portable/frontends/widgets/style.py

portable/frontends/widgets/tablist.py

portable/frontends/widgets/tablistmanager.py

portable/frontends/widgets/util.py

portable/frontends/widgets/videobox.py

portable/frontends/widgets/watchedfolders.py

portable/frontends/widgets/widgetconst.py

portable/frontends/widgets/widgetutil.py

portable/frontends/widgets/window.py

portable/frontendstate.py

portable/gtcache.py

portable/guide.py

portable/httpauth.py

portable/httpclient.py

portable/iconcache.py

portable/iso_639.py

portable/item.py

portable/messagehandler.py

portable/messages.py

portable/models.py

portable/moviedata.py

portable/opml.py

portable/player.py

portable/playlist.py

portable/prefs.py

portable/schema.py

portable/schemav79.py

portable/search.py

portable/searchengines.py

portable/signals.py

portable/singleclick.py

portable/startup.py

portable/storedatabase.py

portable/subscription.py

portable/tabs.py

portable/test

portable/test/__init__.py

portable/test/databasesanitytest.py

portable/test/databasetest.py

portable/test/datastructurestest.py

portable/test/feedparsertest.py

portable/test/feedtest.py

portable/test/filetypestest.py

portable/test/framework.py

portable/test/gtcachetest.py

portable/test/httpclienttest.py

portable/test/httpdownloadertest.py

portable/test/iconcachetest.py

portable/test/itemtest.py

portable/test/messagetest.py

portable/test/parseurltest.py

portable/test/playlisttest.py

portable/test/schedulertest.py

portable/test/schematest.py

portable/test/signalstest.py

portable/test/sparkletest.py

portable/test/storedatabasetest.py

portable/test/strippertest.py

portable/test/subscriptiontest.py

portable/test/unicodetest.py

portable/test/utiltest.py

portable/test/xhtmltest.py

portable/theme.py

portable/trapcall.py

portable/u3info.py

portable/util.py

portable/xhtmltools.py

files modified:
.pc/applied-patches

ADOPTERS

CREDITS

LAYOUT

README

debian/README.Debian

debian/changelog

debian/control

debian/patches/100_catch_keyerror_in_update_items.patch

debian/patches/10_movies_dir.patch

debian/patches/50_miro_debug_fix.patch

debian/patches/series

debian/rules

resources/app.config.template

resources/locale/README

resources/locale/af.mo

resources/locale/af.po

resources/locale/ar.mo

resources/locale/ar.po

resources/locale/be.mo

resources/locale/be.po

resources/locale/bg.mo

resources/locale/bg.po

resources/locale/bn.mo

resources/locale/bn.po

resources/locale/br.mo

resources/locale/br.po

resources/locale/bs.mo

resources/locale/bs.po

resources/locale/ca.mo

resources/locale/ca.po

resources/locale/ckb.mo

resources/locale/ckb.po

resources/locale/cs.mo

resources/locale/cs.po

resources/locale/csb.mo

resources/locale/csb.po

resources/locale/cy.mo

resources/locale/cy.po

resources/locale/da.mo

resources/locale/da.po

resources/locale/de.mo

resources/locale/de.po

resources/locale/el.mo

resources/locale/el.po

resources/locale/en_AU.mo

resources/locale/en_AU.po

resources/locale/en_CA.mo

resources/locale/en_CA.po

resources/locale/en_GB.mo

resources/locale/en_GB.po

resources/locale/eo.mo

resources/locale/eo.po

resources/locale/es.mo

resources/locale/es.po

resources/locale/et.mo

resources/locale/et.po

resources/locale/eu.mo

resources/locale/eu.po

resources/locale/export-strings.sh

resources/locale/fa.mo

resources/locale/fa.po

resources/locale/fi.mo

resources/locale/fi.po

resources/locale/fil.mo

resources/locale/fil.po

resources/locale/fo.mo

resources/locale/fo.po

resources/locale/fr.mo

resources/locale/fr.po

resources/locale/fy.mo

resources/locale/fy.po

resources/locale/ga.mo

resources/locale/ga.po

resources/locale/gl.mo

resources/locale/gl.po

resources/locale/gu.mo

resources/locale/gu.po

resources/locale/he.mo

resources/locale/he.po

resources/locale/hi.mo

resources/locale/hi.po

resources/locale/hr.mo

resources/locale/hr.po

resources/locale/hu.mo

resources/locale/hu.po

resources/locale/id.mo

resources/locale/id.po

resources/locale/import-translations.py

resources/locale/is.mo

resources/locale/is.po

resources/locale/it.mo

resources/locale/it.po

resources/locale/ja.mo

resources/locale/ja.po

resources/locale/ka.mo

resources/locale/ka.po

resources/locale/kk.mo

resources/locale/kk.po

resources/locale/km.mo

resources/locale/km.po

resources/locale/kn.mo

resources/locale/kn.po

resources/locale/ko.mo

resources/locale/ko.po

resources/locale/ku.mo

resources/locale/ku.po

resources/locale/lb.mo

resources/locale/lb.po

resources/locale/lt.mo

resources/locale/lt.po

resources/locale/lv.mo

resources/locale/lv.po

resources/locale/messages.pot

resources/locale/mk.mo

resources/locale/mk.po

resources/locale/ml.mo

resources/locale/ml.po

resources/locale/mr.mo

resources/locale/mr.po

resources/locale/ms.mo

resources/locale/ms.po

resources/locale/mt.mo

resources/locale/mt.po

resources/locale/nb.mo

resources/locale/nb.po

resources/locale/nds.mo

resources/locale/nds.po

resources/locale/ne.mo

resources/locale/ne.po

resources/locale/nl.mo

resources/locale/nl.po

resources/locale/nn.mo

resources/locale/nn.po

resources/locale/oc.mo

resources/locale/oc.po

resources/locale/pa.mo

resources/locale/pa.po

resources/locale/pl.mo

resources/locale/pl.po

resources/locale/pt.mo

resources/locale/pt.po

resources/locale/pt_BR.mo

resources/locale/pt_BR.po

resources/locale/ro.mo

resources/locale/ro.po

resources/locale/ru.mo

resources/locale/ru.po

resources/locale/si.mo

resources/locale/si.po

resources/locale/sk.mo

resources/locale/sk.po

resources/locale/sl.mo

resources/locale/sl.po

resources/locale/sq.mo

resources/locale/sq.po

resources/locale/sr.mo

resources/locale/sr.po

resources/locale/sv.mo

resources/locale/sv.po

resources/locale/ta.mo

resources/locale/ta.po

resources/locale/te.mo

resources/locale/te.po

resources/locale/th.mo

resources/locale/th.po

resources/locale/tl.mo

resources/locale/tl.po

resources/locale/tr.mo

resources/locale/tr.po

resources/locale/uk.mo

resources/locale/uk.po

resources/locale/ur.mo

resources/locale/ur.po

resources/locale/vi.mo

resources/locale/vi.po

resources/locale/zh_CN.mo

resources/locale/zh_CN.po

resources/locale/zh_HK.mo

resources/locale/zh_HK.po

resources/locale/zh_TW.mo

resources/locale/zh_TW.po

resources/locale/zu.mo

resources/locale/zu.po

resources/testdata/stripperdata/README

Show diffs side-by-side

added added

removed removed

lib/feed.py

# Miro - an RSS based video player application

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA

# In addition, as a special exception, the copyright holders give

# permission to link the code of portions of this program with the OpenSSL

# library.

# You must obey the GNU General Public License in all respects for all of

# the code used other than OpenSSL. If you modify file(s) with this

# exception, you may extend this exception to your version of the file(s),

# but you are not obligated to do so. If you do not wish to do so, delete

# this exception statement from your version. If you delete this exception

# statement from all source files in the program, then also delete it here.

"""``miro.feed`` -- Holds ``Feed`` class and related things.

FIXME - talk about Feed architecture here

"""

from HTMLParser import HTMLParser, HTMLParseError

from cStringIO import StringIO

from datetime import datetime, timedelta

from miro.gtcache import gettext as _

from miro.feedparser import FeedParserDict

from urlparse import urljoin

from miro.xhtmltools import (unescape, xhtmlify, fix_xml_header,

fix_html_header, urlencode)

import os

import re

import xml

from miro.database import DDBObject, ObjectNotFoundError

from miro.httpclient import grab_url

from miro import app

from miro import autodler

from miro import config

from miro import iconcache

from miro import databaselog

from miro import dialogs

from miro import download_utils

from miro import eventloop

from miro import feedupdate

from miro import flashscraper

from miro import models

from miro import prefs

from miro.plat import resources

from miro import downloader

from miro.util import (returns_unicode, returns_filename, unicodify, check_u,

check_f, quote_unicode_url, escape, to_uni,

is_url, stringify)

from miro import fileutil

from miro.plat.utils import filename_to_unicode, make_url_safe, unmake_url_safe

from miro import filetypes

from miro.item import FeedParserValues

from miro import searchengines

import logging

from miro.clock import clock

WHITESPACE_PATTERN = re.compile(r"^[ \t\r\n]*$")

DEFAULT_FEED_ICON = "images/feedicon.png"

DEFAULT_FEED_ICON_TABLIST = "images/icon-rss.png"

@returns_unicode

def default_feed_icon_url():

return resources.url(DEFAULT_FEED_ICON)

def default_feed_icon_path():

return resources.path(DEFAULT_FEED_ICON)

def default_tablist_feed_icon_path():

return resources.path(DEFAULT_FEED_ICON_TABLIST)

# Notes on character set encoding of feeds:

# The parsing libraries built into Python mostly use byte strings

# instead of unicode strings. However, sometimes they get "smart" and

# try to convert the byte stream to a unicode stream automatically.

# What does what when isn't clearly documented

# We use the function to_uni() to fix those smart conversions

# If you run into Unicode crashes, adding that function in the

# appropriate place should fix it.

100

101

# Universal Feed Parser http://feedparser.org/

102

# Licensed under Python license

103

from miro import feedparser

104

105

def add_feed_from_file(fn):

106

"""Adds a new feed using USM

107

"""

108

check_f(fn)

109

d = feedparser.parse(fn)

110

if d.feed.has_key('links'):

111

for link in d.feed['links']:

112

if link['rel'] == 'start' or link['rel'] == 'self':

113

Feed(link['href'])

114

return

115

if d.feed.has_key('link'):

116

add_feed_from_web_page(d.feed.link)

117

118

def add_feed_from_web_page(url):

119

"""Adds a new feed based on a link tag in a web page

120

"""

121

check_u(url)

122

def callback(info):

123

url = HTMLFeedURLParser().get_link(info['updated-url'], info['body'])

124

if url:

125

Feed(url)

126

def errback(error):

127

logging.warning ("unhandled error in add_feed_from_web_page: %s", error)

128

grab_url(url, callback, errback)

129

130

FILE_MATCH_RE = re.compile(r"^file://.")

131

SEARCH_URL_MATCH_RE = re.compile('^dtv:savedsearch/(.*)\?q=(.*)')

132

133

def validate_feed_url(url):

134

"""URL validitation and normalization

135

"""

136

check_u(url)

137

if is_url(url):

138

return True

139

if FILE_MATCH_RE.match(url) is not None:

140

return True

141

return False

142

143

def normalize_feed_url(url):

144

check_u(url)

145

# Valid URL are returned as-is

146

if validate_feed_url(url):

147

return url

148

149

originalURL = url

150

url = url.strip()

151

152

# Check valid schemes with invalid separator

153

match = re.match(r"^(http|https):/*(.*)$", url)

154

if match is not None:

155

url = "%s://%s" % match.group(1, 2)

156

157

# Replace invalid schemes by http

158

match = re.match(r"^(([A-Za-z]*):/*)*(.*)$", url)

159

if match and match.group(2) in ['feed', 'podcast', 'fireant', None]:

160

url = "http://%s" % match.group(3)

161

elif match and match.group(1) == 'feeds':

162

url = "https://%s" % match.group(3)

163

164

# Make sure there is a leading / character in the path

165

match = re.match(r"^(http|https)://[^/]*$", url)

166

if match is not None:

167

url = url + "/"

168

169

url = quote_unicode_url(url)

170

171

if not validate_feed_url(url):

172

logging.info ("unable to normalize URL %s", originalURL)

173

return originalURL

174

else:

175

return url

176

177

def make_search_url(engine, term):

178

"""Create a URL for a search feed.

179

"""

180

return u'dtv:savedsearch/%s?q=%s' % (engine, term)

181

182

def _config_change(key, value):

183

"""Handle configuration changes so we can update feed update frequencies

184

"""

185

if key is prefs.CHECK_CHANNELS_EVERY_X_MN.key:

186

for feed in Feed.make_view():

187

update_freq = 0

188

try:

189

update_freq = feed.parsed["feed"]["ttl"]

190

except (AttributeError, KeyError):

191

pass

192

feed.set_update_frequency(update_freq)

193

194

config.add_change_callback(_config_change)

195

196

# Wait X seconds before updating the feeds at startup

197

INITIAL_FEED_UPDATE_DELAY = 5.0

198

199

class FeedImpl(DDBObject):

200

"""Actual implementation of a basic feed.

201

"""

202

def setup_new(self, url, ufeed, title=None):

203

check_u(url)

204

if title:

205

check_u(title)

206

self.url = url

207

self.ufeed = ufeed

208

self.ufeed_id = ufeed.id

209

self.title = title

210

self.created = datetime.now()

211

self.updating = False

212

self.thumbURL = None

213

self.initialUpdate = True

214

self.updateFreq = config.get(prefs.CHECK_CHANNELS_EVERY_X_MN) * 60

215

216

@classmethod

217

def orphaned_view(cls):

218

table_name = app.db.table_name(cls)

219

return cls.make_view("feed.id is NULL",

220

joins={'feed': 'feed.feed_impl_id=%s.id' % table_name})

221

222

def _get_items(self):

223

return self.ufeed.items

224

items = property(_get_items)

225

226

def on_signal_change(self):

227

self.ufeed.signal_change()

228

229

@returns_unicode

230

def get_base_href(self):

231

"""Get a URL to use in the <base> tag for this channel. This is used

232

for relative links in this channel's items.

233

"""

234

return escape(self.url)

235

236

def set_update_frequency(self, frequency):

237

"""Sets the update frequency (in minutes).

238

A frequency of -1 means that auto-update is disabled.

239

"""

240

try:

241

frequency = int(frequency)

242

except ValueError:

243

frequency = -1

244

245

if frequency < 0:

246

self.cancel_update_events()

247

self.updateFreq = -1

248

else:

249

new_freq = max(config.get(prefs.CHECK_CHANNELS_EVERY_X_MN), frequency) * 60

250

if new_freq != self.updateFreq:

251

self.updateFreq = new_freq

252

self.schedule_update_events(-1)

253

self.ufeed.signal_change()

254

255

def schedule_update_events(self, firstTriggerDelay):

256

self.cancel_update_events()

257

if firstTriggerDelay >= 0:

258

self.scheduler = eventloop.add_timeout(firstTriggerDelay, self.update, "Feed update (%s)" % self.get_title())

259

else:

260

if self.updateFreq > 0:

261

self.scheduler = eventloop.add_timeout(self.updateFreq, self.update, "Feed update (%s)" % self.get_title())

262

263

def cancel_update_events(self):

264

if hasattr(self, 'scheduler') and self.scheduler is not None:

265

self.scheduler.cancel()

266

self.scheduler = None

267

268

def update(self):

269

"""Subclasses should override this

270

"""

271

self.schedule_update_events(-1)

272

273

def default_thumbnail_path(self):

274

"""Get the path to our thumbnail when there isn't a downloaded icon"""

275

return default_feed_icon_path()

276

277

@returns_unicode

278

def get_title(self):

279

"""Returns the title of the feed

280

"""

281

try:

282

title = self.title

283

if title is None or WHITESPACE_PATTERN.match(title):

284

if self.ufeed.baseTitle is not None:

285

title = self.ufeed.baseTitle

286

else:

287

title = self.url

288

return title

289

except AttributeError:

290

return u""

291

292

@returns_unicode

293

def get_url(self):

294

"""Returns the URL of the feed

295

"""

296

return self.url

297

298

@returns_unicode

299

def get_base_url(self):

300

"""Returns the URL of the feed

301

"""

302

try:

303

return self.url

304

except AttributeError:

305

return u""

306

307

@returns_unicode

308

def get_link(self):

309

"""Returns a link to a webpage associated with the feed

310

"""

311

return self.ufeed.get_base_href()

312

313

@returns_unicode

314

def get_thumbnail_url(self):

315

"""Returns the URL of a thumbnail associated with the feed

316

"""

317

return self.thumbURL

318

319

@returns_unicode

320

def get_license(self):

321

"""Returns URL of license assocaited with the feed

322

"""

323

return u""

324

325

def setup_restored(self):

326

self.updating = False

327

328

def remove(self):

329

self.on_remove()

330

DDBObject.remove(self)

331

332

def on_remove(self):

333

"""Called when the feed uses this FeedImpl is removed from the DB.

334

subclasses can perform cleanup here."""

335

pass

336

337

def __str__(self):

338

return "%s - %s" % (self.__class__.__name__, stringify(self.get_title()))

339

340

def clean_old_items(self):

341

"""

342

Called to remove old items which are no longer in the feed.

343

344

Items that are currently in the feed should always be kept.

345

"""

346

pass

347

348

class Feed(DDBObject, iconcache.IconCacheOwnerMixin):

349

"""This class is a magic class that can become any type of feed it wants

350

351

It works by passing on attributes to the actual feed.

352

"""

353

ICON_CACHE_VITAL = True

354

355

def setup_new(self, url, initiallyAutoDownloadable=None,

356

section=u'video', search_term=None, title=None):

357

check_u(url)

358

if initiallyAutoDownloadable == None:

359

mode = config.get(prefs.CHANNEL_AUTO_DEFAULT)

360

# note that this is somewhat duplicated in

361

# set_auto_download_mode

362

if mode == u'all':

363

self.getEverything = True

364

self.autoDownloadable = True

365

elif mode == u'new':

366

self.getEverything = False

367

self.autoDownloadable = True

368

elif mode == u'off':

369

self.getEverything = False

370

self.autoDownloadable = False

371

else:

372

raise ValueError("Bad auto-download mode: %s" % mode)

373

374

else:

375

self.autoDownloadable = initiallyAutoDownloadable

376

self.getEverything = False

377

378

self.section = section

379

self.maxNew = 3

380

self.maxOldItems = None

381

self.expire = u"system"

382

self.expireTime = None

383

self.fallBehind = -1

384

self.last_viewed = datetime.min

385

386

self.baseTitle = None

387

self.origURL = url

388

self.errorState = False

389

self.loading = True

390

self._actualFeed = None

391

self._set_feed_impl(FeedImpl(url, self, title))

392

self.setup_new_icon_cache()

393

self.informOnError = True

394

self.folder_id = None

395

self.searchTerm = search_term

396

self.userTitle = None

397

self.visible = True

398

self.setup_common()

399

400

def setup_restored(self):

401

restored_feeds.append(self)

402

self._actualFeed = None

403

self.informOnError = False

404

self.setup_common()

405

406

def setup_common(self):

407

self.create_signal('update-finished')

408

self.download = None

409

self.wasUpdating = False

410

self.inlineSearchTerm = None

411

self.calc_item_list()

412

413

def _get_actual_feed(self):

414

# first try to load from actualFeed from the DB

415

if self._actualFeed is None:

416

for klass in (FeedImpl, RSSFeedImpl, SavedSearchFeedImpl,

417

ScraperFeedImpl, SearchFeedImpl, DirectoryFeedImpl,

418

DirectoryWatchFeedImpl, SearchDownloadsFeedImpl,

419

ManualFeedImpl, SingleFeedImpl):

420

try:

421

self._actualFeed = klass.get_by_id(self.feed_impl_id)

422

self._actualFeed.ufeed = self

423

break

424

except ObjectNotFoundError:

425

pass

426

# otherwise, make a new FeedImpl

427

if self._actualFeed is None:

428

self._set_feed_impl(FeedImpl(self.origURL, self))

429

self.signal_change()

430

return self._actualFeed

431

432

actualFeed = property(_get_actual_feed)

433

434

@classmethod

435

def get_by_url(cls, url):

436

return cls.make_view('origURL=?', (url,)).get_singleton()

437

438

@classmethod

439

def get_by_url_and_search(cls, url, searchTerm):

440

if searchTerm is not None:

441

view = cls.make_view('origURL=? AND searchTerm=?',

442

(url, searchTerm))

443

else:

444

view = cls.make_view('origURL=? AND searchTerm IS NULL', (url,))

445

return view.get_singleton()

446

447

@classmethod

448

def get_manual_feed(cls):

449

return cls.get_by_url('dtv:manualFeed')

450

451

@classmethod

452

def get_directory_feed(cls):

453

return cls.get_by_url('dtv:directoryfeed')

454

455

@classmethod

456

def get_search_feed(cls):

457

return cls.get_by_url('dtv:search')

458

459

@classmethod

460

def get_search_downloads_feed(cls):

461

return cls.get_by_url('dtv:searchDownloads')

462

463

@classmethod

464

def folder_view(cls, id):

465

return cls.make_view('folder_id=?', (id,))

466

467

@classmethod

468

def visible_video_view(cls):

469

return cls.make_view("visible AND section='video'")

470

471

@classmethod

472

def watched_folder_view(cls):

473

return cls.make_view("origURL LIKE 'dtv:directoryfeed:%'")

474

475

@classmethod

476

def visible_audio_view(cls):

477

return cls.make_view("visible AND section='audio'")

478

479

def on_db_insert(self):

480

self.generate_feed(True)

481

482

def in_folder(self):

483

return self.folder_id is not None

484

485

def _set_feed_impl(self, feed_impl):

486

if self._actualFeed is not None:

487

self._actualFeed.remove()

488

self._actualFeed = feed_impl

489

self.feed_impl_id = feed_impl.id

490

491

def signal_change(self, needs_save=True, needs_signal_folder=False):

492

if needs_signal_folder:

493

folder = self.get_folder()

494

if folder:

495

folder.signal_change(needs_save=False)

496

DDBObject.signal_change (self, needs_save=needs_save)

497

498

def on_signal_change(self):

499

is_updating = bool(self.actualFeed.updating)

500

if self.wasUpdating and not is_updating:

501

self.emit('update-finished')

502

self.wasUpdating = is_updating

503

504

def calc_item_list(self):

505

self.items = models.Item.feed_view(self.id)

506

self.visible_items = models.Item.visible_feed_view(self.id)

507

self.downloaded_items = models.Item.feed_downloaded_view(self.id)

508

self.downloading_items = models.Item.feed_downloading_view(self.id)

509

self.available_items = models.Item.feed_available_view(self.id)

510

self.auto_pending_items = models.Item.feed_auto_pending_view(self.id)

511

self.unwatched_items = models.Item.feed_unwatched_view(self.id)

512

513

def update_after_restore(self):

514

if self.actualFeed.__class__ == FeedImpl:

515

# Our initial FeedImpl was never updated, call

516

# generate_feed again

517

self.loading = True

518

eventloop.add_idle(lambda: self.generate_feed(True), "generate_feed")

519

else:

520

self.schedule_update_events(INITIAL_FEED_UPDATE_DELAY)

521

522

def clean_old_items(self):

523

if self.actualFeed:

524

return self.actualFeed.clean_old_items()

525

526

def invalidate_counts(self):

527

for cached_count_attr in ('_num_available', '_num_unwatched',

528

'_num_downloaded', '_num_downloading'):

529

if cached_count_attr in self.__dict__:

530

del self.__dict__[cached_count_attr]

531

532

def recalc_counts(self):

533

self.invalidate_counts()

534

self.signal_change(needs_save=False)

535

if self.in_folder():

536

self.get_folder().signal_change(needs_save=False)

537

538

def num_downloaded(self):

539

"""Returns the number of downloaded items in the feed.

540

"""

541

try:

542

return self._num_downloaded

543

except AttributeError:

544

self._num_downloaded = self.downloaded_items.count()

545

return self._num_downloaded

546

547

def num_downloading(self):

548

"""Returns the number of downloading items in the feed.

549

"""

550

try:

551

return self._num_downloading

552

except AttributeError:

553

self._num_downloading = self.downloading_items.count()

554

return self._num_downloading

555

556

def num_unwatched(self):

557

"""Returns string with number of unwatched videos in feed

558

"""

559

try:

560

return self._num_unwatched

561

except AttributeError:

562

self._num_unwatched = self.unwatched_items.count()

563

return self._num_unwatched

564

565

def num_available(self):

566

"""Returns string with number of available videos in feed

567

"""

568

try:

569

return self._num_available

570

except AttributeError:

571

self._num_available = (self.available_items.count() -

572

self.auto_pending_items.count())

573

return self._num_available

574

575

def get_viewed(self):

576

"""Returns true iff this feed has been looked at

577

"""

578

return self.last_viewed != datetime.min

579

580

def mark_as_viewed(self):

581

"""Sets the last time the feed was viewed to now

582

"""

583

self.last_viewed = datetime.now()

584

try:

585

del self._num_available

586

except AttributeError:

587

pass

588

if self.in_folder():

589

self.get_folder().signal_change()

590

self.signal_change()

591

592

def start_manual_download(self):

593

next_ = None

594

for item in self.items:

595

if item.is_pending_manual_download():

596

if next_ is None:

597

next_ = item

598

elif item.get_pub_date_parsed() > next_.get_pub_date_parsed():

599

next_ = item

600

if next_ is not None:

601

next_.download(autodl=False)

602

603

def start_auto_download(self):

604

next = None

605

for item in self.items:

606

if item.is_eligible_for_auto_download():

607

if next is None:

608

next = item

609

elif item.get_pub_date_parsed() > next.get_pub_date_parsed():

610

next = item

611

if next is not None:

612

next.download(autodl = True)

613

614

def expiring_items(self):

615

# items in watched folders never expire

616

if self.is_watched_folder():

617

return []

618

if self.expire == u'never':

619

return []

620

elif self.expire == u'system':

621

expire_after_x_days = config.get(prefs.EXPIRE_AFTER_X_DAYS)

622

if expire_after_x_days == -1:

623

return []

624

delta = timedelta(days=expire_after_x_days)

625

else:

626

delta = self.expireTime

627

return models.Item.feed_expiring_view(self.id, datetime.now() - delta)

628

629

def expire_items(self):

630

"""Expires items from the feed that are ready to expire.

631

"""

632

for item in self.expiring_items():

633

item.expire()

634

635

def signal_items(self):

636

for item in self.items:

637

item.signal_change(needs_save=False)

638

639

def icon_changed(self):

640

"""See item.get_thumbnail to figure out which items to send

641

signals for.

642

"""

643

self.signal_change(needs_save=False)

644

for item in self.items:

645

if not (item.icon_cache.isValid() or

646

item.screenshot or

647

item.isContainerItem):

648

item.signal_change(needs_save=False)

649

650

def get_id(self):

651

return DDBObject.get_id(self)

652

653

@returns_unicode

654

def get_search_term(self):

655

self.confirm_db_thread()

656

return self.searchTerm

657

658

def is_updating(self):

659

return self.loading or (self.actualFeed and self.actualFeed.updating)

660

661

@returns_unicode

662

def get_title(self):

663

if self.userTitle is not None:

664

return self.userTitle

665

666

title = self.actualFeed.get_title()

667

if self.searchTerm is not None:

668

title = u"%s for '%s'" % (title, self.searchTerm)

669

return title

670

671

def has_original_title(self):

672

return self.userTitle == None

673

674

def set_title(self, title):

675

self.confirm_db_thread()

676

self.userTitle = title

677

self.signal_change()

678

679

def revert_title(self):

680

self.set_title(None)

681

682

def set_visible(self, visible):

683

if self.visible == visible:

684

return

685

self.visible = visible

686

self.signal_change()

687

688

@returns_unicode

689

def get_autodownload_mode(self):

690

self.confirm_db_thread()

691

if self.autoDownloadable:

692

if self.getEverything:

693

return u'all'

694

else:

695

return u'new'

696

else:

697

return u'off'

698

699

def set_auto_download_mode(self, mode):

700

# note that this is somewhat duplicated in setup_new

701

if mode == u'all':

702

self.getEverything = True

703

self.autoDownloadable = True

704

elif mode == u'new':

705

self.getEverything = False

706

self.autoDownloadable = True

707

elif mode == u'off':

708

self.autoDownloadable = False

709

else:

710

raise ValueError("Bad auto-download mode: %s" % mode)

711

self.signal_change()

712

self.signal_items()

713

714

def set_expiration(self, type_, time_):

715

"""Sets the expiration attributes. Valid types are u'system',

716

u'feed' and u'never'.

717

718

Expiration time is in hour(s).

719

"""

720

self.confirm_db_thread()

721

self.expire = type_

722

self.expireTime = timedelta(hours=time_)

723

724

if self.expire == u"never":

725

for item in self.items:

726

if item.is_downloaded():

727

item.save()

728

729

self.signal_change()

730

self.signal_items()

731

732

def set_max_new(self, max_new):

733

"""Sets the maxNew attributes. -1 means unlimited.

734

"""

735

self.confirm_db_thread()

736

oldMaxNew = self.maxNew

737

self.maxNew = max_new

738

self.signal_change()

739

if self.maxNew >= oldMaxNew or self.maxNew < 0:

740

autodler.AUTO_DOWNLOADER.start_downloads()

741

742

def set_max_old_items(self, maxOldItems):

743

self.confirm_db_thread()

744

oldMaxOldItems = self.maxOldItems

745

if maxOldItems == -1:

746

maxOldItems = None

747

self.maxOldItems = maxOldItems

748

self.signal_change()

749

if (maxOldItems is not None and

750

(oldMaxOldItems is None or oldMaxOldItems > maxOldItems)):

751

# the actual feed updating code takes care of expiring the old

752

# items

753

self.actualFeed.clean_old_items()

754

755

def update(self):

756

self.confirm_db_thread()

757

if not self.id_exists():

758

return

759

if self.loading:

760

return

761

elif self.errorState:

762

self.loading = True

763

self.errorState = False

764

self.signal_change()

765

return self.generate_feed()

766

self.actualFeed.update()

767

768

def get_folder(self):

769

self.confirm_db_thread()

770

if self.in_folder():

771

return models.ChannelFolder.get_by_id(self.folder_id)

772

else:

773

return None

774

775

def set_folder(self, new_folder, update_trackers=True):

776

self.confirm_db_thread()

777

old_folder = self.get_folder()

778

if new_folder is old_folder:

779

return

780

if new_folder is not None:

781

self.folder_id = new_folder.get_id()

782

else:

783

self.folder_id = None

784

self.signal_change()

785

if update_trackers:

786

models.Item.update_folder_trackers()

787

if new_folder:

788

new_folder.signal_change(needs_save=False)

789

if old_folder:

790

old_folder.signal_change(needs_save=False)

791

792

@staticmethod

793

def bulk_set_folders(folder_assignments):

794

"""Set the folders for multiple feeds at once.

795

796

This method is optimized to be a bit faster than calling

797

set_folder() for each individual folder.

798

"""

799

for child, folder in folder_assignments:

800

child.set_folder(folder, update_trackers=False)

801

models.Item.update_folder_trackers()

802

803

def generate_feed(self, removeOnError=False):

804

newFeed = None

805

if self.origURL == u"dtv:directoryfeed":

806

newFeed = DirectoryFeedImpl(self)

807

self.visible = False

808

elif (self.origURL.startswith(u"dtv:directoryfeed:")):

809

url = self.origURL[len(u"dtv:directoryfeed:"):]

810

dir_ = unmake_url_safe(url)

811

newFeed = DirectoryWatchFeedImpl(self, dir_)

812

elif self.origURL == u"dtv:search":

813

newFeed = SearchFeedImpl(self)

814

self.visible = False

815

elif self.origURL == u"dtv:searchDownloads":

816

newFeed = SearchDownloadsFeedImpl(self)

817

self.visible = False

818

elif self.origURL == u"dtv:manualFeed":

819

newFeed = ManualFeedImpl(self)

820

self.visible = False

821

elif self.origURL == u"dtv:singleFeed":

822

newFeed = SingleFeedImpl(self)

823

self.visible = False

824

elif SEARCH_URL_MATCH_RE.match(self.origURL):

825

newFeed = SavedSearchFeedImpl(self.origURL, self)

826

else:

827

self.download = grab_url(self.origURL,

828

lambda info: self._generate_feed_callback(info, removeOnError),

829

lambda error: self._generate_feed_errback(error, removeOnError),

830

default_mime_type=u'application/rss+xml')

831

logging.debug ("added async callback to create feed %s", self.origURL)

832

if newFeed:

833

self.finish_generate_feed(newFeed)

834

835

def is_watched_folder(self):

836

return self.origURL.startswith("dtv:directoryfeed:")

837

838

def _handle_feed_loading_error(self, errorDescription):

839

self.download = None

840

self.errorState = True

841

self.loading = False

842

self.signal_change()

843

if self.informOnError:

844

title = _('Error loading feed')

845

description = _(

846

"Couldn't load the feed at %(url)s (%(errordescription)s)."

847

) % { "url": self.url, "errordescription": errorDescription }

848

description += "\n\n"

849

description += _("Would you like to keep the feed?")

850

d = dialogs.ChoiceDialog(title, description, dialogs.BUTTON_KEEP,

851

dialogs.BUTTON_DELETE)

852

def callback(dialog):

853

if dialog.choice == dialogs.BUTTON_DELETE and self.id_exists():

854

self.remove()

855

d.run(callback)

856

self.informOnError = False

857

delay = config.get(prefs.CHECK_CHANNELS_EVERY_X_MN)

858

eventloop.add_timeout(delay, self.update, "update failed feed")

859

860

def _generate_feed_errback(self, error, removeOnError):

861

if not self.id_exists():

862

return

863

logging.info("Warning couldn't load feed at %s (%s)",

864

self.origURL, error)

865

self._handle_feed_loading_error(error.getFriendlyDescription())

866

867

def _generate_feed_callback(self, info, removeOnError):

868

"""This is called by grab_url to generate a feed based on

869

the type of data found at the given URL

870

"""

871

# FIXME: This probably should be split up a bit. The logic is

872

# a bit daunting

873

874

# Note that all of the raw XML and HTML in this function is in

875

# byte string format

876

877

if not self.id_exists():

878

return

879

if info['updated-url'] != self.origURL and \

880

not self.origURL.startswith('dtv:'): # we got redirected

881

f = lookup_feed(info['updated-url'], self.searchTerm)

882

if f is not None: # already have this feed, so delete us

883

self.remove()

884

return

885

self.download = None

886

modified = unicodify(info.get('last-modified'))

887

etag = unicodify(info.get('etag'))

888

contentType = unicodify(info.get('content-type', u'text/html'))

889

890

# Some smarty pants serve RSS feeds with a text/html content-type...

891

# So let's do some really simple sniffing first.

892

apparentlyRSS = filetypes.is_maybe_rss(info['body'])

893

old_title = self.actualFeed.title

894

895

# Definitely an HTML feed

896

if (((contentType.startswith(u'text/html') or

897

contentType.startswith(u'application/xhtml+xml'))

898

and not apparentlyRSS)):

899

#print "Scraping HTML"

900

html = info['body']

901

if info.has_key('charset'):

902

html = fix_html_header(html, info['charset'])

903

charset = unicodify(info['charset'])

904

else:

905

charset = None

906

self.ask_for_scrape(info, html, charset)

907

#It's some sort of feed we don't know how to scrape

908

elif (contentType.startswith(u'application/rdf+xml')

909

or contentType.startswith(u'application/atom+xml')):

910

#print "ATOM or RDF"

911

html = info['body']

912

if info.has_key('charset'):

913

xmldata = fix_xml_header(html, info['charset'])

914

else:

915

xmldata = html

916

self.finish_generate_feed(RSSFeedImpl(unicodify(info['updated-url']),

917

initialHTML=xmldata,etag=etag,modified=modified, ufeed=self,

918

title=old_title))

919

# If it's not HTML, we can't be sure what it is.

920

921

# If we get generic XML, it's probably RSS, but it still could

922

# be XHTML.

923

924

# application/rss+xml links are definitely feeds. However, they

925

# might be pre-enclosure RSS, so we still have to download them

926

# and parse them before we can deal with them correctly.

927

elif (apparentlyRSS or

928

contentType.startswith(u'application/rss+xml') or

929

contentType.startswith(u'application/podcast+xml') or

930

contentType.startswith(u'text/xml') or

931

contentType.startswith(u'application/xml') or

932

(contentType.startswith(u'text/plain') and

933

(unicodify(info['updated-url']).endswith(u'.xml') or

934

unicodify(info['updated-url']).endswith(u'.rss')))):

935

#print " It's doesn't look like HTML..."

936

html = info["body"]

937

if info.has_key('charset'):

938

xmldata = fix_xml_header(html, info['charset'])

939

html = fix_html_header(html, info['charset'])

940

charset = unicodify(info['charset'])

941

else:

942

xmldata = html

943

charset = None

944

# FIXME html and xmldata can be non-unicode at this point

945

parser = xml.sax.make_parser()

946

parser.setFeature(xml.sax.handler.feature_namespaces, 1)

947

parser.setFeature(xml.sax.handler.feature_external_ges, 0)

948

handler = RSSLinkGrabber(unicodify(info['redirected-url']), charset)

949

parser.setContentHandler(handler)

950

parser.setErrorHandler(handler)

951

try:

952

parser.parse(StringIO(xmldata))

953

except UnicodeDecodeError:

954

logging.exception ("Unicode issue parsing... %s",

955

xmldata[0:300])

956

self.finish_generate_feed(None)

957

if removeOnError:

958

self.remove()

959

except (SystemExit, KeyboardInterrupt):

960

raise

961

except:

962

#it doesn't parse as RSS, so it must be HTML

963

#print " Nevermind! it's HTML"

964

self.ask_for_scrape(info, html, charset)

965

else:

966

#print " It's RSS with enclosures"

967

self.finish_generate_feed(RSSFeedImpl(

968

unicodify(info['updated-url']),

969

initialHTML=xmldata, etag=etag, modified=modified,

970

ufeed=self, title=old_title))

971

else:

972

self._handle_feed_loading_error(_("Bad content-type"))

973

974

def finish_generate_feed(self, feedImpl):

975

self.confirm_db_thread()

976

self.loading = False

977

if feedImpl is not None:

978

self._set_feed_impl(feedImpl)

979

self.errorState = False

980

else:

981

self.errorState = True

982

self.signal_change()

983

984

def ask_for_scrape(self, info, initialHTML, charset):

985

title = _("Channel is not compatible with %(appname)s",

986

{"appname": config.get(prefs.SHORT_APP_NAME)})

987

description = _(

988

"This channel is not compatible with %(appname)s "

989

"but we'll try our best to grab the files. It may take extra time "

990

"to list the videos, and descriptions may look funny.\n"

991

"\n"

992

"Please contact the publishers of %(url)s and ask if they can supply a "

993

"feed in a format that will work with %(appname)s.\n"

994

"\n"

995

"Do you want to try to load this channel anyway?",

996

{"url": info["updated-url"],

997

"appname": config.get(prefs.SHORT_APP_NAME)}

998

)

999

dialog = dialogs.ChoiceDialog(title, description, dialogs.BUTTON_YES,

1000

dialogs.BUTTON_NO)

1001

1002

def callback(dialog):

1003

if not self.id_exists():

1004

return

1005

if dialog.choice == dialogs.BUTTON_YES:

1006

uinfo = unicodify(info)

1007

impl = ScraperFeedImpl(uinfo['updated-url'],

1008

initialHTML=initialHTML, etag=uinfo.get('etag'),

1009

modified=uinfo.get('modified'), charset=charset,

1010

ufeed=self)

1011

self.finish_generate_feed(impl)

1012

else:

1013

self.remove()

1014

dialog.run(callback)

1015

1016

def get_actual_feed(self):

1017

return self.actualFeed

1018

1019

# Many attributes come from whatever FeedImpl subclass we're using.

1020

def attr_from_feed_impl(name):

1021

def getter(self):

1022

return getattr(self.actualFeed, name)

1023

return property(getter)

1024

1025

for name in ( 'set_update_frequency', 'schedule_update_events',

1026

'cancel_update_events',

1027

'get_url', 'get_base_url',

1028

'get_base_href', 'get_link',

1029

'get_thumbnail_url', 'get_license', 'url', 'title', 'created',

1030

'thumbURL', 'dir', 'preserve_downloads', 'lookup', 'reset',

1031

'engine', 'query',

1032

1033

locals()[name] = attr_from_feed_impl(name)

1034

1035

@returns_unicode

1036

def get_expiration_type(self):

1037

"""Returns "feed," "system," or "never"

1038

"""

1039

self.confirm_db_thread()

1040

return self.expire

1041

1042

1043

def get_max_new(self):

1044

"""Returns "unlimited" or the maximum number of items this

1045

feed wants

1046

"""

1047

self.confirm_db_thread()

1048

if self.maxNew < 0:

1049

return u"unlimited"

1050

else:

1051

return self.maxNew

1052

1053

def get_max_old_items(self):

1054

"""Returns the number of items to remember past the current

1055

contents of the feed. If self.maxOldItems is None, then this

1056

returns "system" indicating that the caller should look up the

1057

default in prefs.MAX_OLD_ITEMS_DEFAULT.

1058

"""

1059

self.confirm_db_thread()

1060

if self.maxOldItems is None:

1061

return u"system"

1062

1063

return self.maxOldItems

1064

1065

def get_expiration_time(self):

1066

"""Returns the total absolute expiration time in hours.

1067

WARNING: 'system' and 'never' expiration types return 0

1068

"""

1069

self.confirm_db_thread()

1070

expireAfterSetting = config.get(prefs.EXPIRE_AFTER_X_DAYS)

1071

if ((self.expireTime is None or self.expire == 'never'

1072

or (self.expire == 'system' and expireAfterSetting <= 0))):

1073

return 0

1074

else:

1075

return (self.expireTime.days * 24 +

1076

self.expireTime.seconds / 3600)

1077

1078

def is_autodownloadable(self):

1079

"""Returns true iff item is autodownloadable

1080

"""

1081

self.confirm_db_thread()

1082

return self.autoDownloadable

1083

1084

def remove(self, move_items_to=None):

1085

"""Remove the feed.

1086

1087

If move_items_to is None (the default), the items in this feed

1088

will be removed too. If move_items_to is given, the items in

1089

this feed will be moved to that feed.

1090

"""

1091

self.confirm_db_thread()

1092

1093

if isinstance(self.actualFeed, DirectoryWatchFeedImpl):

1094

move_items_to = None

1095

self.cancel_update_events()

1096

if self.download is not None:

1097

self.download.cancel()

1098

self.download = None

1099

to_remove = []

1100

for item in self.items:

1101

if move_items_to is not None and item.is_downloaded():

1102

item.set_feed(move_items_to.get_id())

1103

else:

1104

to_remove.append(item)

1105

app.bulk_sql_manager.start()

1106

try:

1107

for item in to_remove:

1108

item.remove()

1109

finally:

1110

app.bulk_sql_manager.finish()

1111

self.remove_icon_cache()

1112

DDBObject.remove(self)

1113

self.actualFeed.remove()

1114

1115

def thumbnail_valid(self):

1116

return self.icon_cache and self.icon_cache.isValid()

1117

1118

def calc_tablist_thumbnail(self):

1119

if self.thumbnail_valid():

1120

return fileutil.expand_filename(self.icon_cache.get_filename())

1121

else:

1122

return default_tablist_feed_icon_path()

1123

1124

@returns_filename

1125

def get_thumbnail_path(self):

1126

self.confirm_db_thread()

1127

if self.thumbnail_valid():

1128

return fileutil.expand_filename(self.icon_cache.get_filename())

1129

else:

1130

return self.actualFeed.default_thumbnail_path()

1131

1132

def has_downloaded_items(self):

1133

return self.num_downloaded() > 0

1134

1135

def has_downloading_items(self):

1136

return self.num_downloading() > 0

1137

1138

def __str__(self):

1139

return "Feed - %s" % stringify(self.get_title())

1140

1141

class ThrottledUpdateFeedImpl(FeedImpl):

1142

"""Feed Impl that uses the feedupdate module to schedule it's

1143

updates. Only a limited number of ThrottledUpdateFeedImpl objects

1144

will be updating at any given time.

1145

"""

1146

1147

def schedule_update_events(self, firstTriggerDelay):

1148

feedupdate.cancel_update(self.ufeed)

1149

if firstTriggerDelay >= 0:

1150

feedupdate.schedule_update(firstTriggerDelay, self.ufeed,

1151

self.update)

1152

else:

1153

if self.updateFreq > 0:

1154

feedupdate.schedule_update(self.updateFreq, self.ufeed,

1155

self.update)

1156

1157

class RSSFeedImplBase(ThrottledUpdateFeedImpl):

1158

"""

1159

Base class from which RSSFeedImpl and SavedSearchFeedImpl derive.

1160

"""

1161

def setup_new(self, url, ufeed, title):

1162

FeedImpl.setup_new(self, url, ufeed, title)

1163

self.schedule_update_events(0)

1164

1165

def _handle_new_entry(self, entry, fp_values, channel_title):

1166

"""Handle getting a new entry from a feed."""

1167

enclosure = fp_values.first_video_enclosure

1168

if ((self.url.startswith('file://') and enclosure

1169

and enclosure['url'].startswith('file://'))):

1170

path = download_utils.get_file_url_path(enclosure['url'])

1171

item = models.FileItem(path, fp_values=fp_values,

1172

feed_id=self.ufeed.id, channel_title=channel_title)

1173

else:

1174

item = models.Item(fp_values, feed_id=self.ufeed.id,

1175

eligibleForAutoDownload=not self.initialUpdate,

1176

channel_title=channel_title)

1177

if not item.matches_search(self.ufeed.searchTerm):

1178

item.remove()

1179

1180

def remember_old_items(self):

1181

self.old_items = set(self.items)

1182

1183

def create_items_for_parsed(self, parsed):

1184

"""Update the feed using parsed XML passed in"""

1185

app.bulk_sql_manager.start()

1186

try:

1187

self._create_items_for_parsed(parsed)

1188

finally:

1189

app.bulk_sql_manager.finish()

1190

1191

def _create_items_for_parsed(self, parsed):

1192

# This is a HACK for Yahoo! search which doesn't provide

1193

# enclosures

1194

for entry in parsed['entries']:

1195

if 'enclosures' not in entry:

1196

try:

1197

url = entry['link']

1198

except KeyError:

1199

continue

1200

mimetype = filetypes.guess_mime_type(url)

1201

if mimetype is not None:

1202

entry['enclosures'] = [{'url': to_uni(url),

1203

'type': to_uni(mimetype)}]

1204

elif flashscraper.is_maybe_flashscrapable(url):

1205

entry['enclosures'] = [{'url': to_uni(url),

1206

'type': to_uni("video/flv")}]

1207

else:

1208

logging.info('unknown url type %s, not generating enclosure' % url)

1209

1210

channelTitle = None

1211

try:

1212

channelTitle = parsed["feed"]["title"]

1213

except KeyError:

1214

try:

1215

channelTitle = parsed["channel"]["title"]

1216

except KeyError:

1217

pass

1218

1219

if channelTitle != None and self._allow_feed_to_override_title():

1220

self.title = channelTitle

1221

if (parsed.feed.has_key('image') and

1222

parsed.feed.image.has_key('url') and

1223

self._allow_feed_to_override_thumbnail()):

1224

self.thumbURL = parsed.feed.image.url

1225

self.ufeed.icon_cache.request_update(is_vital=True)

1226

1227

items_byid = {}

1228

items_byURLTitle = {}

1229

items_nokey = []

1230

for item in self.items:

1231

try:

1232

items_byid[item.get_rss_id()] = item

1233

except KeyError:

1234

items_nokey.append(item)

1235

by_url_title_key = (item.url, item.entry_title)

1236

if by_url_title_key != (None, None):

1237

items_byURLTitle[by_url_title_key] = item

1238

for entry in parsed.entries:

1239

entry = self.add_scraped_thumbnail(entry)

1240

fp_values = FeedParserValues(entry)

1241

new = True

1242

if fp_values.data['rss_id'] is not None:

1243

id_ = fp_values.data['rss_id']

1244

if items_byid.has_key(id_):

1245

item = items_byid[id_]

1246

if not fp_values.compare_to_item(item):

1247

item.update_from_feed_parser_values(fp_values)

1248

new = False

1249

self.old_items.discard(item)

1250

if new:

1251

by_url_title_key = (fp_values.data['url'],

1252

fp_values.data['entry_title'])

1253

if by_url_title_key != (None, None):

1254

if items_byURLTitle.has_key(by_url_title_key):

1255

item = items_byURLTitle[by_url_title_key]

1256

if not fp_values.compare_to_item(item):

1257

item.update_from_feed_parser_values(fp_values)

1258

new = False

1259

self.old_items.discard(item)

1260

if new:

1261

for item in items_nokey:

1262

if fp_values.compare_to_item(item):

1263

new = False

1264

else:

1265

try:

1266

if fp_values.compare_to_item_enclosures(item):

1267

item.update_from_feed_parser_values(fp_values)

1268

new = False

1269

self.old_items.discard(item)

1270

except (SystemExit, KeyboardInterrupt):

1271

raise

1272

except:

1273

pass

1274

if new and fp_values.first_video_enclosure is not None:

1275

self._handle_new_entry(entry, fp_values, channelTitle)

1276

1277

def _allow_feed_to_override_title(self):

1278

"""Should the RSS feed override the default title?

1279

1280

Subclasses can override this method to change our behavior when

1281

parsing feed entries.

1282

"""

1283

return True

1284

1285

def _allow_feed_to_override_thumbnail(self):

1286

"""Should the RSS thumbnail override the default thumbnail?

1287

1288

Subclasses can override this method to change our behavior when

1289

parsing feed entries.

1290

"""

1291

return True

1292

1293

def update_finished(self):

1294

"""

1295

Called by subclasses to finish the update.

1296

"""

1297

if self.initialUpdate:

1298

self.initialUpdate = False

1299

startfrom = None

1300

itemToUpdate = None

1301

for latest in models.Item.latest_in_feed_view(self.ufeed_id):

1302

latest.eligibleForAutoDownload = True

1303

latest.signal_change()

1304

if self.ufeed.is_autodownloadable():

1305

self.ufeed.mark_as_viewed()

1306

self.ufeed.signal_change()

1307

1308

self.ufeed.recalc_counts()

1309

if hasattr(self, "old_items"):

1310

self.truncate_old_items()

1311

del self.old_items

1312

self.signal_change()

1313

1314

def truncate_old_items(self):

1315

"""Truncate items so that the number of items in this feed doesn't

1316

exceed self.get_max_old_items()

1317

1318

Items are only truncated if they don't exist in the feed anymore, and

1319

if the user hasn't downloaded them.

1320

"""

1321

limit = self.ufeed.get_max_old_items()

1322

if limit == u"system":

1323

limit = config.get(prefs.MAX_OLD_ITEMS_DEFAULT)

1324

1325

item_count = self.items.count()

1326

if item_count > config.get(prefs.TRUNCATE_CHANNEL_AFTER_X_ITEMS):

1327

truncate = item_count - config.get(prefs.TRUNCATE_CHANNEL_AFTER_X_ITEMS)

1328

if truncate > len(self.old_items):

1329

truncate = 0

1330

limit = min(limit, truncate)

1331

extra = len(self.old_items) - limit

1332

if extra <= 0:

1333

return

1334

1335

candidates = []

1336

for item in self.old_items:

1337

if item.downloader is None:

1338

candidates.append((item.creationTime, item))

1339

candidates.sort()

1340

for time, item in candidates[:extra]:

1341

item.remove()

1342

1343

def add_scraped_thumbnail(self, entry):

1344

# skip this if the entry already has a thumbnail.

1345

if entry.has_key('thumbnail'):

1346

return entry

1347

if entry.has_key('enclosures'):

1348

for enc in entry['enclosures']:

1349

if enc.has_key('thumbnail'):

1350

return entry

1351

return entry

1352

1353

class RSSFeedImpl(RSSFeedImplBase):

1354

1355

def setup_new(self, url, ufeed, title=None, initialHTML=None, etag=None,

1356

modified=None):

1357

RSSFeedImplBase.setup_new(self, url, ufeed, title)

1358

self.initialHTML = initialHTML

1359

self.etag = etag

1360

self.modified = modified

1361

self.download = None

1362

1363

@returns_unicode

1364

def get_base_href(self):

1365

try:

1366

return escape(self.parsed.link)

1367

except (SystemExit, KeyboardInterrupt):

1368

raise

1369

except:

1370

return FeedImpl.get_base_href(self)

1371

1372

@returns_unicode

1373

def get_link(self):

1374

"""Returns a link to a webpage associated with the feed

1375

"""

1376

self.ufeed.confirm_db_thread()

1377

try:

1378

return self.parsed.link

1379

except (SystemExit, KeyboardInterrupt):

1380

raise

1381

except:

1382

return u""

1383

1384

def feedparser_finished(self):

1385

self.updating = False

1386

self.schedule_update_events(-1)

1387

self.update_finished()

1388

1389

def feedparser_errback(self, e):

1390

if not self.ufeed.id_exists():

1391

return

1392

logging.info("Error updating feed: %s: %s", self.url, e)

1393

self.feedparser_finished()

1394

1395

def feedparser_callback(self, parsed):

1396

self.ufeed.confirm_db_thread()

1397

if not self.ufeed.id_exists():

1398

return

1399

if len(parsed.entries) == len(parsed.feed) == 0:

1400

logging.warn("Empty feed, not updating: %s", self.url)

1401

self.feedparser_finished()

1402

return

1403

start = clock()

1404

parsed = self.parsed = unicodify(parsed)

1405

self.remember_old_items()

1406

self.create_items_for_parsed(parsed)

1407

1408

try:

1409

updateFreq = self.parsed["feed"]["ttl"]

1410

except KeyError:

1411

updateFreq = 0

1412

self.set_update_frequency(updateFreq)

1413

1414

self.feedparser_finished()

1415

end = clock()

1416

if end - start > 1.0:

1417

logging.timing("feed update for: %s too slow (%.3f secs)",

1418

self.url, end - start)

1419

1420

def call_feedparser(self, html):

1421

self.ufeed.confirm_db_thread()

1422

eventloop.call_in_thread(self.feedparser_callback,

1423

self.feedparser_errback,

1424

feedparser.parse,

1425

"Feedparser callback - %s" % self.url, html)

1426

1427

def update(self):

1428

"""Updates a feed

1429

"""

1430

self.ufeed.confirm_db_thread()

1431

if not self.ufeed.id_exists():

1432

return

1433

if self.updating:

1434

return

1435

else:

1436

self.updating = True

1437

self.ufeed.signal_change(needs_save=False)

1438

if hasattr(self, 'initialHTML') and self.initialHTML is not None:

1439

html = self.initialHTML

1440

self.initialHTML = None

1441

self.call_feedparser(html)

1442

else:

1443

try:

1444

etag = self.etag

1445

except AttributeError:

1446

etag = None

1447

try:

1448

modified = self.modified

1449

except AttributeError:

1450

modified = None

1451

logging.info("updating %s", self.url)

1452

self.download = grab_url(self.url, self._update_callback,

1453

self._update_errback, etag=etag, modified=modified,

1454

default_mime_type=u'application/rss+xml')

1455

1456

def _update_errback(self, error):

1457

if not self.ufeed.id_exists():

1458

return

1459

logging.warn("WARNING: error in Feed.update for %s -- %s",

1460

self.ufeed, stringify(error))

1461

self.schedule_update_events(-1)

1462

self.updating = False

1463

self.ufeed.signal_change(needs_save=False)

1464

1465

def _update_callback(self, info):

1466

if not self.ufeed.id_exists():

1467

return

1468

if info.get('status') == 304:

1469

self.schedule_update_events(-1)

1470

self.updating = False

1471

self.ufeed.signal_change()

1472

return

1473

html = info['body']

1474

if info.has_key('charset'):

1475

html = fix_xml_header(html, info['charset'])

1476

1477

# FIXME HTML can be non-unicode here --NN

1478

self.url = unicodify(info['updated-url'])

1479

if info.has_key('etag'):

1480

self.etag = unicodify(info['etag'])

1481

else:

1482

self.etag = None

1483

if info.has_key('last-modified'):

1484

self.modified = unicodify(info['last-modified'])

1485

else:

1486

self.modified = None

1487

self.call_feedparser (html)

1488

1489

@returns_unicode

1490

def get_license(self):

1491

"""Returns the URL of the license associated with the feed

1492

"""

1493

try:

1494

return self.parsed["feed"]["license"]

1495

except (AttributeError, KeyError):

1496

pass

1497

return u""

1498

1499

def on_remove(self):

1500

if self.download is not None:

1501

self.download.cancel()

1502

self.download = None

1503

1504

def setup_restored(self):

1505

"""Called by pickle during deserialization

1506

"""

1507

FeedImpl.setup_restored(self)

1508

self.download = None

1509

1510

def clean_old_items(self):

1511

self.modified = None

1512

self.etag = None

1513

self.update()

1514

1515

class RSSMultiFeedBase(RSSFeedImplBase):

1516

def setup_new(self, url, ufeed, title):

1517

RSSFeedImplBase.setup_new(self, url, ufeed, title)

1518

self.etag = {}

1519

self.modified = {}

1520

self.download_dc = {}

1521

self.updating = 0

1522

self.urls = self.calc_urls()

1523

1524

def setup_restored(self):

1525

"""Called by pickle during deserialization

1526

"""

1527

RSSFeedImplBase.setup_restored(self)

1528

self.download_dc = {}

1529

self.updating = 0

1530

self.urls = self.calc_urls()

1531

1532

def calc_urls(self):

1533

"""Calculate the list of URLs to parse.

1534

1535

Subclasses must define this method.

1536

"""

1537

raise NotImplementedError()

1538

1539

def check_update_finished(self):

1540

if self.updating == 0:

1541

self.update_finished()

1542

self.schedule_update_events(-1)

1543

1544

def _allow_feed_to_override_title(self):

1545

return False

1546

1547

def feedparser_finished(self, url, needs_save=False):

1548

if not self.ufeed.id_exists():

1549

return

1550

self.updating -= 1

1551

self.check_update_finished()

1552

del self.download_dc[url]

1553

1554

def feedparser_errback(self, e, url):

1555

if not self.ufeed.id_exists() or url not in self.download_dc:

1556

return

1557

if e:

1558

logging.info("Error updating feed: %s (%s): %s", self.url, url, e)

1559

else:

1560

logging.info("Error updating feed: %s (%s)", self.url, url)

1561

self.feedparser_finished(url, True)

1562

1563

def feedparser_callback(self, parsed, url):

1564

self.ufeed.confirm_db_thread()

1565

if not self.ufeed.id_exists() or url not in self.download_dc:

1566

return

1567

start = clock()

1568

parsed = unicodify(parsed)

1569

self.create_items_for_parsed(parsed)

1570

self.feedparser_finished(url)

1571

end = clock()

1572

if end - start > 1.0:

1573

logging.timing("feed update for: %s too slow (%.3f secs)",

1574

self.url, end - start)

1575

1576

def call_feedparser(self, html, url):

1577

self.ufeed.confirm_db_thread()

1578

in_thread = False

1579

if in_thread:

1580

try:

1581

parsed = feedparser.parse(html)

1582

self.feedparser_callback(parsed, url)

1583

except (SystemExit, KeyboardInterrupt):

1584

raise

1585

except:

1586

self.feedparser_errback(self, None, url)

1587

raise

1588

else:

1589

eventloop.call_in_thread(

1590

lambda parsed, url=url: self.feedparser_callback(parsed, url),

1591

lambda e, url=url: self.feedparser_errback(e, url),

1592

feedparser.parse, "Feedparser callback - %s" % url, html)

1593

1594

def update(self):

1595

self.ufeed.confirm_db_thread()

1596

if not self.ufeed.id_exists():

1597

return

1598

if self.updating:

1599

return

1600

self.remember_old_items()

1601

for url in self.urls:

1602

etag = self.etag.get(url)

1603

modified = self.modified.get(url)

1604

self.download_dc[url] = grab_url(

1605

url,

1606

lambda x, url=url: self._update_callback(x, url),

1607

lambda x, url=url: self._update_errback(x, url),

1608

etag=etag, modified=modified,

1609

default_mime_type=u'application/rss+xml',)

1610

self.updating += 1

1611

1612

def _update_errback(self, error, url):

1613

if not self.ufeed.id_exists():

1614

return

1615

logging.warn("WARNING: error in Feed.update for %s (%s) -- %s",

1616

self.ufeed, stringify(url), stringify(error))

1617

self.schedule_update_events(-1)

1618

self.updating -= 1

1619

self.check_update_finished()

1620

self.ufeed.signal_change(needs_save=False)

1621

1622

def _update_callback(self, info, url):

1623

if not self.ufeed.id_exists():

1624

return

1625

if info.get('status') == 304:

1626

self.schedule_update_events(-1)

1627

self.updating -= 1

1628

self.check_update_finished()

1629

self.ufeed.signal_change()

1630

return

1631

html = info['body']

1632

if info.has_key('charset'):

1633

html = fix_xml_header(html, info['charset'])

1634

1635

# FIXME HTML can be non-unicode here --NN

1636

if info.get('updated-url') and url in self.urls:

1637

index = self.urls.index(url)

1638

self.urls[index] = unicodify(info['updated-url'])

1639

1640

if info.has_key('etag'):

1641

self.etag[url] = unicodify(info['etag'])

1642

else:

1643

self.etag[url] = None

1644

if info.has_key('last-modified'):

1645

self.modified[url] = unicodify(info['last-modified'])

1646

else:

1647

self.modified[url] = None

1648

self.call_feedparser (html, url)

1649

1650

def on_remove(self):

1651

self._cancel_all_downloads()

1652

1653

def _cancel_all_downloads(self):

1654

for dc in self.download_dc.values():

1655

dc.cancel()

1656

self.download_dc = {}

1657

self.updating = 0

1658

1659

def clean_old_items(self):

1660

self.modified = {}

1661

self.etag = {}

1662

self.update()

1663

1664

class SavedSearchFeedImpl(RSSMultiFeedBase):

1665

def setup_new(self, url, ufeed):

1666

self.parse_url(url)

1667

info = searchengines.get_engine_for_name(self.engine)

1668

title = to_uni(_("%(engine)s for '%(query)s'",

1669

{'engine': info.title, 'query': self.query}))

1670

RSSMultiFeedBase.setup_new(self, url, ufeed, title)

1671

1672

def default_thumbnail_path(self):

1673

info = searchengines.get_engine_for_name(self.engine)

1674

return searchengines.icon_path_for_engine(info)

1675

1676

def setup_restored(self):

1677

self.parse_url(self.url)

1678

RSSMultiFeedBase.setup_restored(self)

1679

1680

def _allow_feed_to_override_thumbnail(self):

1681

return False

1682

1683

def parse_url(self, url):

1684

m = SEARCH_URL_MATCH_RE.match(url)

1685

self.engine = m.group(1)

1686

self.query = m.group(2)

1687

1688

def calc_urls(self):

1689

return searchengines.get_request_urls(self.engine, self.query)

1690

1691

class ScraperFeedImpl(ThrottledUpdateFeedImpl):

1692

"""A feed based on un unformatted HTML or pre-enclosure RSS

1693

"""

1694

def setup_new(self, url, ufeed, title=None, initialHTML=None, etag=None,

1695

modified=None, charset=None):

1696

FeedImpl.setup_new(self, url, ufeed, title)

1697

self.initialHTML = initialHTML

1698

self.initialCharset = charset

1699

self.linkHistory = {}

1700

self.linkHistory[url] = {}

1701

self.tempHistory = {}

1702

if not etag is None:

1703

self.linkHistory[url]['etag'] = unicodify(etag)

1704

if not modified is None:

1705

self.linkHistory[url]['modified'] = unicodify(modified)

1706

self.downloads = set()

1707

1708

self.set_update_frequency(360)

1709

self.schedule_update_events(0)

1710

1711

def save_cache_history(self):

1712

"""This puts all of the caching information in tempHistory into the

1713

linkHistory. This should be called at the end of an updated so that

1714

the next time we update we don't unnecessarily follow old links

1715

"""

1716

self.ufeed.confirm_db_thread()

1717

for url in self.tempHistory.keys():

1718

self.linkHistory[url] = self.tempHistory[url]

1719

self.tempHistory = {}

1720

1721

def get_html(self, urlList, depth=0, linkNumber=0, top=False):

1722

"""Grabs HTML at the given URL, then processes it

1723

"""

1724

url = urlList.pop(0)

1725

#print "Grabbing %s" % url

1726

etag = None

1727

modified = None

1728

if self.linkHistory.has_key(url):

1729

etag = self.linkHistory[url].get('etag', None)

1730

modified = self.linkHistory[url].get('modified', None)

1731

def callback(info):

1732

if not self.ufeed.id_exists():

1733

return

1734

self.downloads.discard(download)

1735

try:

1736

self.process_downloaded_html(info, urlList, depth, linkNumber,

1737

top)

1738

finally:

1739

self.check_done()

1740

def errback(error):

1741

if not self.ufeed.id_exists():

1742

return

1743

self.downloads.discard(download)

1744

logging.info("WARNING unhandled error for ScraperFeedImpl.get_html: %s", error)

1745

self.check_done()

1746

download = grab_url(url, callback, errback, etag=etag,

1747

modified=modified, default_mime_type='text/html')

1748

self.downloads.add(download)

1749

1750

def process_downloaded_html(self, info, urlList, depth, linkNumber,

1751

top=False):

1752

self.ufeed.confirm_db_thread()

1753

#print "Done grabbing %s" % info['updated-url']

1754

1755

if not self.tempHistory.has_key(info['updated-url']):

1756

self.tempHistory[info['updated-url']] = {}

1757

if info.has_key('etag'):

1758

self.tempHistory[info['updated-url']]['etag'] = unicodify(info['etag'])

1759

if info.has_key('last-modified'):

1760

self.tempHistory[info['updated-url']]['modified'] = unicodify(info['last-modified'])

1761

1762

if info['status'] != 304 and info.has_key('body'):

1763

if info.has_key('charset'):

1764

subLinks = self.scrape_links(info['body'], info['redirected-url'], charset=info['charset'], setTitle=top)

1765

else:

1766

subLinks = self.scrape_links(info['body'], info['redirected-url'], setTitle=top)

1767

if top:

1768

self.process_links(subLinks, 0, linkNumber)

1769

else:

1770

self.process_links(subLinks, depth+1, linkNumber)

1771

if len(urlList) > 0:

1772

self.get_html(urlList, depth, linkNumber)

1773

1774

def check_done(self):

1775

if len(self.downloads) == 0:

1776

self.save_cache_history()

1777

self.updating = False

1778

self.ufeed.signal_change()

1779

self.schedule_update_events(-1)

1780

1781

def add_video_item(self, link, dict_, linkNumber):

1782

link = unicodify(link.strip())

1783

if dict_.has_key('title'):

1784

title = dict_['title']

1785

else:

1786

title = link

1787

for item in self.items:

1788

if item.get_url() == link:

1789

return

1790

# Anywhere we call this, we need to convert the input back to unicode

1791

title = feedparser.sanitizeHTML(title, "utf-8").decode('utf-8')

1792

if dict_.has_key('thumbnail') > 0:

1793

fp_dict = FeedParserDict({'title': title,

1794

'enclosures': [FeedParserDict({'url': link,

1795

'thumbnail': FeedParserDict({'url': dict_['thumbnail']})

1796

})]

1797

})

1798

else:

1799

fp_dict = FeedParserDict({'title': title,

1800

'enclosures': [FeedParserDict({'url': link})]

1801

})

1802

i = models.Item(FeedParserValues(fp_dict),

1803

linkNumber=linkNumber, feed_id=self.ufeed.id,

1804

eligibleForAutoDownload=False)

1805

if ((self.ufeed.searchTerm is not None

1806

and not i.matches_search(self.ufeed.searchTerm))):

1807

i.remove()

1808

return

1809

1810

def process_links(self, links, depth=0, linkNumber=0):

1811

# FIXME: compound names for titles at each depth??

1812

maxDepth = 2

1813

urls = links[0]

1814

links = links[1]

1815

# List of URLs that should be downloaded

1816

newURLs = []

1817

1818

if depth < maxDepth:

1819

for link in urls:

1820

if depth == 0:

1821

linkNumber += 1

1822

#print "Processing %s (%d)" % (link,linkNumber)

1823

1824

# FIXME: Using file extensions totally breaks the

1825

# standard and won't work with Broadcast Machine or

1826

# Blog Torrent. However, it's also a hell of a lot

1827

# faster than checking the mime type for every single

1828

# file, so for now, we're being bad boys. Uncomment

1829

# the elif to make this use mime types for HTTP GET URLs

1830

1831

mimetype = filetypes.guess_mime_type(link)

1832

if mimetype is None:

1833

mimetype = 'text/html'

1834

1835

#This is text of some sort: HTML, XML, etc.

1836

if ((mimetype.startswith('text/html') or

1837

mimetype.startswith('application/xhtml+xml') or

1838

mimetype.startswith('text/xml') or

1839

mimetype.startswith('application/xml') or

1840

mimetype.startswith('application/rss+xml') or

1841

mimetype.startswith('application/podcast+xml') or

1842

mimetype.startswith('application/atom+xml') or

1843

mimetype.startswith('application/rdf+xml') ) and

1844

depth < maxDepth -1):

1845

newURLs.append(link)

1846

1847

#This is a video

1848

elif (mimetype.startswith('video/') or

1849

mimetype.startswith('audio/') or

1850

mimetype == "application/ogg" or

1851

mimetype == "application/x-annodex" or

1852

mimetype == "application/x-bittorrent"):

1853

self.add_video_item(link, links[link], linkNumber)

1854

if len(newURLs) > 0:

1855

self.get_html(newURLs, depth, linkNumber)

1856

1857

def on_remove(self):

1858

for download in self.downloads:

1859

download.cancel()

1860

self.downloads = set()

1861

1862

def update(self):

1863

# FIXME: go through and add error handling

1864

self.ufeed.confirm_db_thread()

1865

if not self.ufeed.id_exists():

1866

return

1867

if self.updating:

1868

return

1869

else:

1870

self.updating = True

1871

self.ufeed.signal_change(needs_save=False)

1872

1873

if not self.initialHTML is None:

1874

html = self.initialHTML

1875

self.initialHTML = None

1876

redirURL = self.url

1877

status = 200

1878

charset = self.initialCharset

1879

self.initialCharset = None

1880

subLinks = self.scrape_links(html, redirURL, charset=charset,

1881

setTitle=True)

1882

self.process_links(subLinks, 0, 0)

1883

self.check_done()

1884

else:

1885

self.get_html([self.url], top=True)

1886

1887

def scrape_links(self, html, baseurl, setTitle=False, charset=None):

1888

try:

1889

if not charset is None:

1890

html = fix_html_header(html, charset)

1891

xmldata = html

1892

parser = xml.sax.make_parser()

1893

parser.setFeature(xml.sax.handler.feature_namespaces, 1)

1894

try:

1895

parser.setFeature(xml.sax.handler.feature_external_ges, 0)

1896

except (SystemExit, KeyboardInterrupt):

1897

raise

1898

except:

1899

pass

1900

if charset is not None:

1901

handler = RSSLinkGrabber(baseurl, charset)

1902

else:

1903

handler = RSSLinkGrabber(baseurl)

1904

parser.setContentHandler(handler)

1905

try:

1906

parser.parse(StringIO(xmldata))

1907

except IOError:

1908

pass

1909

except AttributeError:

1910

# bug in the python standard library causes this to be raised

1911

# sometimes. See #3201.

1912

pass

1913

links = handler.links

1914

linkDict = {}

1915

for link in links:

1916

if ((link[0].startswith('http://')

1917

or link[0].startswith('https://'))):

1918

if not linkDict.has_key(to_uni(link[0], charset)):

1919

linkDict[to_uni(link[0], charset)] = {}

1920

if not link[1] is None:

1921

linkDict[to_uni(link[0], charset)]['title'] = to_uni(link[1], charset).strip()

1922

if not link[2] is None:

1923

linkDict[to_uni(link[0], charset)]['thumbnail'] = to_uni(link[2], charset)

1924

if setTitle and not handler.title is None:

1925

self.ufeed.confirm_db_thread()

1926

try:

1927

self.title = to_uni(handler.title, charset)

1928

finally:

1929

self.ufeed.signal_change()

1930

return ([x[0] for x in links if x[0].startswith('http://') or x[0].startswith('https://')], linkDict)

1931

except (xml.sax.SAXException, ValueError, IOError, xml.sax.SAXNotRecognizedException):

1932

(links, linkDict) = self.scrape_html_links(html, baseurl,

1933

setTitle=setTitle,

1934

charset=charset)

1935

return (links, linkDict)

1936

1937

def scrape_html_links(self, html, baseurl, setTitle=False, charset=None):

1938

"""Given a string containing an HTML file, return a dictionary of

1939

links to titles and thumbnails

1940

"""

1941

lg = HTMLLinkGrabber()

1942

links = lg.get_links(html, baseurl)

1943

if setTitle and not lg.title is None:

1944

self.ufeed.confirm_db_thread()

1945

try:

1946

self.title = to_uni(lg.title, charset)

1947

finally:

1948

self.ufeed.signal_change()

1949

1950

linkDict = {}

1951

for link in links:

1952

if link[0].startswith('http://') or link[0].startswith('https://'):

1953

if not linkDict.has_key(to_uni(link[0], charset)):

1954

linkDict[to_uni(link[0], charset)] = {}

1955

if not link[1] is None:

1956

linkDict[to_uni(link[0], charset)]['title'] = to_uni(link[1], charset).strip()

1957

if not link[2] is None:

1958

linkDict[to_uni(link[0], charset)]['thumbnail'] = to_uni(link[2], charset)

1959

return ([x[0] for x in links

1960

if x[0].startswith('http://') or x[0].startswith('https://')],

1961

linkDict)

1962

1963

def setup_restored(self):

1964

"""Called by pickle during deserialization

1965

"""

1966

FeedImpl.setup_restored(self)

1967

self.downloads = set()

1968

self.tempHistory = {}

1969

1970

class DirectoryScannerImplBase(FeedImpl):

1971

"""Base class for FeedImpls that scan directories for items."""

1972

1973

def expire_items(self):

1974

"""Directory Items shouldn't automatically expire

1975

"""

1976

pass

1977

1978

def set_update_frequency(self, frequency):

1979

newFreq = frequency*60

1980

if newFreq != self.updateFreq:

1981

self.updateFreq = newFreq

1982

self.schedule_update_events(-1)

1983

1984

# the following methods much be implemented by subclasses

1985

def _scan_dir(self):

1986

raise NotImplementedError()

1987

1988

# the following methods may be implemented by subclasses if they need to

1989

def _before_update(self):

1990

pass

1991

1992

def _after_update(self):

1993

pass

1994

1995

def _add_known_files(self, known_files):

1996

pass

1997

1998

def _make_child(self, file_):

1999

models.FileItem(file_, feed_id=self.ufeed.id)

2000

2001

def update(self):

2002

self.ufeed.confirm_db_thread()

2003

2004

self._before_update()

2005

2006

# Calculate files known about by feeds other than the directory feed

2007

# Using a select statement is good here because we don't want to

2008

# construct all the Item objects if we don't need to.

2009

known_files = set(os.path.normcase(row[0]) for row in

2010

models.Item.select(['filename'],

2011

'filename IS NOT NULL AND '

2012

'(feed_id is NULL or feed_id != ?)', (self.ufeed_id,)))

2013

self._add_known_files(known_files)

2014

2015

# Remove items with deleted files or that that are in feeds

2016

to_remove = []

2017

for item in self.items:

2018

filename = item.get_filename()

2019

if (filename is None or

2020

not fileutil.isfile(filename) or

2021

os.path.normcase(filename) in known_files):

2022

to_remove.append(item)

2023

app.bulk_sql_manager.start()

2024

try:

2025

for item in to_remove:

2026

item.remove()

2027

finally:

2028

app.bulk_sql_manager.finish()

2029

2030

# now that we've checked for items that need to be removed, we

2031

# add our items to known_files so that they don't get added

2032

# multiple times to this feed.

2033

for x in self.items:

2034

known_files.add(os.path.normcase(x.get_filename()))

2035

2036

# adds any files we don't know about

2037

# files on the filesystem

2038

to_add = []

2039

scan_dir = self._scan_dir()

2040

if fileutil.isdir(scan_dir):

2041

all_files = fileutil.miro_allfiles(scan_dir)

2042

for file_ in all_files:

2043

file_ = os.path.normcase(file_)

2044

ufile = filename_to_unicode(file_)

2045

if (file_ not in known_files and

2046

filetypes.is_media_filename(ufile)):

2047

to_add.append(file_)

2048

2049

app.bulk_sql_manager.start()

2050

try:

2051

for file_ in to_add:

2052

self._make_child(file_)

2053

finally:

2054

app.bulk_sql_manager.finish()

2055

2056

self._after_update()

2057

self.schedule_update_events(-1)

2058

2059

class DirectoryWatchFeedImpl(DirectoryScannerImplBase):

2060

def setup_new(self, ufeed, directory):

2061

# calculate url and title arguments to FeedImpl's constructor

2062

if directory is not None:

2063

url = u"dtv:directoryfeed:%s" % make_url_safe(directory)

2064

else:

2065

url = u"dtv:directoryfeed"

2066

title = directory

2067

if title[-1] == '/':

2068

title = title[:-1]

2069

title = filename_to_unicode(os.path.basename(title)) + "/"

2070

2071

FeedImpl.setup_new(self, url=url, ufeed=ufeed, title=title)

2072

self.dir = directory

2073

self.firstUpdate = True

2074

self.set_update_frequency(5)

2075

self.schedule_update_events(0)

2076

2077

def _scan_dir(self):

2078

return self.dir

2079

2080

def _make_child(self, file_):

2081

models.FileItem(file_, feed_id=self.ufeed.id,

2082

mark_seen=self.firstUpdate)

2083

2084

def _after_update(self):

2085

if self.firstUpdate:

2086

self.firstUpdate = False

2087

self.signal_change()

2088

2089

class DirectoryFeedImpl(DirectoryScannerImplBase):

2090

"""A feed of all of the Movies we find in the movie folder that don't

2091

belong to a "real" feed. If the user changes her movies folder, this feed

2092

will continue to remember movies in the old folder.

2093

"""

2094

def setup_new(self, ufeed):

2095

FeedImpl.setup_new(self, url=u"dtv:directoryfeed", ufeed=ufeed, title=None)

2096

self.set_update_frequency(5)

2097

self.schedule_update_events(0)

2098

2099

def _before_update(self):

2100

# Make sure container items have created FileItems for their contents

2101

for container in models.Item.containers_view():

2102

container.find_new_children()

2103

2104

def _calc_known_files(self):

2105

pass

2106

2107

def _add_known_files(self, known_files):

2108

# prevents files in Incomplete Downloads and Conversions from being

2109

# turned into FileItems.

2110

movies_dir = config.get(prefs.MOVIES_DIRECTORY)

2111

2112

incomplete_dir = os.path.join(movies_dir, "Incomplete Downloads")

2113

known_files.add(os.path.normcase(incomplete_dir))

2114

2115

conversions_dir = os.path.join(movies_dir, "Conversions")

2116

known_files.add(os.path.normcase(conversions_dir))

2117

2118

def _scan_dir(self):

2119

return config.get(prefs.MOVIES_DIRECTORY)

2120

2121

@returns_unicode

2122

def get_title(self):

2123

return _(u'Local Files')

2124

2125

class SearchFeedImpl(RSSMultiFeedBase):

2126

"""Search and Search Results feeds

2127

"""

2128

def setup_new(self, ufeed):

2129

self.engine = searchengines.get_search_engines()[0].name

2130

self.query = u''

2131

RSSMultiFeedBase.setup_new(self, url=u'dtv:search', ufeed=ufeed,

2132

title=_(u'Search'))

2133

self.initialUpdate = True

2134

self.searching = False

2135

self.set_update_frequency(-1)

2136

self.ufeed.autoDownloadable = False

2137

# keeps the items from being seen as 'newly available'

2138

self.ufeed.last_viewed = datetime.max

2139

self.ufeed.signal_change()

2140

2141

def setup_restored(self):

2142

self.searching = False

2143

RSSMultiFeedBase.setup_restored(self)

2144

2145

def calc_urls(self):

2146

if self.engine and self.query:

2147

return searchengines.get_request_urls(self.engine, self.query)

2148

else:

2149

return []

2150

2151

def reset(self, set_engine=None):

2152

self.ufeed.confirm_db_thread()

2153

was_searching = self.searching

2154

self._cancel_all_downloads()

2155

self.initialUpdate = True

2156

app.bulk_sql_manager.start()

2157

try:

2158

for item in self.items:

2159

item.remove()

2160

finally:

2161

app.bulk_sql_manager.finish()

2162

self.urls = []

2163

self.searching = False

2164

if set_engine is not None:

2165

self.engine = set_engine

2166

self.etag = {}

2167

self.modified = {}

2168

self.ufeed.icon_cache.reset()

2169

self.thumbURL = None

2170

self.ufeed.icon_cache.request_update(is_vital=True)

2171

if was_searching:

2172

self.ufeed.emit('update-finished')

2173

2174

def preserve_downloads(self, downloads_feed):

2175

self.ufeed.confirm_db_thread()

2176

for item in self.items:

2177

if item.get_state() not in ('new', 'not-downloaded'):

2178

item.set_feed(downloads_feed.id)

2179

2180

def set_engine(self, engine):

2181

self.engine = engine

2182

2183

def lookup(self, engine, query):

2184

check_u(engine)

2185

check_u(query)

2186

self.reset()

2187

self.searching = True

2188

self.engine = engine

2189

self.query = query

2190

self.urls = self.calc_urls()

2191

self.update()

2192

self.ufeed.signal_change()

2193

2194

def _handle_new_entry(self, entry, fp_values, channelTitle):

2195

"""Handle getting a new entry from a feed."""

2196

url = fp_values.data['url']

2197

if url is not None:

2198

dl = downloader.get_existing_downloader_by_url(url)

2199

if dl is not None:

2200

for item in dl.item_list:

2201

if ((item.get_feed_url() == 'dtv:searchDownloads'

2202

and item.get_url() == url)):

2203

try:

2204

if entry["id"] == item.get_rss_id():

2205

item.set_feed(self.ufeed.id)

2206

if not fp_values.compare_to_item(item):

2207

item.update_from_feed_parser_values(fp_values)

2208

return

2209

except KeyError:

2210

pass

2211

title = entry.get("title")

2212

oldtitle = item.entry_title

2213

if title == oldtitle:

2214

item.set_feed(self.ufeed.id)

2215

if not fp_values.compare_to_item(item):

2216

item.update_from_feed_parser_values(fp_values)

2217

return

2218

RSSMultiFeedBase._handle_new_entry(self, entry, fp_values, channelTitle)

2219

2220

def update_finished(self):

2221

self.searching = False

2222

RSSMultiFeedBase.update_finished(self)

2223

2224

def update(self):

2225

if self.urls:

2226

RSSMultiFeedBase.update(self)

2227

else:

2228

self.ufeed.emit('update-finished')

2229

2230

@returns_unicode

2231

def get_title(self):

2232

return _(u'Search')

2233

2234

class SearchDownloadsFeedImpl(FeedImpl):

2235

def setup_new(self, ufeed):

2236

FeedImpl.setup_new(self, url=u'dtv:searchDownloads', ufeed=ufeed,

2237

title=None)

2238

self.set_update_frequency(-1)

2239

2240

@returns_unicode

2241

def get_title(self):

2242

return _(u'Search')

2243

2244

class ManualFeedImpl(FeedImpl):

2245

"""Downloaded Videos/Torrents that have been added using by the

2246

user opening them with democracy.

2247

"""

2248

def setup_new(self, ufeed):

2249

FeedImpl.setup_new(self, url=u'dtv:manualFeed', ufeed=ufeed,

2250

title=None)

2251

self.ufeed.expire = u'never'

2252

self.set_update_frequency(-1)

2253

self.ufeed.last_viewed = datetime.max

2254

2255

@returns_unicode

2256

def get_title(self):

2257

return _(u'Local Files')

2258

2259

class SingleFeedImpl(FeedImpl):

2260

"""Single Video that is playing that has been added by the user

2261

opening them with democracy.

2262

"""

2263

def setup_new(self, ufeed):

2264

FeedImpl.setup_new(self, url=u'dtv:singleFeed', ufeed=ufeed,

2265

title=None)

2266

self.ufeed.expire = u'never'

2267

self.set_update_frequency(-1)

2268

2269

@returns_unicode

2270

def get_title(self):

2271

return _(u'Playing File')

2272

2273

LINK_PATTERN = re.compile("<(a|embed)\s[^>]*(href|src)\s*=\s*\"([^\"]*)\"[^>]*>(.*?)</a(.*)", re.S)

2274

IMG_PATTERN = re.compile(".*<img\s.*?src\s*=\s*\"(.*?)\".*?>", re.S)

2275

TAG_PATTERN = re.compile("<.*?>")

2276

2277

class HTMLLinkGrabber(HTMLParser):

2278

"""Parse HTML document and grab all of the links and titles.

2279

"""

2280

# FIXME: Grab link title from ALT tags in images

2281

# FIXME: Grab document title from TITLE tags

2282

def get_links(self, data, baseurl):

2283

self.links = []

2284

self.lastLink = None

2285

self.inLink = False

2286

self.inObject = False

2287

self.baseurl = baseurl

2288

self.inTitle = False

2289

self.title = None

2290

self.thumbnailUrl = None

2291

2292

match = LINK_PATTERN.search(data)

2293

while match:

2294

try:

2295

link_url = match.group(3).encode('ascii')

2296

except UnicodeError:

2297

link_url = match.group(3)

2298

i = len(link_url) - 1

2299

while (i >= 0):

2300

if 127 < ord(link_url[i]) <= 255:

2301

link_url = (link_url[:i] +

2302

"%%%02x" % (ord(link_url[i])) +

2303

link_url[i+1:])

2304

i = i - 1

2305

2306

link = urljoin(baseurl, link_url)

2307

desc = match.group(4)

2308

img_match = IMG_PATTERN.match(desc)

2309

if img_match:

2310

try:

2311

thumb = urljoin(baseurl, img_match.group(1).encode('ascii'))

2312

except UnicodeError:

2313

thumb = None

2314

else:

2315

thumb = None

2316

desc = TAG_PATTERN.sub(' ', desc)

2317

self.links.append((link, desc, thumb))

2318

match = LINK_PATTERN.search(match.group(5))

2319

return self.links

2320

2321

class RSSLinkGrabber(xml.sax.handler.ContentHandler,

2322

xml.sax.handler.ErrorHandler):

2323

def __init__(self, baseurl, charset=None):

2324

self.baseurl = baseurl

2325

self.charset = charset

2326

2327

def startDocument(self):

2328

#print "Got start document"

2329

self.enclosureCount = 0

2330

self.itemCount = 0

2331

self.links = []

2332

self.inLink = False

2333

self.inDescription = False

2334

self.inTitle = False

2335

self.inItem = False

2336

self.descHTML = ''

2337

self.theLink = ''

2338

self.title = None

2339

self.firstTag = True

2340

self.errors = 0

2341

self.fatal_errors = 0

2342

2343

def startElementNS(self, name, qname, attrs):

2344

uri = name[0]

2345

tag = name[1]

2346

if self.firstTag:

2347

self.firstTag = False

2348

if tag not in ['rss', 'feed']:

2349

raise xml.sax.SAXNotRecognizedException, "Not an RSS file"

2350

if tag.lower() == 'enclosure' or tag.lower() == 'content':

2351

self.enclosureCount += 1

2352

elif tag.lower() == 'link':

2353

self.inLink = True

2354

self.theLink = ''

2355

elif tag.lower() == 'description':

2356

self.inDescription = True

2357

self.descHTML = ''

2358

elif tag.lower() == 'item':

2359

self.itemCount += 1

2360

self.inItem = True

2361

elif tag.lower() == 'title' and not self.inItem:

2362

self.inTitle = True

2363

2364

def endElementNS(self, name, qname):

2365

uri = name[0]

2366

tag = name[1]

2367

if tag.lower() == 'description':

2368

lg = HTMLLinkGrabber()

2369

try:

2370

html = xhtmlify(unescape(self.descHTML), add_top_tags=True)

2371

if not self.charset is None:

2372

html = fix_html_header(html, self.charset)

2373

self.links[:0] = lg.get_links(html, self.baseurl)

2374

except HTMLParseError: # Don't bother with bad HTML

2375

logging.info ("bad HTML in description for %s", self.baseurl)

2376

self.inDescription = False

2377

elif tag.lower() == 'link':

2378

self.links.append((self.theLink, None, None))

2379

self.inLink = False

2380

elif tag.lower() == 'item':

2381

self.inItem = False

2382

elif tag.lower() == 'title' and not self.inItem:

2383

self.inTitle = False

2384

2385

def characters(self, data):

2386

if self.inDescription:

2387

self.descHTML += data

2388

elif self.inLink:

2389

self.theLink += data

2390

elif self.inTitle:

2391

if self.title is None:

2392

self.title = data

2393

else:

2394

self.title += data

2395

2396

def error(self, exception):

2397

self.errors += 1

2398

2399

def fatalError(self, exception):

2400

self.fatal_errors += 1

2401

2402

class HTMLFeedURLParser(HTMLParser):

2403

"""Grabs the feed link from the given webpage

2404

"""

2405

def get_link(self, baseurl, data):

2406

self.baseurl = baseurl

2407

self.link = None

2408

try:

2409

self.feed(data)

2410

except HTMLParseError:

2411

logging.info ("error parsing %s", baseurl)

2412

try:

2413

self.close()

2414

except HTMLParseError:

2415

logging.info ("error closing %s", baseurl)

2416

return self.link

2417

2418

def handle_starttag(self, tag, attrs):

2419

attrdict = {}

2420

for (key, value) in attrs:

2421

attrdict[key.lower()] = value

2422

if (tag.lower() == 'link' and attrdict.has_key('rel') and

2423

attrdict.has_key('type') and attrdict.has_key('href') and

2424

attrdict['rel'].lower() == 'alternate' and

2425

attrdict['type'].lower() in ['application/rss+xml',

2426

'application/podcast+xml',

2427

'application/rdf+xml',

2428

'application/atom+xml',

2429

'text/xml',

2430

'application/xml']):

2431

self.link = urljoin(self.baseurl, attrdict['href'])

2432

2433

def expire_items():

2434

try:

2435

for feed in Feed.make_view():

2436

feed.expire_items()

2437

finally:

2438

eventloop.add_timeout(300, expire_items, "Expire Items")

2439

2440

def lookup_feed(url, search_term=None):

2441

try:

2442

return Feed.get_by_url_and_search(url, search_term)

2443

except ObjectNotFoundError:

2444

return None

2445

2446

def remove_orphaned_feed_impls():

2447

removed_impls = []

2448

for klass in (FeedImpl, RSSFeedImpl, SavedSearchFeedImpl,

2449

ScraperFeedImpl, SearchFeedImpl, DirectoryFeedImpl,

2450

DirectoryWatchFeedImpl, SearchDownloadsFeedImpl,):

2451

for feed_impl in klass.orphaned_view():

2452

logging.warn("No feed for FeedImpl: %s. Discarding", feed_impl)

2453

feed_impl.remove()

2454

removed_impls.append(feed_impl.url)

2455

if removed_impls:

2456

databaselog.info("Removed FeedImpl objects without a feed: %s",

2457

','.join(removed_impls))

2458

2459

restored_feeds = []

2460

def start_updates():

2461

global restored_feeds

2462

if config.get(prefs.CHECK_CHANNELS_EVERY_X_MN) == -1:

2463

return

2464

for feed in restored_feeds:

2465

if feed.id_exists():

2466

feed.update_after_restore()

2467

restored_feeds = []

Older »