~ubuntu-branches/ubuntu/oneiric/rhythmbox/oneiric

« back to all changes in this revision

Viewing changes to plugins/lyrics/WinampcnParser.py

  • Committer: Bazaar Package Importer
  • Author(s): Rico Tzschichholz
  • Date: 2011-07-29 16:41:38 UTC
  • mto: This revision was merged to the branch mainline in revision 191.
  • Revision ID: james.westby@ubuntu.com-20110729164138-wwicy8nqalm18ck7
Tags: upstream-2.90.1~20110802
ImportĀ upstreamĀ versionĀ 2.90.1~20110802

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
# -*- Mode: python; coding: utf-8; tab-width: 8; indent-tabs-mode: t; -*-
 
2
#
 
3
# Copyright (C) 2007 Austin  <austiny@sohu.com>
 
4
#
 
5
# This program is free software; you can redistribute it and/or modify
 
6
# it under the terms of the GNU General Public License as published by
 
7
# the Free Software Foundation; either version 2, or (at your option)
 
8
# any later version.
 
9
#
 
10
# The Rhythmbox authors hereby grant permission for non-GPL compatible
 
11
# GStreamer plugins to be used and distributed together with GStreamer
 
12
# and Rhythmbox. This permission is above and beyond the permissions granted
 
13
# by the GPL license by which Rhythmbox is covered. If you modify this code
 
14
# you may extend this exception to your version of the code, but you are not
 
15
# obligated to do so. If you do not wish to do so, delete this exception
 
16
# statement from your version.
 
17
#
 
18
# This program is distributed in the hope that it will be useful,
 
19
# but WITHOUT ANY WARRANTY; without even the implied warranty of
 
20
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 
21
# GNU General Public License for more details.
 
22
#
 
23
# You should have received a copy of the GNU General Public License
 
24
# along with this program; if not, write to the Free Software
 
25
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301  USA.
 
26
 
 
27
import sys
 
28
import urllib
 
29
import gettext
 
30
import re
 
31
import rb
 
32
from xml.dom import minidom
 
33
 
 
34
def detect_charset(s):
 
35
        charsets = ('iso-8859-1', 'gbk', 'utf-8')
 
36
        for charset in charsets:
 
37
                try:
 
38
                        return unicode(unicode(s, 'utf-8').encode(charset), 'gbk')
 
39
                except:
 
40
                        continue
 
41
        return s
 
42
 
 
43
class WinampcnParser(object):
 
44
        def __init__(self, artist, title):
 
45
                self.artist = artist
 
46
                self.title = title
 
47
        
 
48
        def search(self, callback, *data):
 
49
 
 
50
                # encode search string
 
51
                title_encode = urllib.quote(detect_charset(self.title).encode('gbk').replace(' ', ''))
 
52
                artist_encode = urllib.quote(detect_charset(self.artist).encode('gbk').replace(' ',''))
 
53
                url = 'http://www.winampcn.com/lyrictransfer/get.aspx?song=%s&artist=%s&lsong=%s&Datetime=20060601' % (title_encode, artist_encode, title_encode)
 
54
                
 
55
                loader = rb.Loader()
 
56
                loader.get_url (url, self.got_lyrics, callback, *data)
 
57
                
 
58
        def got_lyrics(self, xmltext, callback, *data):
 
59
                # retrieve xml content
 
60
                if xmltext is None:
 
61
                        callback (None, *data)
 
62
                        return
 
63
 
 
64
                try:
 
65
                        xmltext = xmltext.decode('gbk').encode('UTF-8')
 
66
                        xmltext = xmltext.replace('encoding="gb2312"', 'encoding="UTF-8"')
 
67
                        xmldoc = minidom.parseString(xmltext)
 
68
                        root = xmldoc.documentElement
 
69
 
 
70
                        lrcurl = root.getElementsByTagName('LyricUrl')[0].childNodes[0].data
 
71
                        if lrcurl is None:
 
72
                                callback (xmltext, *data)
 
73
                                return
 
74
 
 
75
                        # download the lyrics file
 
76
                        lrcurl_encode = urllib.quote(detect_charset(lrcurl).encode('gbk'))
 
77
                        lrcurl_encode = lrcurl_encode.replace('%3A', ':');
 
78
 
 
79
                        loader = rb.Loader()
 
80
                        loader.get_url (lrcurl_encode, self.parse_lyrics, callback, *data)
 
81
                except:
 
82
                        callback (None, *data)
 
83
 
 
84
 
 
85
        def parse_lyrics(self, lyrics, callback, *data):
 
86
 
 
87
                if lyrics is None:
 
88
                        callback (None, *data)
 
89
                        return
 
90
 
 
91
                # transform it into plain text
 
92
                lrcplaintext = lyrics
 
93
                try:
 
94
                        lrcplaintext = re.sub('\[.*?\]', '', lrcplaintext)
 
95
                        lrcplaintext = lrcplaintext.decode('gbk').encode('UTF-8')
 
96
                except:
 
97
                        callback (lrcplaintext, *data)
 
98
                        return
 
99
 
 
100
                # callback and show
 
101
                lrcplaintext += "\n\nLyrics provided by winampcn.com"
 
102
                callback(lrcplaintext, *data)
 
103