%PDF- %PDF-
Direktori : /lib/x86_64-linux-gnu/rhythmbox/plugins/lyrics/ |
Current File : //lib/x86_64-linux-gnu/rhythmbox/plugins/lyrics/JetlyricsParser.py |
# -*- Mode: python; coding: utf-8; tab-width: 8; indent-tabs-mode: t; -*-
#
# Copyright (C) 2012 He Jian <hejian.he@gmail.com>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2, or (at your option)
# any later version.
#
# The Rhythmbox authors hereby grant permission for non-GPL compatible
# GStreamer plugins to be used and distributed together with GStreamer
# and Rhythmbox. This permission is above and beyond the permissions granted
# by the GPL license by which Rhythmbox is covered. If you modify this code
# you may extend this exception to your version of the code, but you are not
# obligated to do so. If you do not wish to do so, delete this exception
# statement from your version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
import re
import urllib.parse

import rb


class JetlyricsParser(object):
    """Fetch the lyrics of one song from jetlyrics.com.

    The lookup is a chain of three steps, each handing the next one to
    ``rb.Loader.get_url`` as its completion handler:

    1. ``search`` requests the site's search page for "title - artist".
    2. ``got_results`` picks the first lyrics-page link out of that page
       and requests it.
    3. ``parse_lyrics`` extracts the lyrics text from the lyrics page.

    Whatever the outcome, the chain ends with ``callback(lyrics, *data)``
    where ``lyrics`` is the formatted text, or ``None`` when nothing was
    found.

    NOTE(review): ``rb.Loader`` is defined outside this file; judging by
    the ``None`` checks and ``.decode`` calls below it is expected to pass
    the response body as ``bytes``, or ``None`` on failure -- confirm.
    """

    # First link to a lyrics page inside the search results HTML.
    _RESULT_LINK_RE = re.compile(
        r"<a href='(http://jetlyrics\.com/viewlyrics\.php\?id=[0-9]*)'>")
    # The three line-break spellings handled: <br>, <br/> and <br />.
    _LINE_BREAK_RE = re.compile(r'<br(?: ?/)?>')
    # Markers delimiting the lyrics text on a lyrics page.
    _LYRICS_START = '<div id=lyricsText>'
    _LYRICS_END = '</div>'
    # Site back-links embedded in the lyrics text; removed verbatim, in
    # this order.
    _SITE_LINKS = (
        "<noscript><a href='http://jetlyrics.com'>Lyrics</a></noscript>",
        "<a href='http://jetlyrics.com'>Jet Lyrics</a>",
    )

    def __init__(self, artist, title):
        """Remember the ``artist`` and ``title`` strings to search for."""
        self.artist = artist
        self.title = title

    def search(self, callback, *data):
        """Start the lookup by requesting the site's search page.

        ``callback`` is eventually invoked as ``callback(lyrics, *data)``
        by ``got_results`` or ``parse_lyrics``.
        """
        # Quote the complete query in one go so that the spaces of the
        # ' - ' separator are escaped as well; quoting title and artist
        # separately left raw spaces in the URL.
        query = urllib.parse.quote_plus(self.title + ' - ' + self.artist)
        url = 'http://www.jetlyrics.com/search.php?q=%s' % (query)
        loader = rb.Loader()
        loader.get_url(url, self.got_results, callback, *data)

    def got_results(self, result, callback, *data):
        """Handle the search page: follow its first lyrics-page link.

        Calls ``callback(None, *data)`` when ``result`` is ``None`` or the
        page contains no lyrics-page link.
        """
        if result is None:
            callback(None, *data)
            return

        # A badly encoded page must not abort the chain with
        # UnicodeDecodeError, otherwise callback would never be invoked.
        page = result.decode('utf-8', errors='replace')
        match = self._RESULT_LINK_RE.search(page)
        if match is None:
            callback(None, *data)
            return

        loader = rb.Loader()
        loader.get_url(match.group(1), self.parse_lyrics, callback, *data)

    def parse_lyrics(self, result, callback, *data):
        """Handle the lyrics page: extract the text and report it.

        On success ``callback`` receives the song title, a blank line, the
        lyrics with ``<br>`` tags turned into newlines, and a credit line.
        Calls ``callback(None, *data)`` when ``result`` is ``None`` or the
        page has no lyrics container.
        """
        if result is None:
            callback(None, *data)
            return

        page = result.decode('utf-8', errors='replace')
        sections = page.split(self._LYRICS_START)
        if len(sections) < 2:
            # No lyrics container on the page: report "not found" rather
            # than raising IndexError and dropping the callback.
            callback(None, *data)
            return

        # Text between the first start marker and the next closing </div>.
        lyrics = sections[1].split(self._LYRICS_END, 1)[0]
        lyrics = self._LINE_BREAK_RE.sub('\n', lyrics)
        for link in self._SITE_LINKS:
            lyrics = lyrics.replace(link, '')

        lyrics = self.title + "\n\n" + lyrics
        lyrics += "\n\nLyrics provided by jetlyrics.com"
        callback(lyrics, *data)