/usr/lib/rhythmbox/plugins/lyrics/JetlyricsParser.py is in rhythmbox-plugins 3.1-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
# -*- Mode: python; coding: utf-8; tab-width: 8; indent-tabs-mode: t; -*-
#
# Copyright (C) 2012 He Jian <hejian.he@gmail.com>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2, or (at your option)
# any later version.
#
# The Rhythmbox authors hereby grant permission for non-GPL compatible
# GStreamer plugins to be used and distributed together with GStreamer
# and Rhythmbox. This permission is above and beyond the permissions granted
# by the GPL license by which Rhythmbox is covered. If you modify this code
# you may extend this exception to your version of the code, but you are not
# obligated to do so. If you do not wish to do so, delete this exception
# statement from your version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
import rb
import urllib.parse
import re
class JetlyricsParser (object):
    """Look up the lyrics of one song on jetlyrics.com.

    The lookup is a chain of two asynchronous fetches made through
    ``rb.Loader``: the site's search page, then the first lyrics page
    linked from the search results.  The final outcome is delivered by
    calling ``callback(lyrics, *data)``, where ``lyrics`` is the lyrics
    text or ``None`` when nothing could be found.
    """

    def __init__(self, artist, title):
        """Remember the artist and title (both strings) to search for."""
        self.artist = artist
        self.title = title

    def _search_url(self):
        """Return the jetlyrics.com search URL for this title and artist."""
        # Quote the complete "title - artist" query in one go.  Quoting the
        # two halves separately and gluing them with ' - ' left raw spaces
        # in the query string, which is not a valid URL.
        query = urllib.parse.quote_plus(self.title + ' - ' + self.artist)
        return 'http://www.jetlyrics.com/search.php?q=%s' % (query,)

    def search(self, callback, *data):
        """Start the lookup.

        callback -- called as ``callback(lyrics, *data)`` once the lookup
                    finishes; ``lyrics`` is ``None`` on failure.
        data     -- extra positional arguments passed through to callback.
        """
        loader = rb.Loader()
        loader.get_url(self._search_url(), self.got_results, callback, *data)

    def got_results(self, result, callback, *data):
        """Handle the search page and request the first lyrics page it links.

        result -- the fetched search page as bytes, or ``None`` if the
                  fetch failed.
        """
        if result is None:
            callback(None, *data)
            return

        # Be lenient about stray bytes: a strict decode would raise here and
        # the caller's callback would never be invoked.
        page = result.decode('utf-8', errors='replace')
        match = re.search(
            r"<a href='(http://jetlyrics\.com/viewlyrics\.php\?id=[0-9]*)'>",
            page)
        if match is None:
            callback(None, *data)
            return

        loader = rb.Loader()
        loader.get_url(match.group(1), self.parse_lyrics, callback, *data)

    def parse_lyrics(self, result, callback, *data):
        """Extract the lyrics text from a lyrics page and hand it to callback.

        result -- the fetched lyrics page as bytes, or ``None`` if the fetch
                  failed.

        ``callback`` receives ``None`` when the fetch failed or the page
        contains no ``<div id=lyricsText>`` section; otherwise it receives
        the song title, a blank line, the lyrics and a credit line.
        """
        if result is None:
            callback(None, *data)
            return

        page = result.decode('utf-8', errors='replace')

        sections = page.split('<div id=lyricsText>')
        if len(sections) < 2:
            # No lyrics container on this page: report "not found" instead
            # of failing with an IndexError.
            callback(None, *data)
            return
        lyrics = sections[1].split('</div>')[0]

        # Turn HTML line breaks into real newlines.
        for line_break in ('<br/>', '<br />', '<br>'):
            lyrics = lyrics.replace(line_break, '\n')

        # Drop the site's self-promotion links embedded in the lyrics text.
        for advert in (
                "<noscript><a href='http://jetlyrics.com'>Lyrics</a></noscript>",
                "<a href='http://jetlyrics.com'>Jet Lyrics</a>"):
            lyrics = lyrics.replace(advert, '')

        lyrics = self.title + "\n\n" + lyrics
        lyrics += "\n\nLyrics provided by jetlyrics.com"

        callback(lyrics, *data)
|