-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathgenius.py
40 lines (30 loc) · 1.02 KB
/
genius.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
from bs4 import BeautifulSoup
import urllib.request
import sys
class Genius:
def __init__(self, URL):
self.URL = URL
self.html_source = ''
def get_URL(self, URL):
self.header = urllib.request.Request(self.URL, headers={'User-Agent' : "Magic Browser"})
self.html_source = urllib.request.urlopen(self.header)
self.soup = BeautifulSoup(self.html_source, 'html.parser')
def get_lyrics(self):
bad = 'googletag'
lyrics = self.soup.find('div','song_body-lyrics')
message = lyrics.get_text()
for item in message.split('\n'):
if (bad in item):
strip = (item.strip()[0:91])
message = message.replace(strip, '\n')
message = message.replace('\n', '<br>')
message = '<p>' + message + '</p>'
print(message)
#URL = 'http://genius.com/Beyonce-sorry-lyrics'
URL = sys.argv[1]
lyrics = Genius(URL)
if (not URL.find("http")):
lyrics.get_URL('http://' + URL)
else:
lyrics.get_URL(URL)
lyrics.get_lyrics()