implement spotify search

pull/1/head
Yash Agarwal 2017-06-17 12:20:24 +05:30
parent 87c01cf7d7
commit 134be89024
1 changed files with 44 additions and 155 deletions

View File

@ -1,22 +1,18 @@
import sys
import os
from os.path import basename
import acoustid
import discogs_client as discogs
import musicbrainzngs as m
import eyed3
from bs4 import BeautifulSoup
import requests
import json
import spotipy
import spotipy.oauth2 as oauth2
import re
from titlecase import titlecase
import requests
from bs4 import BeautifulSoup
def improve_song_names(songs):
text_file = open("blacklist.txt", "r")
blacklistWords = text_file.read().splitlines()
blacklistWords = [word.lower() for word in blacklistWords]
char_filters = "()[]{}-:_/=+\"\'"
word_filters = ('lyrics', 'lyric', 'by', 'video', 'official', 'hd', 'dirty', 'with', 'lyrics', 'feat', 'original', 'mix',
'www', 'com', 'mp3', 'audio', 'remixed', 'remix', 'full', 'version', 'music', 'hq', 'uploaded', 'explicit')
reg_exp = 's/^\d\d //'
improved_names = []
@ -24,93 +20,55 @@ def improve_song_names(songs):
song = song.strip()
song = song.lstrip("0123456789.- ")
# re.sub(reg_exp, '', song)
searchText = song[0:-4]
for word in song[0:-4].split(' '):
if word.lower() in blacklistWords:
searchText = searchText.replace(word, '')
song = song[0:-4]
song = ''.join(
map(lambda c: " " if c in char_filters else c, song))
improved_names.append(searchText.strip())
song = re.sub('|'.join(re.escape(key) for key in word_filters),
"", song, flags=re.IGNORECASE)
song = ' '.join(song.split())
improved_names.append(song.strip())
return improved_names
def get_soup(url, headers):
r = requests.get(url, headers=headers)
soup = BeautifulSoup(r.text, 'html.parser')
return soup
def get_song_name(title, artist):
return title + ' - ' + artist
def get_albumart_google(song_name):
url = "https://www.google.co.in/search?q=" + \
song_name.replace(" ", "_") + "&source=lnms&tbm=isch"
def get_metadata_spotify(spotify, song_name):
metadata = {}
meta_tags = spotify.search(song_name, limit=1)['tracks']['items'][0]
HEADERS = {
'User-Agent': "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36"
}
metadata['title'] = meta_tags['name']
metadata['artist'] = meta_tags['artists'][0]['name']
metadata['album'] = meta_tags['album']['name']
metadata['album_artist'] = meta_tags['album']['artists'][0]['name']
soup = get_soup(url, HEADERS)
ActualImages = []
for a in soup.find_all("div", {"class": "rg_meta"}):
link, Type = json.loads(a.text)["ou"], json.loads(a.text)["ity"]
return link
print(link)
ActualImages.append((link, Type))
album_id = meta_tags['album']['id']
album_meta_tags = spotify.album(album_id)
return ActualImages
def get_metadata_acoustid(song):
API_KEY = 'GkQibmzT1u'
metadata['release-date'] = album_meta_tags['release_date']
try:
results = acoustid.match(API_KEY, song)
except acoustid.NoBackendError:
print("chromaprint library/tool not found", file=sys.stderr)
sys.exit(1)
except acoustid.FingerprintGenerationError:
print("fingerprint could not be calculated", file=sys.stderr)
sys.exit(1)
except acoustid.WebServiceError as exc:
print("web service request failed:", exc.message, file=sys.stderr)
sys.exit(1)
except acoustid.FingerprintSubmissionError:
print("Error")
metadata['genre'] = titlecase(album_meta_tags['genres'][0])
except IndexError:
try:
artist_id = meta_tags['artists'][0]['id']
artist_meta_tags = spotify.artist(artist_id)
metadata['genre'] = titlecase(artist_meta_tags['genres'][0])
first = True
scoreMax = 0
except IndexError:
pass
for result in results:
if first:
first = False
else:
# print(result)
if(result[0] > scoreMax):
scoreMax = result[0]
else:
pass
score, rid, title, artist = result[0], result[1], result[2], result[3]
valid = True
albumart = get_albumart_google(title + " - " + artist)
break
metadata['track_num'] = meta_tags['track_number']
metadata['disc_num'] = meta_tags['disc_number']
if first is True:
print("No Data found for " + song + " .... Skipping it")
score = rid = title = artist = albumart = None
valid = False
metadata['albumart'] = meta_tags['album']['images'][0]['url']
# metadata['lyrics'] = get_lyrics_genius(
# get_song_name(metadata['title'], metadata['artist']))
return valid, score, rid, title, artist, albumart
def get_metadata_musicbrainz(rid, artist, title):
d = m.set_useragent(
"MetadataRepair",
"0.1",
"https://github.com/yash2696/python-musicbrainzngs/",
)
result = m.search_recordings(
artist=artist, recording=title, rid=rid, limit=5)
print(result)
return metadata
def list_files():
@ -118,47 +76,6 @@ def list_files():
return [f for f in os.listdir('.') if f.endswith('.mp3')]
def get_metadata_discogs(song_name):
d = discogs.Client('ExampleApplication/0.1',
user_token="mbNSnSrqdyJOKorCDBXjzzeYNhgulysWNJbwgBmk")
results = d.search(song_name, type="release")
first_result = results.page(1)[0]
title = first_result.title
print(title)
print(first_result.artists[0].name)
print(first_result.images[0])
def add_metadata(file_name, album_art):
"""
Add album_art in .mp3's tags
"""
img = requests.get(
"https://i.ytimg.com/vi/7S0MWoXYH5k/maxresdefault.jpg", stream=True)
img = img.raw
audiofile = eyed3.load(file_name)
tag = audiofile.tag
tag.artist = "Alka Yagnik"
tag.album = "Lajja"
tag.title = "Badi Mushkil Baba Badi Mushkil"
tag.images.set(3, img.read(), "image/jpeg", u"Google image")
tag.lyrics.set(u""" """)
# write it back
audiofile.tag.save()
# def get_metadata_spotify(song):
# spotify.search(song, limit=1)['tracks']['items'][0]
# return
def main():
auth = oauth2.SpotifyClientCredentials(
client_id='622a0e16a4914e3eadc2a37b4a134f1e',
@ -169,38 +86,10 @@ def main():
files = list_files()
improved_name = improve_song_names(files)
# get_metadata_spotify(files[1])
# valid, score, rid, title, artist, albumart = get_metadata_acoustid(
# "35. Mike Posner - I Took a Pill in Ibiza (SeeB Remix).mp3")
# print(valid, score, rid, title, artist, albumart)
# add_album_art(
# "Badi.mp3", "")
# for file_name in files:
# print("-------------" + file_name + "------------------")
# print()
# valid, score, rid, title, artist = get_metadata_acoustid(file_name)
# if valid == True:
# get_metadata_musicbrainz(rid, artist, title)
# add_metadata(file_name, rid, title, artist)
# print()
# break
# files = improve_song_names(files)
# print(files)
# count = 0
# for file_name in files:
# print("-------------" + file_name + "------------------")
# print()
# get_metadata_discogs(file_name)
# count += 1
# if count > 5:
# break
# print()
# get_albumart_google(
# "Mike Posner - I Took a Pill in Ibiza (acoustic)")
# print(improved_name[19])
# print(files[16])
metadata = get_metadata_spotify(
spotify, improved_name[19])
if __name__ == "__main__":