implement spotify search
parent
87c01cf7d7
commit
134be89024
197
addMetadata.py
197
addMetadata.py
|
@ -1,22 +1,18 @@
|
|||
import sys
|
||||
import os
|
||||
from os.path import basename
|
||||
import acoustid
|
||||
import discogs_client as discogs
|
||||
import musicbrainzngs as m
|
||||
import eyed3
|
||||
from bs4 import BeautifulSoup
|
||||
import requests
|
||||
import json
|
||||
import spotipy
|
||||
import spotipy.oauth2 as oauth2
|
||||
import re
|
||||
from titlecase import titlecase
|
||||
import requests
|
||||
from bs4 import BeautifulSoup
|
||||
|
||||
|
||||
def improve_song_names(songs):
|
||||
text_file = open("blacklist.txt", "r")
|
||||
blacklistWords = text_file.read().splitlines()
|
||||
blacklistWords = [word.lower() for word in blacklistWords]
|
||||
char_filters = "()[]{}-:_/=+\"\'"
|
||||
word_filters = ('lyrics', 'lyric', 'by', 'video', 'official', 'hd', 'dirty', 'with', 'lyrics', 'feat', 'original', 'mix',
|
||||
'www', 'com', 'mp3', 'audio', 'remixed', 'remix', 'full', 'version', 'music', 'hq', 'uploaded', 'explicit')
|
||||
|
||||
reg_exp = 's/^\d\d //'
|
||||
improved_names = []
|
||||
|
@ -24,93 +20,55 @@ def improve_song_names(songs):
|
|||
song = song.strip()
|
||||
song = song.lstrip("0123456789.- ")
|
||||
# re.sub(reg_exp, '', song)
|
||||
searchText = song[0:-4]
|
||||
for word in song[0:-4].split(' '):
|
||||
if word.lower() in blacklistWords:
|
||||
searchText = searchText.replace(word, '')
|
||||
song = song[0:-4]
|
||||
song = ''.join(
|
||||
map(lambda c: " " if c in char_filters else c, song))
|
||||
|
||||
improved_names.append(searchText.strip())
|
||||
song = re.sub('|'.join(re.escape(key) for key in word_filters),
|
||||
"", song, flags=re.IGNORECASE)
|
||||
|
||||
song = ' '.join(song.split())
|
||||
improved_names.append(song.strip())
|
||||
|
||||
return improved_names
|
||||
|
||||
|
||||
def get_soup(url, headers):
|
||||
r = requests.get(url, headers=headers)
|
||||
soup = BeautifulSoup(r.text, 'html.parser')
|
||||
return soup
|
||||
def get_song_name(title, artist):
|
||||
return title + ' - ' + artist
|
||||
|
||||
|
||||
def get_albumart_google(song_name):
|
||||
url = "https://www.google.co.in/search?q=" + \
|
||||
song_name.replace(" ", "_") + "&source=lnms&tbm=isch"
|
||||
def get_metadata_spotify(spotify, song_name):
|
||||
metadata = {}
|
||||
meta_tags = spotify.search(song_name, limit=1)['tracks']['items'][0]
|
||||
|
||||
HEADERS = {
|
||||
'User-Agent': "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36"
|
||||
}
|
||||
metadata['title'] = meta_tags['name']
|
||||
metadata['artist'] = meta_tags['artists'][0]['name']
|
||||
metadata['album'] = meta_tags['album']['name']
|
||||
metadata['album_artist'] = meta_tags['album']['artists'][0]['name']
|
||||
|
||||
soup = get_soup(url, HEADERS)
|
||||
ActualImages = []
|
||||
for a in soup.find_all("div", {"class": "rg_meta"}):
|
||||
link, Type = json.loads(a.text)["ou"], json.loads(a.text)["ity"]
|
||||
return link
|
||||
print(link)
|
||||
ActualImages.append((link, Type))
|
||||
album_id = meta_tags['album']['id']
|
||||
album_meta_tags = spotify.album(album_id)
|
||||
|
||||
return ActualImages
|
||||
|
||||
|
||||
def get_metadata_acoustid(song):
|
||||
API_KEY = 'GkQibmzT1u'
|
||||
metadata['release-date'] = album_meta_tags['release_date']
|
||||
try:
|
||||
results = acoustid.match(API_KEY, song)
|
||||
except acoustid.NoBackendError:
|
||||
print("chromaprint library/tool not found", file=sys.stderr)
|
||||
sys.exit(1)
|
||||
except acoustid.FingerprintGenerationError:
|
||||
print("fingerprint could not be calculated", file=sys.stderr)
|
||||
sys.exit(1)
|
||||
except acoustid.WebServiceError as exc:
|
||||
print("web service request failed:", exc.message, file=sys.stderr)
|
||||
sys.exit(1)
|
||||
except acoustid.FingerprintSubmissionError:
|
||||
print("Error")
|
||||
metadata['genre'] = titlecase(album_meta_tags['genres'][0])
|
||||
except IndexError:
|
||||
try:
|
||||
artist_id = meta_tags['artists'][0]['id']
|
||||
artist_meta_tags = spotify.artist(artist_id)
|
||||
metadata['genre'] = titlecase(artist_meta_tags['genres'][0])
|
||||
|
||||
first = True
|
||||
scoreMax = 0
|
||||
|
||||
for result in results:
|
||||
if first:
|
||||
first = False
|
||||
else:
|
||||
# print(result)
|
||||
if(result[0] > scoreMax):
|
||||
scoreMax = result[0]
|
||||
else:
|
||||
except IndexError:
|
||||
pass
|
||||
score, rid, title, artist = result[0], result[1], result[2], result[3]
|
||||
valid = True
|
||||
albumart = get_albumart_google(title + " - " + artist)
|
||||
break
|
||||
|
||||
if first is True:
|
||||
print("No Data found for " + song + " .... Skipping it")
|
||||
score = rid = title = artist = albumart = None
|
||||
valid = False
|
||||
metadata['track_num'] = meta_tags['track_number']
|
||||
metadata['disc_num'] = meta_tags['disc_number']
|
||||
|
||||
return valid, score, rid, title, artist, albumart
|
||||
metadata['albumart'] = meta_tags['album']['images'][0]['url']
|
||||
# metadata['lyrics'] = get_lyrics_genius(
|
||||
# get_song_name(metadata['title'], metadata['artist']))
|
||||
|
||||
|
||||
def get_metadata_musicbrainz(rid, artist, title):
|
||||
d = m.set_useragent(
|
||||
"MetadataRepair",
|
||||
"0.1",
|
||||
"https://github.com/yash2696/python-musicbrainzngs/",
|
||||
)
|
||||
|
||||
result = m.search_recordings(
|
||||
artist=artist, recording=title, rid=rid, limit=5)
|
||||
|
||||
print(result)
|
||||
return metadata
|
||||
|
||||
|
||||
def list_files():
|
||||
|
@ -118,47 +76,6 @@ def list_files():
|
|||
return [f for f in os.listdir('.') if f.endswith('.mp3')]
|
||||
|
||||
|
||||
def get_metadata_discogs(song_name):
|
||||
d = discogs.Client('ExampleApplication/0.1',
|
||||
user_token="mbNSnSrqdyJOKorCDBXjzzeYNhgulysWNJbwgBmk")
|
||||
|
||||
results = d.search(song_name, type="release")
|
||||
first_result = results.page(1)[0]
|
||||
|
||||
title = first_result.title
|
||||
|
||||
print(title)
|
||||
print(first_result.artists[0].name)
|
||||
print(first_result.images[0])
|
||||
|
||||
|
||||
def add_metadata(file_name, album_art):
|
||||
"""
|
||||
Add album_art in .mp3's tags
|
||||
"""
|
||||
|
||||
img = requests.get(
|
||||
"https://i.ytimg.com/vi/7S0MWoXYH5k/maxresdefault.jpg", stream=True)
|
||||
img = img.raw
|
||||
|
||||
audiofile = eyed3.load(file_name)
|
||||
tag = audiofile.tag
|
||||
|
||||
tag.artist = "Alka Yagnik"
|
||||
tag.album = "Lajja"
|
||||
tag.title = "Badi Mushkil Baba Badi Mushkil"
|
||||
tag.images.set(3, img.read(), "image/jpeg", u"Google image")
|
||||
tag.lyrics.set(u""" """)
|
||||
|
||||
# write it back
|
||||
audiofile.tag.save()
|
||||
|
||||
|
||||
# def get_metadata_spotify(song):
|
||||
# spotify.search(song, limit=1)['tracks']['items'][0]
|
||||
# return
|
||||
|
||||
|
||||
def main():
|
||||
auth = oauth2.SpotifyClientCredentials(
|
||||
client_id='622a0e16a4914e3eadc2a37b4a134f1e',
|
||||
|
@ -169,38 +86,10 @@ def main():
|
|||
files = list_files()
|
||||
improved_name = improve_song_names(files)
|
||||
|
||||
# get_metadata_spotify(files[1])
|
||||
|
||||
# valid, score, rid, title, artist, albumart = get_metadata_acoustid(
|
||||
# "35. Mike Posner - I Took a Pill in Ibiza (SeeB Remix).mp3")
|
||||
|
||||
# print(valid, score, rid, title, artist, albumart)
|
||||
# add_album_art(
|
||||
# "Badi.mp3", "")
|
||||
# for file_name in files:
|
||||
# print("-------------" + file_name + "------------------")
|
||||
# print()
|
||||
# valid, score, rid, title, artist = get_metadata_acoustid(file_name)
|
||||
# if valid == True:
|
||||
# get_metadata_musicbrainz(rid, artist, title)
|
||||
# add_metadata(file_name, rid, title, artist)
|
||||
# print()
|
||||
# break
|
||||
|
||||
# files = improve_song_names(files)
|
||||
# print(files)
|
||||
# count = 0
|
||||
# for file_name in files:
|
||||
# print("-------------" + file_name + "------------------")
|
||||
# print()
|
||||
# get_metadata_discogs(file_name)
|
||||
# count += 1
|
||||
# if count > 5:
|
||||
# break
|
||||
# print()
|
||||
|
||||
# get_albumart_google(
|
||||
# "Mike Posner - I Took a Pill in Ibiza (acoustic)")
|
||||
# print(improved_name[19])
|
||||
# print(files[16])
|
||||
metadata = get_metadata_spotify(
|
||||
spotify, improved_name[19])
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
|
|
Loading…
Reference in New Issue