implement spotify search

2017-06-17 12:20:24 +05:30 · 2017-06-17 12:20:24 +05:30 · 134be89024
parent 87c01cf7d7
commit 134be89024
1 changed files with 44 additions and 155 deletions
--- a/addMetadata.py
+++ b/addMetadata.py
@ -1,22 +1,18 @@
 import sys
 import os
 from os.path import basename
 import acoustid
 import discogs_client as discogs
 import musicbrainzngs as m
 import eyed3
 from bs4 import BeautifulSoup
 import requests
 import json
 import spotipy
 import spotipy.oauth2 as oauth2
 import re
 from titlecase import titlecase
 import requests
 from bs4 import BeautifulSoup
 def improve_song_names(songs):
-    text_file = open("blacklist.txt", "r")
+    char_filters = "()[]{}-:_/=+\"\'"
-    blacklistWords = text_file.read().splitlines()
+    word_filters = ('lyrics', 'lyric', 'by', 'video', 'official', 'hd', 'dirty', 'with', 'lyrics', 'feat', 'original', 'mix',
-    blacklistWords = [word.lower() for word in blacklistWords]
+                    'www', 'com', 'mp3', 'audio', 'remixed', 'remix', 'full', 'version', 'music', 'hq', 'uploaded', 'explicit')
    reg_exp = 's/^\d\d //'
    improved_names = []
@ -24,93 +20,55 @@ def improve_song_names(songs):
        song = song.strip()
        song = song.lstrip("0123456789.- ")
        # re.sub(reg_exp, '', song)
-        searchText = song[0:-4]
+        song = song[0:-4]
-        for word in song[0:-4].split(' '):
+        song = ''.join(
-            if word.lower() in blacklistWords:
+            map(lambda c: " " if c in char_filters else c, song))
                searchText = searchText.replace(word, '')
-        improved_names.append(searchText.strip())
+        song = re.sub('|'.join(re.escape(key) for key in word_filters),
                      "", song, flags=re.IGNORECASE)
        song = ' '.join(song.split())
        improved_names.append(song.strip())
    return improved_names
-def get_soup(url, headers):
+def get_song_name(title, artist):
-    r = requests.get(url, headers=headers)
+    return title + ' - ' + artist
    soup = BeautifulSoup(r.text, 'html.parser')
    return soup
-def get_albumart_google(song_name):
+def get_metadata_spotify(spotify, song_name):
-    url = "https://www.google.co.in/search?q=" + \
+    metadata = {}
-        song_name.replace(" ", "_") + "&source=lnms&tbm=isch"
+    meta_tags = spotify.search(song_name, limit=1)['tracks']['items'][0]
-    HEADERS = {
+    metadata['title'] = meta_tags['name']
-        'User-Agent': "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36"
+    metadata['artist'] = meta_tags['artists'][0]['name']
-    }
+    metadata['album'] = meta_tags['album']['name']
    metadata['album_artist'] = meta_tags['album']['artists'][0]['name']
-    soup = get_soup(url, HEADERS)
+    album_id = meta_tags['album']['id']
-    ActualImages = []
+    album_meta_tags = spotify.album(album_id)
    for a in soup.find_all("div", {"class": "rg_meta"}):
        link, Type = json.loads(a.text)["ou"], json.loads(a.text)["ity"]
        return link
        print(link)
        ActualImages.append((link, Type))
-    return ActualImages
+    metadata['release-date'] = album_meta_tags['release_date']
 def get_metadata_acoustid(song):
    API_KEY = 'GkQibmzT1u'
    try:
-        results = acoustid.match(API_KEY, song)
+        metadata['genre'] = titlecase(album_meta_tags['genres'][0])
-    except acoustid.NoBackendError:
+    except IndexError:
-        print("chromaprint library/tool not found", file=sys.stderr)
+        try:
-        sys.exit(1)
+            artist_id = meta_tags['artists'][0]['id']
-    except acoustid.FingerprintGenerationError:
+            artist_meta_tags = spotify.artist(artist_id)
-        print("fingerprint could not be calculated", file=sys.stderr)
+            metadata['genre'] = titlecase(artist_meta_tags['genres'][0])
        sys.exit(1)
    except acoustid.WebServiceError as exc:
        print("web service request failed:", exc.message, file=sys.stderr)
        sys.exit(1)
    except acoustid.FingerprintSubmissionError:
        print("Error")
-    first = True
+        except IndexError:
-    scoreMax = 0
+            pass
-    for result in results:
+    metadata['track_num'] = meta_tags['track_number']
-        if first:
+    metadata['disc_num'] = meta_tags['disc_number']
            first = False
        else:
            # print(result)
            if(result[0] > scoreMax):
                scoreMax = result[0]
            else:
                pass
            score, rid, title, artist = result[0], result[1], result[2], result[3]
            valid = True
            albumart = get_albumart_google(title + " - " + artist)
            break
-    if first is True:
+    metadata['albumart'] = meta_tags['album']['images'][0]['url']
-        print("No Data found for " + song + " .... Skipping it")
+    # metadata['lyrics'] = get_lyrics_genius(
-        score = rid = title = artist = albumart = None
+    #     get_song_name(metadata['title'], metadata['artist']))
        valid = False
-    return valid, score, rid, title, artist, albumart
+    return metadata
 def get_metadata_musicbrainz(rid, artist, title):
    d = m.set_useragent(
        "MetadataRepair",
        "0.1",
        "https://github.com/yash2696/python-musicbrainzngs/",
    )
    result = m.search_recordings(
        artist=artist, recording=title, rid=rid, limit=5)
    print(result)
 def list_files():
@ -118,47 +76,6 @@ def list_files():
    return [f for f in os.listdir('.') if f.endswith('.mp3')]
 def get_metadata_discogs(song_name):
    d = discogs.Client('ExampleApplication/0.1',
                       user_token="mbNSnSrqdyJOKorCDBXjzzeYNhgulysWNJbwgBmk")
    results = d.search(song_name, type="release")
    first_result = results.page(1)[0]
    title = first_result.title
    print(title)
    print(first_result.artists[0].name)
    print(first_result.images[0])
 def add_metadata(file_name, album_art):
    """
    Add album_art in .mp3's tags
    """
    img = requests.get(
        "https://i.ytimg.com/vi/7S0MWoXYH5k/maxresdefault.jpg", stream=True)
    img = img.raw
    audiofile = eyed3.load(file_name)
    tag = audiofile.tag
    tag.artist = "Alka Yagnik"
    tag.album = "Lajja"
    tag.title = "Badi Mushkil Baba Badi Mushkil"
    tag.images.set(3, img.read(), "image/jpeg", u"Google image")
    tag.lyrics.set(u""" """)
    # write it back
    audiofile.tag.save()
 # def get_metadata_spotify(song):
 #     spotify.search(song, limit=1)['tracks']['items'][0]
 #     return
 def main():
    auth = oauth2.SpotifyClientCredentials(
        client_id='622a0e16a4914e3eadc2a37b4a134f1e',
@ -169,38 +86,10 @@ def main():
    files = list_files()
    improved_name = improve_song_names(files)
-    # get_metadata_spotify(files[1])
+    # print(improved_name[19])
-
+    # print(files[16])
-    # valid, score, rid, title, artist, albumart = get_metadata_acoustid(
+    metadata = get_metadata_spotify(
-    #     "35. Mike Posner - I Took a Pill in Ibiza (SeeB Remix).mp3")
+        spotify, improved_name[19])
    # print(valid, score, rid, title, artist, albumart)
    # add_album_art(
    #     "Badi.mp3", "")
    # for file_name in files:
    #     print("-------------" + file_name + "------------------")
    #     print()
    #     valid, score, rid, title, artist = get_metadata_acoustid(file_name)
    #     if valid == True:
    #         get_metadata_musicbrainz(rid, artist, title)
    #         add_metadata(file_name, rid, title, artist)
    #     print()
    #     break
    # files = improve_song_names(files)
    # print(files)
    # count = 0
    # for file_name in files:
    #     print("-------------" + file_name + "------------------")
    #     print()
    #     get_metadata_discogs(file_name)
    #     count += 1
    #     if count > 5:
    #         break
    #     print()
    # get_albumart_google(
    #     "Mike Posner - I Took a Pill in Ibiza (acoustic)")
 if __name__ == "__main__":