mirror of
				https://github.com/KevinMidboe/spotify-downloader.git
				synced 2025-10-29 18:00:15 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			317 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			317 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
#!/usr/bin/env python
 | 
						|
# -*- coding: UTF-8 -*-
 | 
						|
 | 
						|
from core import metadata
 | 
						|
from core import convert
 | 
						|
from core import misc
 | 
						|
from bs4 import BeautifulSoup
 | 
						|
from titlecase import titlecase
 | 
						|
from slugify import slugify
 | 
						|
import spotipy
 | 
						|
import pafy
 | 
						|
import sys
 | 
						|
import os
 | 
						|
 | 
						|
# urllib2 is urllib.request in python3
 | 
						|
try:
 | 
						|
    import urllib2
 | 
						|
except ImportError:
 | 
						|
    import urllib.request as urllib2
 | 
						|
 | 
						|
 | 
						|
def generate_songname(raw_song):
 | 
						|
    """Generate a string of the format '[artist] - [song]' for the given song."""
 | 
						|
    if misc.is_spotify(raw_song):
 | 
						|
        tags = generate_metadata(raw_song)
 | 
						|
        raw_song = u'{0} - {1}'.format(tags['artists'][0]['name'], tags['name'])
 | 
						|
    return misc.fix_encoding(raw_song)
 | 
						|
 | 
						|
 | 
						|
def generate_metadata(raw_song):
 | 
						|
    """Fetch a song's metadata from Spotify."""
 | 
						|
    if misc.is_spotify(raw_song):
 | 
						|
        # fetch track information directly if it is spotify link
 | 
						|
        meta_tags = spotify.track(raw_song)
 | 
						|
    else:
 | 
						|
        # otherwise search on spotify and fetch information from first result
 | 
						|
        try:
 | 
						|
            meta_tags = spotify.search(raw_song, limit=1)['tracks']['items'][0]
 | 
						|
        except:
 | 
						|
            return None
 | 
						|
    artist = spotify.artist(meta_tags['artists'][0]['id'])
 | 
						|
    album = spotify.album(meta_tags['album']['id'])
 | 
						|
 | 
						|
    try:
 | 
						|
        meta_tags[u'genre'] = titlecase(artist['genres'][0])
 | 
						|
    except IndexError:
 | 
						|
        meta_tags[u'genre'] = None
 | 
						|
    try:
 | 
						|
        meta_tags[u'copyright'] = album['copyrights'][0]['text']
 | 
						|
    except IndexError:
 | 
						|
        meta_tags[u'copyright'] = None
 | 
						|
 | 
						|
    meta_tags[u'release_date'] = album['release_date']
 | 
						|
    meta_tags[u'publisher'] = album['label']
 | 
						|
    meta_tags[u'total_tracks'] = album['tracks']['total']
 | 
						|
    # import pprint
 | 
						|
    # pprint.pprint(meta_tags)
 | 
						|
    # pprint.pprint(spotify.album(meta_tags['album']['id']))
 | 
						|
    return meta_tags
 | 
						|
 | 
						|
 | 
						|
def generate_youtube_url(raw_song):
 | 
						|
    """Search for the song on YouTube and generate an URL to its video."""
 | 
						|
    song = generate_songname(raw_song)
 | 
						|
    search_url = misc.generate_search_url(song)
 | 
						|
    item = urllib2.urlopen(search_url).read()
 | 
						|
    # item = unicode(item, 'utf-8')
 | 
						|
    items_parse = BeautifulSoup(item, "html.parser")
 | 
						|
    check = 1
 | 
						|
    if args.manual:
 | 
						|
        links = []
 | 
						|
        print(song)
 | 
						|
        print('')
 | 
						|
        print('0. Skip downloading this song')
 | 
						|
        # fetch all video links on first page on YouTube
 | 
						|
        for x in items_parse.find_all('h3', {'class': 'yt-lockup-title'}):
 | 
						|
            # confirm the video result is not an advertisement
 | 
						|
            if x.find('channel') > -1 or x.find('googleads') > -1:
 | 
						|
                print(u'{0}. {1}'.format(check, x.get_text()))
 | 
						|
                links.append(x.find('a')['href'])
 | 
						|
                check += 1
 | 
						|
        print('')
 | 
						|
        # let user select the song to download
 | 
						|
        result = misc.input_link(links)
 | 
						|
        if result is None:
 | 
						|
            return None
 | 
						|
    else:
 | 
						|
        # get video link of the first YouTube result
 | 
						|
        result = items_parse.find_all(
 | 
						|
            attrs={'class': 'yt-uix-tile-link'})[0]['href']
 | 
						|
 | 
						|
        # confirm the video result is not an advertisement
 | 
						|
        # otherwise keep iterating until it is not
 | 
						|
        while result.find('channel') > -1 or result.find('googleads') > -1:
 | 
						|
            result = items_parse.find_all(
 | 
						|
                attrs={'class': 'yt-uix-tile-link'})[check]['href']
 | 
						|
            check += 1
 | 
						|
 | 
						|
    full_link = u'youtube.com{0}'.format(result)
 | 
						|
    return full_link
 | 
						|
 | 
						|
 | 
						|
def go_pafy(raw_song):
 | 
						|
    """Parse track from YouTube."""
 | 
						|
    track_url = generate_youtube_url(raw_song)
 | 
						|
    if track_url is None:
 | 
						|
        return None
 | 
						|
    else:
 | 
						|
        return pafy.new(track_url)
 | 
						|
 | 
						|
 | 
						|
def get_youtube_title(content, number=None):
 | 
						|
    """Get the YouTube video's title."""
 | 
						|
    title = misc.fix_encoding(content.title)
 | 
						|
    if number is None:
 | 
						|
        return title
 | 
						|
    else:
 | 
						|
        return u'{0}. {1}'.format(number, title)
 | 
						|
 | 
						|
 | 
						|
def feed_playlist(username):
 | 
						|
    """Fetch user playlists when using the -u option."""
 | 
						|
    playlists = spotify.user_playlists(username)
 | 
						|
    links = []
 | 
						|
    check = 1
 | 
						|
 | 
						|
    while True:
 | 
						|
        for playlist in playlists['items']:
 | 
						|
            # in rare cases, playlists may not be found, so playlists['next']
 | 
						|
            # is None. Skip these. Also see Issue #91.
 | 
						|
            if playlist['name'] is not None:
 | 
						|
                print(u'{0}. {1} ({2} tracks)'.format(
 | 
						|
                    check, misc.fix_encoding(playlist['name'])),
 | 
						|
                    playlist['tracks']['total'])
 | 
						|
                links.append(playlist)
 | 
						|
                check += 1
 | 
						|
        if playlists['next']:
 | 
						|
            playlists = spotify.next(playlists)
 | 
						|
        else:
 | 
						|
            break
 | 
						|
 | 
						|
    print('')
 | 
						|
    playlist = misc.input_link(links)
 | 
						|
    results = spotify.user_playlist(
 | 
						|
        playlist['owner']['id'], playlist['id'], fields='tracks,next')
 | 
						|
    print('')
 | 
						|
    file = u'{0}.txt'.format(slugify(playlist['name'], ok='-_()[]{}'))
 | 
						|
    print(u'Feeding {0} tracks to {1}'.format(playlist['tracks']['total'], file))
 | 
						|
 | 
						|
    tracks = results['tracks']
 | 
						|
    with open(file, 'a') as file_out:
 | 
						|
        while True:
 | 
						|
            for item in tracks['items']:
 | 
						|
                track = item['track']
 | 
						|
                try:
 | 
						|
                    file_out.write(track['external_urls']['spotify'] + '\n')
 | 
						|
                except KeyError:
 | 
						|
                    print(u'Skipping track {0} by {1} (local only?)'.format(
 | 
						|
                        track['name'], track['artists'][0]['name']))
 | 
						|
            # 1 page = 50 results
 | 
						|
            # check if there are more pages
 | 
						|
            if tracks['next']:
 | 
						|
                tracks = spotify.next(tracks)
 | 
						|
            else:
 | 
						|
                break
 | 
						|
 | 
						|
 | 
						|
def download_song(content):
 | 
						|
    """Download the audio file from YouTube."""
 | 
						|
    if args.input_ext == '.webm':
 | 
						|
        link = content.getbestaudio(preftype='webm')
 | 
						|
    elif args.input_ext == '.m4a':
 | 
						|
        link = content.getbestaudio(preftype='m4a')
 | 
						|
    else:
 | 
						|
        return False
 | 
						|
 | 
						|
    if link is None:
 | 
						|
        return False
 | 
						|
    else:
 | 
						|
        music_file = misc.generate_filename(content.title)
 | 
						|
        link.download(
 | 
						|
            filepath='Music/{0}{1}'.format(music_file, args.input_ext))
 | 
						|
        return True
 | 
						|
 | 
						|
 | 
						|
def check_exists(music_file, raw_song, islist=True):
 | 
						|
    """Check if the input song already exists in the 'Music' folder."""
 | 
						|
    files = os.listdir('Music')
 | 
						|
    for file in files:
 | 
						|
        if file.endswith('.temp'):
 | 
						|
            os.remove(u'Music/{0}'.format(file))
 | 
						|
            continue
 | 
						|
        # check if any file with similar name is already present in Music/
 | 
						|
        dfile = misc.fix_decoding(file)
 | 
						|
        umfile = misc.fix_decoding(misc.generate_filename(music_file))
 | 
						|
        if dfile.startswith(umfile):
 | 
						|
            # check if the already downloaded song has correct metadata
 | 
						|
            already_tagged = metadata.compare(file, generate_metadata(raw_song))
 | 
						|
 | 
						|
            # if not, remove it and download again without prompt
 | 
						|
            if misc.is_spotify(raw_song) and not already_tagged:
 | 
						|
                os.remove('Music/{0}'.format(file))
 | 
						|
                return False
 | 
						|
 | 
						|
            # do not prompt and skip the current song
 | 
						|
            # if already downloaded when using list
 | 
						|
            if islist:
 | 
						|
                return True
 | 
						|
            # if downloading only single song, prompt to re-download
 | 
						|
            else:
 | 
						|
                prompt = misc.user_input(
 | 
						|
                    'Song with same name has already been downloaded. '
 | 
						|
                    'Re-download? (y/n): ').lower()
 | 
						|
                if prompt == 'y':
 | 
						|
                    os.remove('Music/{0}'.format(file))
 | 
						|
                    return False
 | 
						|
                else:
 | 
						|
                    return True
 | 
						|
    return False
 | 
						|
 | 
						|
 | 
						|
def grab_list(file):
 | 
						|
    """Download all songs from the list."""
 | 
						|
    with open(file, 'r') as listed:
 | 
						|
        lines = (listed.read()).splitlines()
 | 
						|
    # ignore blank lines in file (if any)
 | 
						|
    try:
 | 
						|
        lines.remove('')
 | 
						|
    except ValueError:
 | 
						|
        pass
 | 
						|
    print(u'Total songs in list: {0} songs'.format(len(lines)))
 | 
						|
    print('')
 | 
						|
    # nth input song
 | 
						|
    number = 1
 | 
						|
    for raw_song in lines:
 | 
						|
        try:
 | 
						|
            grab_single(raw_song, number=number)
 | 
						|
        # token expires after 1 hour
 | 
						|
        except spotipy.oauth2.SpotifyOauthError:
 | 
						|
            # refresh token when it expires
 | 
						|
            new_token = misc.generate_token()
 | 
						|
            global spotify
 | 
						|
            spotify = spotipy.Spotify(auth=new_token)
 | 
						|
            grab_single(raw_song, number=number)
 | 
						|
        # detect network problems
 | 
						|
        except (urllib2.URLError, TypeError, IOError):
 | 
						|
            lines.append(raw_song)
 | 
						|
            # remove the downloaded song from .txt
 | 
						|
            misc.trim_song(file)
 | 
						|
            # and append it to the last line in .txt
 | 
						|
            with open(file, 'a') as myfile:
 | 
						|
                myfile.write(raw_song)
 | 
						|
            print('Failed to download song. Will retry after other songs.')
 | 
						|
            continue
 | 
						|
        except KeyboardInterrupt:
 | 
						|
            misc.grace_quit()
 | 
						|
        finally:
 | 
						|
            print('')
 | 
						|
        misc.trim_song(file)
 | 
						|
        number += 1
 | 
						|
 | 
						|
 | 
						|
def grab_single(raw_song, number=None):
 | 
						|
    """Logic behind downloading a song."""
 | 
						|
    if number:
 | 
						|
        islist = True
 | 
						|
    else:
 | 
						|
        islist = False
 | 
						|
    content = go_pafy(raw_song)
 | 
						|
    if content is None:
 | 
						|
        return
 | 
						|
    # print '[number]. [artist] - [song]' if downloading from list
 | 
						|
    # otherwise print '[artist] - [song]'
 | 
						|
    print(get_youtube_title(content, number))
 | 
						|
 | 
						|
    # generate file name of the song to download
 | 
						|
    music_file = misc.generate_filename(content.title)
 | 
						|
    music_file = misc.fix_decoding(music_file)
 | 
						|
    if not check_exists(music_file, raw_song, islist=islist):
 | 
						|
        if download_song(content):
 | 
						|
            print('')
 | 
						|
            input_song = music_file + args.input_ext
 | 
						|
            output_song = music_file + args.output_ext
 | 
						|
            convert.song(input_song, output_song, avconv=args.avconv,
 | 
						|
                         verbose=args.verbose)
 | 
						|
            os.remove('Music/{0}'.format(misc.fix_encoding(input_song)))
 | 
						|
            meta_tags = generate_metadata(raw_song)
 | 
						|
            if not args.no_metadata:
 | 
						|
                metadata.embed(output_song, meta_tags)
 | 
						|
        else:
 | 
						|
            print('No audio streams available')
 | 
						|
 | 
						|
 | 
						|
class Args(object):
 | 
						|
    manual = False
 | 
						|
    input_ext = '.m4a'
 | 
						|
    output_ext = '.mp3'
 | 
						|
 | 
						|
args = Args()
 | 
						|
# token is mandatory when using Spotify's API
 | 
						|
# https://developer.spotify.com/news-stories/2017/01/27/removing-unauthenticated-calls-to-the-web-api/
 | 
						|
token = misc.generate_token()
 | 
						|
spotify = spotipy.Spotify(auth=token)
 | 
						|
 | 
						|
misc.filter_path('Music')
 | 
						|
 | 
						|
if __name__ == '__main__':
 | 
						|
    os.chdir(sys.path[0])
 | 
						|
    args = misc.get_arguments()
 | 
						|
 | 
						|
    if args.song:
 | 
						|
        grab_single(raw_song=args.song)
 | 
						|
    elif args.list:
 | 
						|
        grab_list(file=args.list)
 | 
						|
    elif args.username:
 | 
						|
        feed_playlist(username=args.username)
 |