mirror of
				https://github.com/KevinMidboe/spotify-downloader.git
				synced 2025-10-29 18:00:15 +00:00 
			
		
		
		
	* Conversion with ffmpeg is more flexible now * Testing OK after introducing changes * Normalized genre and disc number across functions * Small indentation problems * Remove if condition for setting log level to error
		
			
				
	
	
		
			451 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			451 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| # -*- coding: UTF-8 -*-
 | |
| 
 | |
| # Usual import stuff
 | |
| from bs4 import BeautifulSoup
 | |
| from shutil import copyfileobj
 | |
| from sys import path, version_info
 | |
| from slugify import slugify
 | |
| from titlecase import titlecase
 | |
| from mutagen.mp4 import MP4, MP4Cover
 | |
| import spotipy
 | |
| import spotipy.oauth2 as oauth2
 | |
| import eyed3
 | |
| import requests
 | |
| import pafy
 | |
| import os
 | |
| import argparse
 | |
| 
 | |
| 
 | |
def getInputLink(links):
    """Ask the user to pick an entry of ``links`` by its 1-based number.

    Keeps prompting until a usable number is typed. Entering ``0`` means
    "skip" and yields ``None``; any number from 1 to ``len(links)`` yields
    the corresponding element of ``links``.
    """
    while True:
        try:
            choice = int(raw_input('>> Choose your number: '))
        except ValueError:
            # Not an integer at all; ask again.
            print('Choose a valid number!')
            continue
        if choice == 0:
            return None
        if 1 <= choice <= len(links):
            return links[choice - 1]
        print('Choose a valid number!')
 | |
| 
 | |
| # Check if input song is Spotify URL or just a song name
 | |
| 
 | |
| 
 | |
def isSpotify(raw_song):
    """Tell whether ``raw_song`` looks like a Spotify reference.

    It counts as one when it is exactly 22 characters long and contains no
    space, or when the text ``spotify`` appears anywhere in it.
    """
    looks_like_id = len(raw_song) == 22 and ' ' not in raw_song
    return looks_like_id or 'spotify' in raw_song
 | |
| 
 | |
| # [Artist] - [Song Name]
 | |
| 
 | |
| 
 | |
def generateSongName(raw_song):
    """Return a searchable "<artist> - <title>" name for ``raw_song``.

    Input that is not recognised by ``isSpotify`` is returned untouched.
    Otherwise the track is looked up with ``generateMetaTags`` and the name
    is built from its first artist and its title.
    """
    if not isSpotify(raw_song):
        return raw_song
    track = generateMetaTags(raw_song)
    return ' - '.join((track['artists'][0]['name'], track['name']))
 | |
| 
 | |
| 
 | |
def generateMetaTags(raw_song):
    """Fetch the Spotify track object describing ``raw_song``.

    A Spotify reference (see ``isSpotify``) is resolved directly with
    ``spotify.track``; anything else is searched for and the first hit is
    used.

    Returns the track object, or ``None`` when the lookup fails for any
    reason (including a search with no results).
    """
    try:
        if isSpotify(raw_song):
            return spotify.track(raw_song)
        return spotify.search(raw_song, limit=1)['tracks']['items'][0]
    except Exception:
        # Deliberately best-effort: callers treat None as "no metadata".
        # Only Exception is caught so that Ctrl-C (KeyboardInterrupt) and
        # SystemExit still reach the callers' own handlers.
        return None
 | |
| 
 | |
| 
 | |
def generateSearchURL(song):
    """Build the YouTube results-page URL that searches for ``song``.

    The song name is percent-encoded so that characters with a meaning in a
    query string (``&``, ``#``, ``+``, ``%`` ...) stay part of the search
    term instead of truncating or altering it. Spaces become ``%20``.
    """
    try:
        from urllib.parse import quote
    except ImportError:  # Python 2
        from urllib import quote
        # Python 2's quote() cannot handle non-ASCII unicode objects.
        if isinstance(song, unicode):  # noqa: F821 (Python 2 only)
            song = song.encode('utf-8')
    return ("https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" +
            quote(song))
 | |
| 
 | |
| 
 | |
def generateYouTubeURL(raw_song):
    """Find a YouTube link for ``raw_song``.

    The song name is resolved with ``generateSongName``, the YouTube results
    page is fetched and parsed, and links whose href contains ``channel`` or
    ``googleads`` are ignored. With ``args.manual`` set, the remaining
    results are listed and the user chooses one (or skips); otherwise the
    first remaining result is taken.

    Returns ``"youtube.com"`` followed by the chosen href, or ``None`` when
    the user skips the song or no usable result was found.
    """
    song = generateSongName(raw_song)
    searchURL = generateSearchURL(song)
    items = requests.get(searchURL).text
    items_parse = BeautifulSoup(items, "html.parser")

    def is_video(href):
        # Channel pages and ad redirects cannot be downloaded as songs.
        return 'channel' not in href and 'googleads' not in href

    if args.manual:
        links = []
        print(song)
        print('')
        print('0. Skip downloading this song')
        for x in items_parse.find_all('h3', {'class': 'yt-lockup-title'}):
            anchor = x.find('a')
            href = anchor.get('href') if anchor is not None else None
            # The filter must look at the link text; Tag.find() searches
            # child tags and never returns -1.
            if not href or not is_video(href):
                continue
            links.append(href)
            print(str(len(links)) + '. ' + x.get_text())
        print('')
        result = getInputLink(links)
    else:
        result = None
        for tile in items_parse.find_all(attrs={'class': 'yt-uix-tile-link'}):
            href = tile.get('href')
            if href and is_video(href):
                result = href
                break

    if result is None:
        return None
    return "youtube.com" + result
 | |
| 
 | |
| 
 | |
def goPafy(raw_song):
    """Return the pafy object for ``raw_song``'s YouTube link.

    Yields ``None`` when ``generateYouTubeURL`` produced no link.
    """
    track_url = generateYouTubeURL(raw_song)
    return None if track_url is None else pafy.new(track_url)
 | |
| 
 | |
| 
 | |
def getYouTubeTitle(content, number):
    """Return ``content.title``, prefixed with "<number>. " if one is given.

    ``number`` is only omitted from the result when it is ``None``.
    """
    name = content.title
    if number is not None:
        return '. '.join((str(number), name))
    return name
 | |
| 
 | |
| # Generate name for the song to be downloaded
 | |
| 
 | |
| 
 | |
def generateFileName(content):
    """Derive a file-name stem from ``content.title``.

    Spaces are turned into underscores first, then the text is passed through
    ``slugify`` keeping ``-_()[]{}`` and the original letter case.
    """
    underscored = content.title.replace(' ', '_')
    return slugify(underscored, ok='-_()[]{}', lower=False)
 | |
| 
 | |
| 
 | |
def downloadSong(content):
    """Download the best audio stream of ``content`` into ``Music/``.

    A webm stream is requested when ``input_ext`` is ``.webm`` and an m4a
    stream otherwise. The file is named after ``generateFileName(content)``
    plus ``input_ext``. Nothing is downloaded if no stream is returned.
    """
    music_file = generateFileName(content)
    wanted = 'webm' if input_ext == '.webm' else 'm4a'
    stream = content.getbestaudio(preftype=wanted)
    if stream is None:
        return
    stream.download(filepath='Music/' + music_file + input_ext)
 | |
| 
 | |
| 
 | |
def convertToMP3(music_file):
    """Convert ``Music/<music_file>.m4a`` to a 192k mp3 using avconv.

    On Windows the bundled ``Scripts\\avconv.exe`` is used, elsewhere the
    ``avconv`` found on PATH. The converter is started with an argument list
    rather than a shell command line, so the file name is never interpreted
    by a shell.

    The ``.m4a`` source is deleted only when avconv exits successfully, so a
    failed conversion does not discard the download.

    Raises:
        OSError: if the avconv executable cannot be started.
    """
    import subprocess

    avconv = 'Scripts\\avconv.exe' if os.name == 'nt' else 'avconv'
    source = 'Music/' + music_file + '.m4a'
    target = 'Music/' + music_file + '.mp3'
    exit_code = subprocess.call(
        [avconv, '-loglevel', '0', '-i', source, '-ab', '192k', target])
    if exit_code == 0:
        os.remove(source)
 | |
| 
 | |
| 
 | |
def convertWithFfmpeg(music_file):
    """Convert ``Music/<music_file><input_ext>`` to ``output_ext`` with ffmpeg.

    Supported pairs are .m4a -> .mp3/.webm and .webm -> .mp3/.m4a. An
    unknown ``input_ext`` prints a message and returns; a known input with
    any other ``output_ext`` returns silently without converting. Unless
    ``args.quiet`` is set, the command line is printed before it runs.

    ffmpeg is started with an argument list rather than a shell command
    line. The source file is deleted only when ffmpeg exits successfully.

    Raises:
        OSError: if the ffmpeg executable cannot be started.
    """
    import subprocess

    # What are the differences and similarities between ffmpeg, libav, and avconv?
    # https://stackoverflow.com/questions/9477115
    # ffmpeg encoders high to lower quality
    # libopus > libvorbis >= libfdk_aac > aac > libmp3lame
    # libfdk_aac due to copyrights needs to be compiled by end user
    # on MacOS brew install ffmpeg --with-fdk-aac will do just that. Other OS?
    # https://trac.ffmpeg.org/wiki/Encode/AAC
    params_by_formats = {
        ('.m4a', '.mp3'): '-codec:v copy -codec:a libmp3lame -q:a 2 ',
        ('.m4a', '.webm'): '-c:a libopus -vbr on -b:a 192k -vn ',
        ('.webm', '.mp3'): '-ab 192k -ar 44100 -vn ',
        ('.webm', '.m4a'): '-cutoff 20000 -c:a libfdk_aac -b:a 256k -vn ',
    }

    if input_ext not in ('.m4a', '.webm'):
        print('Unknown formats. Unable to convert.', input_ext, output_ext)
        return
    ffmpeg_params = params_by_formats.get((input_ext, output_ext))
    if ffmpeg_params is None:
        # Known input but no conversion defined for this output (this
        # includes identical extensions): leave the file as it is.
        return

    if args.quiet:
        ffmpeg_pre = 'ffmpeg -hide_banner -nostats -v panic -y '
    else:
        ffmpeg_pre = 'ffmpeg -y '

    source = 'Music/' + music_file + input_ext
    target = 'Music/' + music_file + output_ext

    if not args.quiet:
        print(ffmpeg_pre +
              '-i "' + source + '" ' +
              ffmpeg_params +
              '"' + target + '" ')

    command = (ffmpeg_pre.split() + ['-i', source] +
               ffmpeg_params.split() + [target])
    if subprocess.call(command) == 0:
        os.remove(source)
 | |
| 
 | |
| 
 | |
def checkExists(music_file, raw_song, islist):
    """Decide whether ``music_file`` is already present and should be kept.

    Any leftover ``<music_file><input_ext>.temp`` partial download is removed
    first. The final file is looked for with ``input_ext`` when
    ``args.no_convert`` is set and with ``output_ext`` otherwise.

    For an existing mp3 requested through a Spotify reference, the stored
    title is compared with the Spotify track name; on a mismatch (or when
    the file has no tag at all) the file is deleted so it gets downloaded
    again. If Spotify metadata cannot be fetched the comparison is skipped.

    In list mode (``islist`` true) an existing file is always kept. In
    interactive mode the user is asked whether to re-download.

    Returns ``True`` when the existing file should be kept (skip the
    download) and ``False`` when the song has to be downloaded.
    """
    temp_path = "Music/" + music_file + input_ext + ".temp"
    if os.path.exists(temp_path):
        os.remove(temp_path)

    extension = input_ext if args.no_convert else output_ext
    target = "Music/" + music_file + extension
    if not os.path.isfile(target):
        return False

    if extension == '.mp3' and isSpotify(raw_song):
        audiofile = eyed3.load(target)
        # eyed3 may give no file object or no tag; treat both as "untitled".
        tag = audiofile.tag if audiofile is not None else None
        stored_title = tag.title if tag is not None else None
        meta_tags = generateMetaTags(raw_song)
        if meta_tags is not None and stored_title != meta_tags['name']:
            os.remove(target)
            return False

    if islist:
        return True

    prompt = raw_input(
        'Song with same name has already been downloaded. Re-download? (y/n): ').lower()
    if prompt == "y":
        os.remove(target)
        return False
    return True
 | |
| 
 | |
| # Remove song from list.txt once downloaded
 | |
| 
 | |
| 
 | |
def trimSong(file):
    """Drop the first line of the text file at path ``file``, in place.

    The whole file is read, then rewritten with every line except the first.
    An empty file stays empty.
    """
    with open(file, 'r') as source:
        remaining = source.read().splitlines(True)[1:]
    with open(file, 'w') as target:
        target.write(''.join(remaining))
 | |
| 
 | |
| 
 | |
def fixSong(music_file, meta_tags):
    """Write ID3 tags and cover art into ``Music/<music_file>.mp3``.

    Artist, album artist, album, title, track and disc number come from
    ``meta_tags`` (a Spotify track object). Genre and release date need two
    further Spotify lookups (artist and album). The genre is left untouched
    when Spotify lists none for the artist. The first album image is
    downloaded to ``last_albumart.jpg`` and embedded with picture type 3.
    Tags are saved as ID3 v2.3.
    """
    audiofile = eyed3.load("Music/" + music_file + '.mp3')
    tag = audiofile.tag
    main_artist = meta_tags['artists'][0]

    tag.artist = main_artist['name']
    tag.album_artist = main_artist['name']
    tag.album = meta_tags['album']['name']
    tag.title = meta_tags['name']

    artist = spotify.artist(main_artist['id'])
    genres = artist['genres']
    if genres:
        # The genre list may be empty; indexing it blindly would raise.
        tag.genre = titlecase(genres[0])

    tag.track_num = meta_tags['track_number']
    tag.disc_num = meta_tags['disc_number']
    tag.release_date = spotify.album(
        meta_tags['album']['id'])['release_date']

    albumart = requests.get(
        meta_tags['album']['images'][0]['url'], stream=True).raw
    with open('last_albumart.jpg', 'wb') as out_file:
        copyfileobj(albumart, out_file)
    with open("last_albumart.jpg", "rb") as in_file:
        cover = in_file.read()
    tag.images.set(3, cover, "image/jpeg")
    tag.save(version=(2, 3, 0))
 | |
| 
 | |
| 
 | |
def fixSongM4A(music_file, meta_tags):
    """Write MP4 tags and cover art into ``Music/<music_file><output_ext>``.

    Artist, album, title, track and disc number come from ``meta_tags`` (a
    Spotify track object). Genre and release date need two further Spotify
    lookups (artist and album). The genre is left untouched when Spotify
    lists none for the artist. The first album image is downloaded to
    ``last_albumart.jpg`` and embedded as a JPEG cover.
    """
    # eyed serves only mp3 not aac so using mutagen
    # Apple has specific tags - see mutagen docs -
    # http://mutagen.readthedocs.io/en/latest/api/mp4.html
    tags = {'album': '\xa9alb',
            'artist': '\xa9ART',
            'year': '\xa9day',
            'title': '\xa9nam',
            'comment': '\xa9cmt',
            'group': '\xa9grp',
            'writer': '\xa9wrt',
            'genre': '\xa9gen',
            'track': 'trkn',
            'aart': 'aART',
            'disk': 'disk',
            'cpil': 'cpil',
            'tempo': 'tmpo'}
    audiofile = MP4('Music/' + music_file + output_ext)
    main_artist = meta_tags['artists'][0]

    audiofile[tags['artist']] = main_artist['name']
    audiofile[tags['album']] = meta_tags['album']['name']
    audiofile[tags['title']] = meta_tags['name']

    artist = spotify.artist(main_artist['id'])
    genres = artist['genres']
    if genres:
        # The genre list may be empty; indexing it blindly would raise.
        audiofile[tags['genre']] = titlecase(genres[0])

    album = spotify.album(meta_tags['album']['id'])
    audiofile[tags['year']] = album['release_date']
    audiofile[tags['track']] = [(meta_tags['track_number'], 0)]
    audiofile[tags['disk']] = [(meta_tags['disc_number'], 0)]

    albumart = requests.get(
        meta_tags['album']['images'][0]['url'], stream=True).raw
    with open('last_albumart.jpg', 'wb') as out_file:
        copyfileobj(albumart, out_file)
    with open("last_albumart.jpg", "rb") as f:
        audiofile["covr"] = [
            MP4Cover(f.read(), imageformat=MP4Cover.FORMAT_JPEG)]
    audiofile.save()
 | |
| 
 | |
| 
 | |
| # Logic behind preparing the song to download to finishing meta-tags
 | |
| 
 | |
| 
 | |
def grabSingle(raw_song, number=None):
    """Download one song and, unless disabled, convert and tag it.

    ``number`` is the position shown in front of the title; a truthy value
    also marks the call as coming from list mode. The function stops early
    when no YouTube result is available or when ``checkExists`` says the
    file should be kept. Conversion uses ffmpeg when ``args.ffmpeg`` is set
    and avconv otherwise; tags are written only for ``.m4a`` and ``.mp3``
    output and only when Spotify metadata was found.
    """
    content = goPafy(raw_song)
    if content is None:
        return

    print(getYouTubeTitle(content, number))
    music_file = generateFileName(content)
    if checkExists(music_file, raw_song, islist=bool(number)):
        return

    downloadSong(content)
    print('')
    if args.no_convert:
        return

    print('Converting ' + music_file + input_ext + ' to ' + output_ext)
    convert = convertWithFfmpeg if args.ffmpeg else convertToMP3
    convert(music_file)

    meta_tags = generateMetaTags(raw_song)
    tag_writers = {'.m4a': fixSongM4A, '.mp3': fixSong}
    write_tags = tag_writers.get(output_ext)
    if write_tags is not None and meta_tags is not None:
        print('Fixing meta-tags')
        write_tags(music_file, meta_tags)
 | |
| 
 | |
| # Fix python2 encoding issues
 | |
| 
 | |
| 
 | |
def fixEncoding(query):
    """Return ``query`` as-is on Python 3, UTF-8 encoded on Python 2."""
    running_py3 = version_info > (3, 0)
    return query if running_py3 else query.encode('utf-8')
 | |
| 
 | |
| 
 | |
def grabList(file):
    """Download every song listed, one per line, in the text file ``file``.

    Blank lines are ignored; if the file contains any (or lacks a final
    newline) it is rewritten in normalised form first, so that the first
    line of the file always is the song being processed. After a successful
    download the song's line is removed from the file. After a failure the
    song is moved to the end of both the file and the work queue and is
    tried again after the other songs.

    NOTE: a song that fails every time is retried indefinitely.
    """
    with open(file, 'r') as fin:
        content = fin.read()
    lines = [line for line in content.splitlines() if line.strip()]

    # trimSong() always drops the first physical line, so the file has to
    # match ``lines`` exactly: no blank lines, every entry newline-terminated.
    normalised = ''.join(line + '\n' for line in lines)
    if normalised != content:
        with open(file, 'w') as fout:
            fout.write(normalised)

    print('Total songs in list = ' + str(len(lines)) + ' songs')
    print('')
    # Count the number of song being downloaded
    number = 1
    # ``lines`` grows while it is iterated: failed songs are appended below
    # so the loop reaches them again after the remaining ones.
    for raw_song in lines:
        try:
            grabSingle(raw_song, number=number)
            trimSong(file)
            number += 1
            print('')
        except KeyboardInterrupt:
            graceQuit()
        except Exception:
            lines.append(raw_song)
            trimSong(file)
            with open(file, 'a') as myfile:
                # The trailing newline keeps later entries on separate lines.
                myfile.write(raw_song + '\n')
            print('Failed to download song. Will retry after other songs.')
 | |
| 
 | |
| 
 | |
def getArgs(argv=None):
    """Parse the command-line options of the downloader.

    ``argv`` is handed to ``parse_args`` unchanged. The result carries five
    boolean switches (``no_convert``, ``manual``, ``list``, ``ffmpeg``,
    ``quiet``, all False by default) and two extensions (``input_ext``
    defaulting to ``.m4a`` and ``output_ext`` defaulting to ``.mp3``).
    """
    parser = argparse.ArgumentParser(
        description='Download and convert songs \
                    from Spotify, Youtube etc.',
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)

    switches = (
        ('-n', '--no-convert', 'skip the conversion process and meta-tags'),
        ('-m', '--manual', 'choose the song to download manually'),
        ('-l', '--list', 'download songs present in list.txt'),
        ('-f', '--ffmpeg',
         'Use ffmpeg instead of libav for conversion. If not set defaults to libav'),
        ('-q', '--quiet', 'spare us output of ffmpeg conversion'),
    )
    for short_flag, long_flag, description in switches:
        parser.add_argument(short_flag, long_flag, default=False,
                            help=description, action='store_true')

    extensions = (
        ('-i', '--input_ext', '.m4a',
         'prefered input format .m4a or .webm (Opus)'),
        ('-o', '--output_ext', '.mp3',
         'prefered output extension .mp3 or .m4a (AAC)'),
    )
    for short_flag, long_flag, fallback, description in extensions:
        parser.add_argument(short_flag, long_flag, default=fallback,
                            help=description)

    return parser.parse_args(argv)
 | |
| 
 | |
| 
 | |
def graceQuit():
    """Print two blank lines and a farewell message, then exit the program."""
    for text in ('', '', 'Exitting..'):
        print(text)
    exit()
 | |
| 
 | |
| 
 | |
def spotifyDownload():
    """Interactive loop: ask for a song, download it, repeat.

    Before each prompt, leftover partial downloads in ``Music/`` are
    removed. Both ``.m4a.temp`` files and files ending in
    ``input_ext + '.temp'`` are treated as leftovers, matching the temp
    name used by ``checkExists``. Ctrl-C or end of input leaves the program
    through ``graceQuit``.
    """
    stale_suffixes = ('.m4a.temp', input_ext + '.temp')
    while True:
        for temp in os.listdir('Music/'):
            if temp.endswith(stale_suffixes):
                os.remove('Music/' + temp)
        try:
            print('Enter a Spotify URL or Song Name: ')
            command = raw_input('>> ')
            print('')
            grabSingle(raw_song=command)
            print('')
        except (KeyboardInterrupt, EOFError):
            # EOFError: stdin was closed (Ctrl-D or exhausted piped input).
            graceQuit()
 | |
| 
 | |
| 
 | |
if __name__ == '__main__':

    # Python 3 compatibility
    if version_info > (3, 0):
        raw_input = input

    # Work relative to the script's own directory so that Music/ and
    # list.txt are always found in the same place.
    os.chdir(path[0])
    if not os.path.exists("Music"):
        os.makedirs("Music")
    # Make sure list.txt exists without touching its contents.
    open('list.txt', 'a').close()

    # Set before any download path runs, so it also applies to --list mode
    # (which exits before reaching the end of this script).
    eyed3.log.setLevel("ERROR")

    # Please respect this user token :)
    # NOTE(review): credentials are hard-coded in the source; consider
    # loading them from the environment or a config file instead.
    credentials = oauth2.SpotifyClientCredentials(
        client_id='4fe3fecfe5334023a1472516cc99d805',
        client_secret='0f02b7c483c04257984695007a4a8d5c')
    token = credentials.get_access_token()
    spotify = spotipy.Spotify(auth=token)

    # Set up arguments
    args = getArgs()
    if args.ffmpeg:
        input_ext = args.input_ext
        output_ext = args.output_ext
    else:
        # avconv conversion only supports m4a -> mp3.
        input_ext = '.m4a'
        output_ext = '.mp3'
    if args.no_convert:
        print("-n, --no-convert skip the conversion process and meta-tags")
    if args.manual:
        print("-m, --manual     choose the song to download manually")
    print('')
    if args.list:
        grabList(file='list.txt')
        exit()

    spotifyDownload()
 |