Fix token issues and add the ability to download Opus audio and encode it to AAC (#59)

* Add the ability to download Opus audio and encode it to AAC

Requires ffmpeg with libfdk_aac and mutagen.

* Change to oauth2 to get access token

* Add import spotipy.oauth2

* Final polish before merge
This commit is contained in:
Robert J
2017-06-01 22:28:23 +07:00
committed by Ritiek Malhotra
parent c4e3a9ac82
commit b5e3dbd2e1
2 changed files with 349 additions and 207 deletions

552
spotdl.py
View File

@@ -5,6 +5,9 @@
from bs4 import BeautifulSoup
from shutil import copyfileobj
from sys import path, version_info
from slugify import slugify
from titlecase import titlecase
from mutagen.mp4 import MP4, MP4Cover
import spotipy
import eyed3
import requests
@@ -12,262 +15,397 @@ import pafy
import os
import argparse
import pathlib
import spotipy.util as util
import spotipy.oauth2 as oauth2
def getInputLink(links):
    """Ask the user to pick one of the listed search results.

    Keeps prompting until a valid number is entered.

    links -- list of candidate links, presented to the user as 1..len(links).

    Returns the chosen link, or None when the user enters 0 (skip).
    """
    while True:
        # Only the int() conversion is expected to fail on bad input.
        try:
            the_chosen_one = int(raw_input('>> Choose your number: '))
        except ValueError:
            print('Choose a valid number!')
            continue
        if 1 <= the_chosen_one <= len(links):
            return links[the_chosen_one - 1]
        if the_chosen_one == 0:
            return None
        print('Choose a valid number!')
# Check if input song is Spotify URL or just a song name
def isSpotify(raw_song):
    """Return True when raw_song looks like a Spotify reference.

    A value counts as a Spotify reference when it is either a 22-character
    string without spaces (a bare track id) or contains the substring
    'spotify' (a URI or URL). Anything else is treated as a song name.
    """
    looks_like_id = len(raw_song) == 22 and ' ' not in raw_song
    return looks_like_id or 'spotify' in raw_song
# [Artist] - [Song Name]
def generateSongName(raw_song):
    """Return a searchable '[Artist] - [Song Name]' string for raw_song.

    Spotify references are resolved through generateMetaTags(); plain song
    names are returned unchanged.

    NOTE: generateMetaTags() returns None when the lookup fails, in which
    case the subscript below raises TypeError. Callers currently rely on
    that exception to mark the song as failed.
    """
    if isSpotify(raw_song):
        tags = generateMetaTags(raw_song)
        raw_song = tags['artists'][0]['name'] + ' - ' + tags['name']
    return raw_song
def generateMetaTags(raw_song):
    """Fetch Spotify track metadata for raw_song.

    Spotify references are looked up directly; anything else is used as a
    search query and the first hit is returned.

    Returns the track dictionary from the Spotify API, or None when the
    lookup fails or the search has no results.
    """
    try:
        if isSpotify(raw_song):
            return spotify.track(raw_song)
        return spotify.search(raw_song, limit=1)['tracks']['items'][0]
    except Exception:
        # Best effort: missing metadata only means tags are not written.
        # KeyboardInterrupt/SystemExit are deliberately NOT caught here so
        # that Ctrl-C during a lookup still reaches the caller.
        return None
def generateSearchURL(song):
    """Build the YouTube search URL for song.

    The query is fully percent-encoded, so characters such as '&', '#' or
    '+' in an artist or title no longer cut off or alter the query string
    (spaces are still encoded as %20).
    """
    try:
        from urllib.parse import quote  # Python 3
    except ImportError:
        from urllib import quote  # Python 2

    if not isinstance(song, str):
        # Python 2 unicode text: quote() there only handles byte strings.
        song = song.encode('utf-8')
    return ("https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" +
            quote(song, safe=''))
def generateYouTubeURL(raw_song):
    """Find the YouTube link to download for raw_song.

    In manual mode (args.manual) the search results are listed and the user
    picks one; otherwise the first usable result is taken. Results whose
    link points to a channel or an advertisement are skipped in both modes.

    Returns the link as a string, or None when the user skips the song or
    no usable result exists.
    """
    song = generateSongName(raw_song)
    searchURL = generateSearchURL(song)
    items = requests.get(searchURL).text
    items_parse = BeautifulSoup(items, "html.parser")

    def isUnwanted(href):
        # Channel pages and ads are not downloadable videos.
        return 'channel' in href or 'googleads' in href

    result = None
    if args.manual:
        links = []
        print(song)
        print('')
        print('0. Skip downloading this song')
        for x in items_parse.find_all('h3', {'class': 'yt-lockup-title'}):
            anchor = x.find('a')
            href = anchor.get('href') if anchor is not None else None
            # Filter on the link text itself; Tag.find() searches for child
            # tags and therefore never filtered anything.
            if not href or isUnwanted(href):
                continue
            links.append(href)
            print(str(len(links)) + '. ' + x.get_text())
        print('')
        result = getInputLink(links)
    else:
        tiles = items_parse.find_all(attrs={'class': 'yt-uix-tile-link'})
        for tile in tiles:
            href = tile.get('href')
            if href and not isUnwanted(href):
                result = href
                break

    if result is None:
        # Skipped by the user, or nothing usable in the result page.
        return None
    return "youtube.com" + result
def goPafy(raw_song):
    """Resolve raw_song to a pafy object for its YouTube video.

    Returns None when generateYouTubeURL() yields no link (for example the
    user chose to skip the song); otherwise the result of pafy.new().
    """
    trackURL = generateYouTubeURL(raw_song)
    if trackURL is None:
        return None
    return pafy.new(trackURL)
def getYouTubeTitle(content, number):
    """Return the title to display for a video.

    content -- object exposing a `title` attribute.
    number  -- position in the download list, or None for a single song.

    With a number the title is prefixed as '<number>. <title>'.
    """
    title = content.title
    if number is None:
        return title
    return str(number) + '. ' + title
# Generate name for the song to be downloaded
def generateFileName(content):
    """Return a filesystem-safe base name (no extension) for the video.

    The name is the slugified video title.
    """
    return slugify(content.title)
def downloadSong(content):
    """Download the best audio stream of content into the Music/ folder.

    When args.input_ext is '.webm' the webm (Opus) stream is requested and
    stored with that extension; in every other case the m4a stream is
    stored as '.m4a'. Nothing is downloaded when getbestaudio() returns
    None for the requested type.
    """
    music_file = generateFileName(content)
    if args.input_ext == '.webm':
        preftype, extension = 'webm', args.input_ext
    else:
        preftype, extension = 'm4a', '.m4a'
    link = content.getbestaudio(preftype=preftype)
    if link is not None:
        link.download(filepath='Music/' + music_file + extension)
def convertToMP3(music_file):
    """Convert the downloaded audio file in Music/ to a 192k MP3.

    Runs avconv (Scripts\\avconv.exe on Windows) and then deletes the
    downloaded source file.

    music_file -- base name of the file, without folder or extension.

    Raises OSError when the avconv binary cannot be started.
    """
    import subprocess

    encoder = 'Scripts\\avconv.exe' if os.name == 'nt' else 'avconv'
    # Use the configured download extension so that '-i .webm -o .mp3'
    # converts the file that was actually downloaded.
    source = 'Music/' + music_file + args.input_ext
    target = 'Music/' + music_file + '.mp3'
    # An argument list avoids shell quoting problems with file names.
    subprocess.call([encoder, '-loglevel', '0',
                     '-i', source,
                     '-ab', '192k',
                     target])
    os.remove(source)
def convertToM4A(music_file):
    """Encode the downloaded audio file in Music/ as AAC (256k).

    Here we prefer downloading .webm (Opus) audio and encode it as m4a in
    the format preferred by iTunes. ffmpeg is used with the libfdk_aac
    codec and a cutoff at 18kHz. Typical invocation:

        python3 spotdl.py -i '.webm' -o '.m4a'

    The result is written to 'Music/_<music_file><output_ext>' (note the
    leading underscore, which keeps input and output distinct when both
    extensions are '.m4a'); the downloaded source file is then deleted.

    Raises OSError when the ffmpeg binary cannot be started.
    """
    import subprocess

    source = 'Music/' + music_file + args.input_ext
    target = 'Music/_' + music_file + args.output_ext

    command = ['ffmpeg']
    if args.quiet:
        # Spare us the banner, progress statistics and log output.
        command += ['-hide_banner', '-nostats', '-v', 'panic']
    command += ['-y',
                '-i', source,
                '-cutoff', '18000', '-c:a', 'libfdk_aac', '-b:a', '256k',
                '-vn',
                target]
    # An argument list avoids shell quoting problems with file names.
    subprocess.call(command)
    os.remove(source)
def checkExists(music_file, raw_song, islist):
    """Tell whether the song is already present and should be skipped.

    Side effects: removes stale partial downloads, removes a leftover
    unconverted input file when conversion is enabled, and removes the
    existing file when it is going to be downloaded again.

    music_file -- base name of the file, without folder or extension.
    raw_song   -- the Spotify reference or song name given by the user.
    islist     -- True when running from list.txt (never prompts).

    Returns True when the existing file is kept, False when the song has
    to be downloaded.
    """
    base = "Music/" + music_file

    # Partial downloads are stored as '<file><ext>.temp'.
    for suffix in sorted(set(['.m4a.temp', args.input_ext + '.temp'])):
        if os.path.exists(base + suffix):
            os.remove(base + suffix)

    if args.no_convert:
        extension = args.input_ext
    else:
        if os.path.exists(base + args.input_ext):
            os.remove(base + args.input_ext)
        extension = args.output_ext

    target = base + extension
    if not os.path.isfile(target):
        return False

    if extension == '.mp3' and isSpotify(raw_song):
        # A file with the same name but a different title tag is a
        # different song: replace it.
        audiofile = eyed3.load(target)
        meta_tags = generateMetaTags(raw_song)
        tag = getattr(audiofile, 'tag', None)
        # Without a readable tag or without metadata there is nothing to
        # compare, so fall through to the normal "already exists" handling.
        if tag is not None and meta_tags is not None:
            if not tag.title == meta_tags['name']:
                os.remove(target)
                return False

    if islist:
        return True

    prompt = raw_input(
        'Song with same name has already been downloaded. Re-download? (y/n): ').lower()
    if prompt == "y":
        os.remove(target)
        return False
    return True
# Remove song from list.txt once downloaded
def trimSong(file):
    """Drop the first line of the text file at path `file`.

    The file is rewritten in place with every line except the first; an
    empty file stays empty.
    """
    with open(file, 'r') as fin:
        data = fin.read().splitlines(True)
    with open(file, 'w') as fout:
        fout.writelines(data[1:])
def fixSong(music_file, meta_tags):
    """Write ID3 tags and album art to 'Music/<music_file>.mp3'.

    music_file -- base name of the file, without folder or extension.
    meta_tags  -- Spotify track dictionary as returned by
                  generateMetaTags().

    The cover image is downloaded to 'last_albumart.jpg' in the working
    directory and embedded as the front cover. Tags are saved as ID3 v2.3.
    """
    audiofile = eyed3.load("Music/" + music_file + '.mp3')
    tag = audiofile.tag
    primary_artist = meta_tags['artists'][0]['name']

    tag.artist = primary_artist
    tag.album_artist = primary_artist
    tag.album = meta_tags['album']['name']
    tag.title = meta_tags['name']
    tag.track_num = meta_tags['track_number']
    tag.disc_num = meta_tags['disc_number']
    tag.release_date = spotify.album(
        meta_tags['album']['id'])['release_date']

    response = requests.get(
        meta_tags['album']['images'][0]['url'], stream=True)
    with open('last_albumart.jpg', 'wb') as out_file:
        copyfileobj(response.raw, out_file)
    # Read the image back through a context manager so the handle is
    # always closed.
    with open("last_albumart.jpg", "rb") as art_file:
        albumart = art_file.read()

    # Picture type 3 is the front cover.
    tag.images.set(3, albumart, "image/jpeg")
    tag.save(version=(2, 3, 0))
def fixSongM4A(music_file, meta_tags):
    """Write MP4 (iTunes style) tags and album art to the encoded file.

    eyed3 serves only mp3, not aac, so mutagen is used here. Apple has
    specific tag names - see the mutagen docs:
    http://mutagen.readthedocs.io/en/latest/api/mp4.html

    music_file -- base name of the file, without folder or extension; the
                  file tagged is 'Music/_<music_file><output_ext>'.
    meta_tags  -- Spotify track dictionary as returned by
                  generateMetaTags().

    The cover image is downloaded to 'last_albumart.jpg' in the working
    directory and embedded as JPEG cover art.
    """
    tags = {'album': '\xa9alb',
            'artist': '\xa9ART',
            'year': '\xa9day',
            'title': '\xa9nam',
            'comment': '\xa9cmt',
            'group': '\xa9grp',
            'writer': '\xa9wrt',
            'genre': '\xa9gen',
            'track': 'trkn',
            'aart': 'aART',
            'disk': 'disk',
            'cpil': 'cpil',
            'tempo': 'tmpo'}

    audiofile = MP4('Music/_' + music_file + args.output_ext)
    primary_artist = meta_tags['artists'][0]

    audiofile[tags['artist']] = primary_artist['name']
    # Album artist and disc number mirror what fixSong() writes for mp3.
    audiofile[tags['aart']] = primary_artist['name']
    audiofile[tags['album']] = meta_tags['album']['name']
    audiofile[tags['title']] = meta_tags['name']

    artist = spotify.artist(primary_artist['id'])
    genres = artist.get('genres')
    if genres:
        # Many artists have no genres listed; leave the tag unset then.
        audiofile[tags['genre']] = titlecase(genres[0])

    album = spotify.album(meta_tags['album']['id'])
    audiofile[tags['year']] = album['release_date']
    # Number pairs are (number, total); 0 means the total is unknown.
    audiofile[tags['track']] = [(meta_tags['track_number'], 0)]
    audiofile[tags['disk']] = [(meta_tags['disc_number'], 0)]

    response = requests.get(
        meta_tags['album']['images'][0]['url'], stream=True)
    with open('last_albumart.jpg', 'wb') as out_file:
        copyfileobj(response.raw, out_file)
    with open("last_albumart.jpg", "rb") as f:
        audiofile["covr"] = [
            MP4Cover(f.read(), imageformat=MP4Cover.FORMAT_JPEG)]
    audiofile.save()
# Logic behind preparing the song to download to finishing meta-tags
def grabSingle(raw_song, number=None):
    """Download one song, convert it and write its meta-tags.

    raw_song -- Spotify reference or plain song name.
    number   -- position in the download list; when given (and non-zero)
                the song is treated as part of a list, so an existing file
                is kept without prompting.

    Does nothing when no video is selected or the file is kept. Conversion
    and tagging are skipped when args.no_convert is set.
    """
    islist = bool(number)
    content = goPafy(raw_song)
    if content is None:
        return
    print(getYouTubeTitle(content, number))
    music_file = generateFileName(content)
    if checkExists(music_file, raw_song, islist=islist):
        return

    downloadSong(content)
    print('')
    if args.no_convert:
        return

    # Report the extensions actually in use (defaults give '.m4a to mp3').
    print('Converting ' + music_file + args.input_ext +
          ' to ' + args.output_ext.lstrip('.'))
    if args.output_ext == '.m4a':
        convertToM4A(music_file)
        fixTags = fixSongM4A
    else:
        convertToMP3(music_file)
        fixTags = fixSong

    meta_tags = generateMetaTags(raw_song)
    if meta_tags is not None:
        print('Fixing meta-tags')
        fixTags(music_file, meta_tags)
# Fix python2 encoding issues
def fixEncoding(query):
    """Return query in the string form the running interpreter expects.

    On Python 3 the value is returned unchanged. On Python 2 unicode text
    is encoded to UTF-8 bytes; values that are already byte strings are
    returned as they are, since re-encoding non-ASCII bytes would raise.
    """
    if version_info >= (3,) or isinstance(query, str):
        return query
    return query.encode('utf-8')
def grabList(file):
    """Download every song listed in the text file at path `file`.

    The file holds one song (Spotify reference or name) per line. Each
    song is removed from the file once downloaded. A song that fails is
    moved to the end of both the queue and the file and retried after the
    others.

    NOTE(review): a song that fails every time is retried indefinitely;
    consider capping the number of attempts.
    """
    from collections import deque

    with open(file, 'r') as fin:
        original = fin.read()

    # Ignore blank lines in list.txt (if any)
    lines = [line for line in original.splitlines() if line.strip()]

    # trimSong() always drops the first line of the file, so keep the file
    # in step with the queue: no blank lines, every entry newline-ended.
    normalized = ''.join(line + '\n' for line in lines)
    if normalized != original:
        with open(file, 'w') as fout:
            fout.write(normalized)

    print('Total songs in list = ' + str(len(lines)) + ' songs')
    print('')

    pending = deque(lines)
    # Count the number of song being downloaded
    number = 1
    while pending:
        raw_song = pending.popleft()
        try:
            grabSingle(raw_song, number=number)
            trimSong(file)
            number += 1
            print('')
        except KeyboardInterrupt:
            graceQuit()
        except Exception:
            # Move the song to the end of the queue and of the file. The
            # newline keeps later entries from being glued onto it.
            pending.append(raw_song)
            trimSong(file)
            with open(file, 'a') as myfile:
                myfile.write(raw_song + '\n')
            print('Failed to download song. Will retry after other songs.')
def getArgs(argv=None):
    """Parse the command line options.

    argv -- list of argument strings; None means use sys.argv[1:].

    Returns the argparse namespace with no_convert, manual, list, quiet,
    input_ext and output_ext.
    """
    # A single parser: re-creating it would drop the description and the
    # formatter that shows defaults in --help.
    parser = argparse.ArgumentParser(
        description='Find and convert songs from Spotify, Youtube etc.',
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument('-n', '--no-convert', default=False,
                        help='Skip the conversion process and meta-tags',
                        action='store_true')
    parser.add_argument('-m', '--manual', default=False,
                        help='Choose the song to download manually',
                        action='store_true')
    parser.add_argument('-l', '--list', default=False,
                        help='Download songs present in list.txt',
                        action='store_true')
    parser.add_argument('-q', '--quiet', default=False,
                        help='Spare us output of ffmpeg conversion',
                        action='store_true')
    parser.add_argument('-i', '--input_ext', default='.m4a',
                        help='Prefered input format .m4a or .webm (Opus)')
    parser.add_argument('-o', '--output_ext', default='.mp3',
                        help='Prefered output extension .mp3 or .m4a (AAC)')
    return parser.parse_args(argv)
def graceQuit():
    """Print a farewell message and terminate the program.

    Raises SystemExit with no exit code, i.e. a normal exit.
    """
    print('')
    print('')
    print('Exitting..')
    # SystemExit is what exit() raises, but it is always available, even
    # when the site module (which provides exit()) is not loaded.
    raise SystemExit
if __name__ == '__main__':

    # Python 3 compatibility
    if version_info > (3, 0):
        raw_input = input

    eyed3.log.setLevel("ERROR")

    # Work relative to the script's own directory.
    os.chdir(path[0])
    if not os.path.exists("Music"):
        os.makedirs("Music")
    # Make sure list.txt exists without touching its content.
    open('list.txt', 'a').close()

    # Please respect this user token :)
    # NOTE(review): application credentials are embedded in the source;
    # consider loading them from the environment or a config file.
    # The credentials object gets its own name so the imported `oauth2`
    # module is not shadowed.
    credentials = oauth2.SpotifyClientCredentials(
        client_id='4fe3fecfe5334023a1472516cc99d805',
        client_secret='0f02b7c483c04257984695007a4a8d5c')
    token = credentials.get_access_token()
    spotify = spotipy.Spotify(auth=token)

    # Set up arguments
    args = getArgs()

    if args.no_convert:
        print("-n, --no-convert skip the conversion process and meta-tags")
    if args.manual:
        print("-m, --manual choose the song to download manually")
    print('')

    if args.list:
        # Batch mode: process list.txt and finish.
        grabList(file='list.txt')
    else:
        # Interactive mode: keep asking for songs until interrupted.
        while True:
            # Clear partial downloads left by an interrupted run.
            for temp in os.listdir('Music/'):
                if temp.endswith(('.m4a.temp', args.input_ext + '.temp')):
                    os.remove('Music/' + temp)
            try:
                print('Enter a Spotify URL or Song Name: ')
                command = raw_input('>> ')
                print('')
                grabSingle(raw_song=command)
                print('')
            except (KeyboardInterrupt, EOFError):
                # Ctrl-C or end of input both end the session cleanly.
                graceQuit()