Download using Spotify's song URL's

2026-07-04 00:41:55 +00:00 · 2016-08-24 21:57:04 +05:30
parent a56500440c
commit fcbb4a3f47
1 changed files with 199 additions and 137 deletions
--- a/bin/YTMusic
+++ b/bin/YTMusic
@@ -1,147 +1,203 @@
 #!/bin/python
 import mechanize
-from bs4 import BeautifulSoup as soup
+from bs4 import BeautifulSoup
 import pafy
 import os
 import requests
 from os.path import expanduser
 import spotipy
 #import spotipy.util as util
 import eyed3
 opsys = ''
 spotify = spotipy.Spotify()
 if not os.path.exists("Music"):
 	os.makedirs("Music")
 script_dir = expanduser("~") + '/YTMusic'
 os.chdir(script_dir)
 for m in os.listdir('Music/'):
 	if m.endswith(".temp") or m.endswith("webm"):
 		os.remove('Music/' + m)
 print ''
 convert = 1
 if os.name == 'nt':
 	opsys = 'win'
 	if not os.path.isfile('ffmpeg.exe'):
 		print 'ffmpeg not found, will not convert to mp3 (from m4a). download from https://ffmpeg.zeranoe.com/builds/ to be able to convert them'
 		convert = 0
 else:
 	opsys = 'linux'
 	check_install = os.system('which avconv > /dev/null')
 	if check_install == '':
 		print 'avconv not found, will not convert to mp3 (from m4a). use sudo apt-get install libav-tools to install it'
 		convert = 0
 def Main():
 	script_dir = os.getcwd()
 	Title = ''
 	while True:
 		try:
 			print('')
 			print('')
 			raw_song = raw_input('Enter a song/cmd: ')
 			print ''
 			if raw_song == "exit":
 				exit()
 			elif raw_song == "play":
 				if not Title == '':
 					if opsys == 'win':
-						if os.path.isfile(script_dir + "\Music\\" + Unencoded_Title + ".mp3"):
+						if os.path.isfile(script_dir + "\Music\\" + Title + ".mp3"):
-							os.system('"' + script_dir + "\Music\\" + Unencoded_Title + ".mp3" + '"')
+							os.system('"' + script_dir + "\Music\\" + Title + ".mp3" + '"')
 						else:
-							os.system('"' + script_dir + "\Music\\" + Unencoded_Title + ".m4a" + '"')
+							os.system('"' + script_dir + "\Music\\" + Title + ".webm" + '"')
 					elif opsys == 'linux':
-						if os.path.isfile(script_dir + '/Music/' + Unencoded_Title + '.mp3'):
+						if os.path.isfile(script_dir + '/Music/' + Title + '.mp3'):
-							os.system('mplayer "' + script_dir + '/Music/' + Unencoded_Title + '.mp3"')
+							os.system('mplayer "' + script_dir + '/Music/' + Title + '.mp3"')
 						else:
-							os.system('mplayer "' + script_dir + '/Music/' + Unencoded_Title + '.m4a"')
+							os.system('mplayer "' + script_dir + '/Music/' + Title + '.webm"')
-
+			elif raw_song == "lyrics":
 				if not Title == '':
 					if not label == '':
 						url = 'http://www.google.com/search?q=' + Title + ' metrolyrics'
 					else:
 						url = 'http://www.google.com/search?q=' + label + ' metrolyrics'
 					req = requests.get(url)
 					response = req.content
 					result=response
 					link_start=result.find('http://www.metrolyrics.com')
 					link_end=result.find('html',link_start+1)
 					link = result[link_start:link_end+4]
 					lyrics_html = link
 					try:
 						a = requests.get(lyrics_html)
 						#print (lyrics_html)
 						html_doc=  a.content
 						soup = BeautifulSoup(html_doc, 'html.parser')
 						#album_name = soup.find(id = "album-name-link").text
 						raw_lyrics= (soup.findAll('p', attrs={'class' : 'verse'}))
 						test1=unicode.join(u'\n',map(unicode,raw_lyrics))
 						test1 = (test1.replace('<p class="verse">','\n'))
 						test1 = (test1.replace('</br>',''))
 						test1 = (test1.replace('<br>',''))
 						test1 = test1.replace('</p>','')
 						print (test1)
 					except:
 						print 'Sorry, could not find lyrics'
 				else:
 					print 'No log to read from..'
 			elif raw_song == "convert":
-				print ''
+			elif raw_song == "list":
-				if opsys == 'win':
+					f = open('Music/list.txt')
-					if convert == 1:
+					lines = f.readlines()
-						y = 1
+					f.close()
-						x = 0
+					x = 0
-						for m in os.listdir(script_dir + '/Music/'):
+					y = 0
-							if m.endswith(".m4a"):
+					for songie in lines:
-								x = x + 1
+						if not songie == '\n' or not songie == '':
-						print 'Total songs to convert = ' + str(x) + ' songs'
+							x = x + 1
-						for m in os.listdir(script_dir + '/Music/'):
+					print 'Total songs in list = ' + str(x) + ' songs'
-							if m.endswith(".m4a"):
+					for songie in lines:
 						try:
 							if not songie == '\n' or not songie == '':
 								if (len(songie) == 22 and songie.replace(" ", "%20") == songie) or (songie.find('spotify') > -1):
 									song = songie.replace(songie[-1:], "")
 									content = spotify.track(song)
 									URL = "https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" + (content['artists'][0]['name'] + ' - ' + content['name']).replace(" ", "%20")
 								else:
 									song = songie.replace(" ", "%20")
 									URL = "https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" + song
 									song = ''
 								print ''
-								print str(y) + '. ' 'Converting ' + m + ' to mp3..'
+								br = mechanize.Browser()
 								br.set_handle_robots(False)
 								br.addheaders = [("User-agent","Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.13) Gecko/20101206 Ubuntu/10.10 (maverick) Firefox/3.6.13")]
 #								print URL
 								items = br.open(URL)
 #								print items
 								items = items.read()
 #								print items
 								zoom1 = items.find('yt-uix-tile-link')
 								zoom2 = items.find('yt-uix-tile-link', zoom1+1)
 								zoom3 = items.find('yt-uix-tile-link', zoom2+1)
 								part = items[zoom1-100: zoom2]
 								items_parse = BeautifulSoup(part, "html.parser")
 								#items_parse = soup(items, "html.parser")
 								br.close()
 								first_result = items_parse.find(attrs={'class':'yt-uix-tile-link'})['href']
 								full_link = "youtube.com" + first_result
 								#print full_link
 								video = pafy.new(full_link)
 								Title = ((video.title).replace("\\", "_").replace("/", "_").replace(":", "_").replace("*", "_").replace("?", "_").replace('"', "_").replace("<", "_").replace(">", "_").replace("|", "_").replace(" ", "_"))
 								y = y + 1
-								song = m.replace(".m4a", "")
+								print str(y) + '. ' + ((video.title).encode("utf-8"))
-								os.system('ffmpeg.exe -loglevel 0 -i "Music\\' + song + '.m4a" ' + '"Music\\' + song + '.mp3"')
+								if os.path.exists("Music/" + Title + ".webm.temp"):
-								os.remove("Music/" + m)
+									os.remove("Music/" + Title + ".webm.temp")
-					else:
+								download = 1
-						print 'ffmpeg is not installed, cant convert to mp3'
+								if os.path.exists("Music/" + Title + ".mp3"):
-				elif opsys == 'linux':
+									audiofile = eyed3.load("Music/" + Title + '.mp3')
-					if convert == 1:
+									if ((len(raw_song) == 22 and raw_song.replace(" ", "%20") == raw_song) or (raw_song.find('spotify') > -1)) and not audiofile.tag.title == content['name']:
-						y = 1
+										os.remove("Music/" + Title + '.mp3')
-						x = 0
+									else:
-						for m in os.listdir(script_dir + '/Music/'):
+										with open('Music/list.txt', 'r') as fin:
-							if m.endswith(".m4a"):
+											data = fin.read().splitlines(True)
-								x = x + 1
+										with open('Music/list.txt', 'w') as fout:
-						print 'Total songs to convert = ' + str(x) + ' songs'
+											fout.writelines(data[1:])
-						for m in os.listdir(script_dir + '/Music/'):
+										download = 0
-							if m.endswith(".m4a"):
+								if download == 1:
-								print ''
+									a = video.getbestaudio(preftype='webm')
-								print str(y) + '. ' 'Converting ' + m + ' to mp3..'
+									a.download(filepath="Music/" + Title + ".webm")
-								y = y + 1
+									with open('Music/list.txt', 'r') as fin:
-								song = m.replace(".m4a", "")
+										data = fin.read().splitlines(True)
-								os.system('sudo avconv -loglevel 0 -i "Music/' + song + '.m4a" ' + '"Music/' + song + '.mp3"')
+									with open('Music/list.txt', 'w') as fout:
-								os.remove("Music/" + m)
+										fout.writelines(data[1:])
-				else:
+										print ''
-					print 'avconv is not installed, cant convert to mp3'
+									print 'Converting ' + Title + '.webm' + ' to mp3..'
-			elif raw_song == "spotify":
+									os.system('sudo avconv -loglevel 0 -i ' + script_dir + '"/Music/' + Title + '.webm" ' + script_dir + '"/Music/' + Title + '.mp3"')
-				print ''
+									os.remove("Music/" + Title + '.webm')
-				f = open(script_dir + '/Music/spotify.txt')
+									os.system('sudo chmod 777 "' + script_dir + '/Music/' + Title + '.mp3"')
-				lines = f.readlines()
+									if (len(songie) == 22 and songie.replace(" ", "%20") == songie) or (songie.find('spotify') > -1):
-				print 'Total songs in spotify.txt = ' + str(len(lines)) + ' songs'
+										print 'Fixing meta-tags..'
-				y = 1
+										audiofile = eyed3.load("Music/" + Title + '.mp3')
-				for x in lines:
+										audiofile.tag.artist = content['artists'][0]['name']
-					print ''
+										audiofile.tag.album = content['album']['name']
-					song = x.replace(" ", "%20")
+										audiofile.tag.title = content['name']
-					br = mechanize.Browser()
+										os.system("wget -q " + content['album']['images'][0]['url'] + "  -O " + script_dir + "/Music/last_albumart.jpg")
-					br.set_handle_robots(False)
+										bla = open("Music/last_albumart.jpg","rb").read()
-					br.addheaders = [("User-agent","Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.13) Gecko/20101206 Ubuntu/10.10 (maverick) Firefox/3.6.13")]
+										audiofile.tag.images.set(3,bla,"image/jpeg")
-					URL = "https://www.youtube.com/results?search_query=" + song
+										audiofile.tag.save()
-					items = br.open(URL).read()
+							else:
-
+								with open('Music/list.txt', 'r') as fin:
 					items_parse = soup(items, "html.parser")
 					br.close()
 					first_result = items_parse.find(attrs={'class':'yt-uix-tile-link'})['href']
 					full_link = "youtube.com" + first_result
 					#print full_link
 					video = pafy.new(full_link)
 					Unencoded_Title = ((video.title).replace("\\", "_").replace("/", "_").replace(":", "_").replace("*", "_").replace("?", "_").replace('"', "_").replace("<", "_").replace(">", "_").replace("|", "_").replace(" ", "_"))
 					Title = Unencoded_Title.encode("utf-8")
 					print str(y) + '. ' + Title
 					y = y + 1
 					if os.path.exists("Music/" + Unencoded_Title + ".m4a.temp"):
 						os.remove("Music/" + Unencoded_Title + ".m4a.temp")
 					if os.path.exists("Music/" + Unencoded_Title + ".m4a") or os.path.exists("Music/" + Unencoded_Title + ".mp3"):
 						with open('Music/spotify.txt', 'r') as fin:
 							data = fin.read().splitlines(True)
 						with open('Music/spotify.txt', 'w') as fout:
 							fout.writelines(data[1:])
 					else:
 						audiostreams = video.audiostreams
 						for a in audiostreams:
 							if a.bitrate == "128k" and a.extension == "m4a":
 								a.download(filepath="Music/" + Unencoded_Title + ".m4a")
 								with open('Music/spotify.txt', 'r') as fin:
 									data = fin.read().splitlines(True)
-								with open('Music/spotify.txt', 'w') as fout:
+								with open('Music/list.txt', 'w') as fout:
 									fout.writelines(data[1:])
-								print ''
+
 						except KeyboardInterrupt:
 							Main()
 						except:
 							lines.append(songie)
 							with open('Music/list.txt', 'r') as fin:
 								data = fin.read().splitlines(True)
 							with open('Music/list.txt', 'w') as fout:
 								fout.writelines(data[1:])
 							with open("Music/list.txt", "a") as myfile:
 								myfile.write(songie)
 							print 'Could not complete a Song download, will try later..'
 			else:
 				song = raw_song.replace(" ", "%20")
 				br = mechanize.Browser()
 				br.set_handle_robots(False)
 				br.addheaders = [("User-agent","Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.13) Gecko/20101206 Ubuntu/10.10 (maverick) Firefox/3.6.13")]
-				URL = "https://www.youtube.com/results?search_query=" + song
+				if (len(raw_song) == 22 and raw_song == song) or (raw_song.find('spotify') > -1):
 					content = spotify.track(song)
 					label = (content['artists'][0]['name'] + ' - ' + content['name']).replace(" ", "%20")
 					URL = "https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" + label
 				else:
 					URL = "https://www.youtube.com/results?sp=EgIQAQ%253D%253D&q=" + song
 				items = br.open(URL).read()
-				items_parse = soup(items, "html.parser")
+				zoom1 = items.find('yt-uix-tile-link')
 				zoom2 = items.find('yt-uix-tile-link', zoom1+1)
 				zoom3 = items.find('yt-uix-tile-link', zoom2+1)
 				part = items[zoom1-100: zoom2]
 				items_parse = BeautifulSoup(part, "html.parser")
 				#items_parse = soup(items, "html.parser")
 				br.close()
 				first_result = items_parse.find(attrs={'class':'yt-uix-tile-link'})['href']
@@ -149,45 +205,51 @@ def Main():
 				#print full_link
 				video = pafy.new(full_link)
-				Unencoded_Title = ((video.title).replace("\\", "_").replace("/", "_").replace(":", "_").replace("*", "_").replace("?", "_").replace('"', "_").replace("<", "_").replace(">", "_").replace("|", "_").replace(" ", "_"))
+				Title = ((video.title).replace("\\", "_").replace("/", "_").replace(":", "_").replace("*", "_").replace("?", "_").replace('"', "_").replace("<", "_").replace(">", "_").replace("|", "_").replace(" ", "_"))
-				Title = Unencoded_Title.encode("utf-8")
+				print ((video.title).encode("utf-8"))
-				print Title
+				if os.path.exists("Music/" + Title + ".webm.temp"):
-				if os.path.exists("Music/" + Unencoded_Title + ".m4a.temp"):
+					os.remove("Music/" + Title + ".webm.temp")
 					os.remove("Music/" + Unencoded_Title + ".m4a.temp")
-				if os.path.exists("Music/" + Unencoded_Title + ".m4a") or os.path.exists("Music/" + Unencoded_Title + ".mp3"):
+				download = 1
 				if os.path.exists("Music/" + Title + ".mp3"):
 					audiofile = eyed3.load("Music/" + Title + '.mp3')
 					if ((len(raw_song) == 22 and raw_song.replace(" ", "%20") == raw_song) or (raw_song.find('spotify') > -1)) and not audiofile.tag.title == content['name']:
 						os.remove("Music/" + Title + '.mp3')
 					else:
 						prompt = raw_input('Song with same name has already been downloaded.. re-download? (y/n/play): ')
 						if prompt == "y":
-							if os.path.exists("Music/" + Unencoded_Title + ".mp3"):
+							os.remove("Music/" + Title + ".mp3")
-								os.remove("Music/" + Unencoded_Title + ".mp3")
+							download = 1
 							else:
 								os.remove("Music/" + Unencoded_Title + ".m4a")
 							audiostreams = video.audiostreams
 							for a in audiostreams:
 								if a.bitrate == "128k" and a.extension == "m4a":
 									a.download(filepath="Music/" + Unencoded_Title + ".m4a")
 							print '' 
 						elif prompt =="play":
 							download = 0
 							if opsys == 'win':
-								if os.path.isfile(script_dir + "\Music\\" + Unencoded_Title + ".mp3"):
+								if os.path.isfile(script_dir + "\Music\\" + Title + ".mp3"):
-									os.system('"' + script_dir + "\Music\\" + Unencoded_Title + ".mp3" + '"')
+									os.system('"' + script_dir + "\Music\\" + Title + ".mp3" + '"')
-								else:
+							else:
-									os.system('"' + script_dir + "\Music\\" + Unencoded_Title + ".m4a" + '"')
+								if os.path.isfile(script_dir + '/Music/' + Title + '.mp3'):
-							elif opsys == 'linux':
+									os.system('mplayer "' + script_dir + '/Music/' + Title + '.mp3"')
 								if os.path.isfile(script_dir + '/Music/' + Unencoded_Title + '.mp3'):
 									os.system('mplayer "' + script_dir + '/Music/' + Unencoded_Title + '.mp3"')
 								else:
 									os.system('mplayer "' + script_dir + '/Music/' + Unencoded_Title + '.m4a"')
 						else:
-							pass
+							download = 0
-
+				if download == 1:
-				else:
+					a = video.getbestaudio(preftype="webm")
-					audiostreams = video.audiostreams
+					a.download(filepath="Music/" + Title + ".webm")
-					for a in audiostreams:
+					print ''
-						if a.bitrate == "128k" and a.extension == "m4a":
+					print 'Converting ' + Title + '.webm' + ' to mp3..'
-							a.download(filepath="Music/" + Unencoded_Title + ".m4a")
+					os.system('sudo avconv -loglevel 0 -i ' + script_dir + '"/Music/' + Title + '.webm" ' + script_dir + '"/Music/' + Title + '.mp3"')
-							print ''
+					os.remove("Music/" + Title + '.webm')
 					os.system('sudo chmod 777 "' + script_dir + '/Music/' + Title + '.mp3"')
 					if (len(raw_song) == 22 and raw_song.replace(" ", "%20") == raw_song) or (raw_song.find('spotify') > -1):
 						print 'Fixing meta-tags..'
 						audiofile = eyed3.load("Music/" + Title + '.mp3')
 						audiofile.tag.artist = content['artists'][0]['name']
 						audiofile.tag.album = content['album']['name']
 						audiofile.tag.title = content['name']
 						os.system("wget -q " + content['album']['images'][0]['url'] + "  -O " + script_dir + "/Music/last_albumart.jpg")
 						bla = open("Music/last_albumart.jpg","rb").read()
 						audiofile.tag.images.set(3,bla,"image/jpeg")
 						audiofile.tag.save()
 		except KeyboardInterrupt:
 			pass
-Main()
+Main()