Moved functions into a new Bandcamp class
parent
7e0fd439dc
commit
1a80306f7f
|
@ -0,0 +1,171 @@
|
|||
import unicodedata
|
||||
import os
|
||||
import urllib2
|
||||
|
||||
from mutagen.mp3 import MP3
|
||||
from mutagen.id3 import TIT2
|
||||
from mutagen.easyid3 import EasyID3
|
||||
from bs4 import BeautifulSoup
|
||||
import requests
|
||||
import sys
|
||||
import Bandcamp
|
||||
from os.path import expanduser
|
||||
|
||||
import jsobj
|
||||
|
||||
|
||||
class Bandcamp:
|
||||
DOWNLOAD_DIR = expanduser("~/music")
|
||||
|
||||
# def __init__(self, artist, album):
|
||||
# self.artist = artist
|
||||
# self.album = album
|
||||
|
||||
|
||||
def get_embed_string_block(self, request):
|
||||
embedBlock = request.text.split("var EmbedData = ")
|
||||
|
||||
embedStringBlock = embedBlock[1]
|
||||
embedStringBlock = unicodedata.normalize('NFKD', embedStringBlock).encode('ascii', 'ignore')
|
||||
embedStringBlock = embedStringBlock.split("};")[0] + "};"
|
||||
embedStringBlock = jsobj.read_js_object("var EmbedData = %s" % str(embedStringBlock))
|
||||
|
||||
return embedStringBlock
|
||||
|
||||
|
||||
def sanatize_text(self, text, space=False, slash=False, period=False):
|
||||
result = text
|
||||
|
||||
if not space:
|
||||
result = result.replace(" ", "")
|
||||
if not slash:
|
||||
result = result.replace("/", "")
|
||||
if not period:
|
||||
result = result.replace(".", "")
|
||||
|
||||
return result
|
||||
|
||||
|
||||
def download(self, request, destination, show_progress=False):
|
||||
remote_file = urllib2.urlopen(request)
|
||||
meta = remote_file.info()
|
||||
file_size = int(meta.getheaders("Content-Length")[0])
|
||||
file_size_dl = 0
|
||||
block_sz = 8192
|
||||
|
||||
local_file = open(destination, 'wb')
|
||||
|
||||
while True:
|
||||
buffer = remote_file.read(block_sz)
|
||||
if not buffer:
|
||||
break
|
||||
|
||||
file_size_dl += len(buffer)
|
||||
local_file.write(buffer)
|
||||
|
||||
if show_progress:
|
||||
self.display_progress(file_size_dl, file_size)
|
||||
|
||||
local_file.close()
|
||||
print "Done downloading: " + destination
|
||||
|
||||
|
||||
def display_progress(self, current, total):
|
||||
factor = float(current) / total
|
||||
percent = factor * 100
|
||||
status = str( int(round(percent)) )
|
||||
|
||||
sys.stdout.write("Download progress: %s%% \r" % (status))
|
||||
sys.stdout.flush()
|
||||
|
||||
|
||||
def download_track(self, track, url, title, album_path, artist, album):
|
||||
print "Now Downloading: " + track['title'], track['file']['mp3-128']
|
||||
|
||||
req = urllib2.Request(url, headers={'User-Agent': "Magic Browser"})
|
||||
destination = album_path + '/' + self.sanatize_text(track['title']) + '.mp3'
|
||||
|
||||
self.download(req, destination, show_progress = True)
|
||||
|
||||
|
||||
def write_id3_tags(self, track, title, album_path, artist, album):
|
||||
print "Encoding . . . "
|
||||
|
||||
audio = MP3(album_path + '/' + track['title'] + '.mp3')
|
||||
audio["TIT2"] = TIT2(encoding=3, text=["title"])
|
||||
audio.save()
|
||||
|
||||
audio = EasyID3(album_path + '/' + track['title'] + '.mp3')
|
||||
audio["title"] = track['title']
|
||||
audio["artist"] = artist
|
||||
audio["album"] = album
|
||||
audio.save()
|
||||
|
||||
print "Done encoding . . . "
|
||||
|
||||
def create_directories(self, artist, album):
|
||||
album_path = self.DOWNLOAD_DIR + "/" + artist + "/" + self.sanatize_text(album)
|
||||
|
||||
if not os.path.exists(self.DOWNLOAD_DIR):
|
||||
os.makedirs(self.DOWNLOAD_DIR)
|
||||
|
||||
if not os.path.exists(self.DOWNLOAD_DIR + "/zips"):
|
||||
os.makedirs(self.DOWNLOAD_DIR + "/zips")
|
||||
|
||||
if not os.path.exists(album_path):
|
||||
os.makedirs(album_path)
|
||||
|
||||
return album_path
|
||||
|
||||
def get_embed_string_block(self, request):
|
||||
embedBlock = request.text.split("var EmbedData = ")
|
||||
|
||||
embedStringBlock = embedBlock[1]
|
||||
embedStringBlock = unicodedata.normalize('NFKD', embedStringBlock).encode('ascii', 'ignore')
|
||||
embedStringBlock = embedStringBlock.split("};")[0] + "};"
|
||||
embedStringBlock = jsobj.read_js_object("var EmbedData = %s" % str(embedStringBlock))
|
||||
|
||||
return embedStringBlock
|
||||
|
||||
|
||||
def extract_album_meta_data(self, request):
|
||||
album = {}
|
||||
|
||||
embedData = self.get_embed_string_block(request)
|
||||
|
||||
block = request.text.split("var TralbumData = ")
|
||||
|
||||
stringBlock = block[1]
|
||||
stringBlock = unicodedata.normalize('NFKD', stringBlock).encode('ascii', 'ignore')
|
||||
stringBlock = stringBlock.split("};")[0] + "};"
|
||||
stringBlock = jsobj.read_js_object("var TralbumData = %s" % str(stringBlock))
|
||||
|
||||
album['title'] = embedData['EmbedData']['album_title']
|
||||
album['artist'] = stringBlock['TralbumData']['artist']
|
||||
album['tracks'] = stringBlock['TralbumData']['trackinfo']
|
||||
|
||||
return album
|
||||
|
||||
|
||||
def parse_album_page(self, url):
|
||||
print "Starting the parsing for: " + url
|
||||
|
||||
r = requests.get(url)
|
||||
soup = BeautifulSoup(r.text)
|
||||
|
||||
album = self.extract_album_meta_data(r)
|
||||
album['path'] = self.create_directories(album['artist'], album['title'])
|
||||
|
||||
for track in album['tracks']:
|
||||
title = self.sanatize_text(track['title'], space=True)
|
||||
url = track['file']['mp3-128']
|
||||
|
||||
self.download_track(track, url, title, album['path'], album['artist'], album['title'])
|
||||
self.write_id3_tags(track, title, album['path'], album['artist'], album['title'])
|
||||
|
||||
|
||||
if __name__ == '__main__':
|
||||
url = 'http://wmdchiptune.bandcamp.com/album/sophrosyne'
|
||||
|
||||
bc = Bandcamp()
|
||||
bc.parse_album_page(url)
|
|
@ -17,6 +17,7 @@ from mutagen.easyid3 import EasyID3
|
|||
from bs4 import BeautifulSoup
|
||||
import requests
|
||||
import sys
|
||||
import Bandcamp
|
||||
|
||||
import jsobj
|
||||
|
||||
|
@ -159,5 +160,6 @@ def parse_file(url):
|
|||
download_track(track, url, title, album['path'], album['artist'], album['title'])
|
||||
write_id3_tags(track, title, album['path'], album['artist'], album['title'])
|
||||
|
||||
|
||||
url = raw_input("Please enter the url of the album or song you wish to download: ")
|
||||
parse_file(url)
|
||||
|
|
Loading…
Reference in New Issue