+# Xavier Beynon 2014
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
+from .soundcloud import SoundcloudIE
import datetime
import time
-import urllib.request
-import json
class AudiomackIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?audiomack\.com/song/(?P<id>[\w/-]+)'
- _TEST = {
- 'url': 'https://www.audiomack.com/song/crewneckkramer/story-i-tell',
- 'info_dict': {
- 'id': 'story-i-tell',
- 'ext': 'mp3',
- 'title': 'story-i-tell'
+ IE_NAME = 'audiomack'
+ _TESTS = [
+ #hosted on audiomack
+ {
+ 'url': 'http://www.audiomack.com/song/roosh-williams/extraordinary',
+ 'file': 'Roosh Williams - Extraordinary.mp3',
+ 'info_dict':
+ {
+ 'ext': 'mp3',
+ 'title': 'Roosh Williams - Extraordinary'
+ }
+ },
+ #hosted on soundcloud via audiomack
+ {
+ 'url': 'http://www.audiomack.com/song/xclusiveszone/take-kare',
+ 'file': '172419696.mp3',
+ 'info_dict':
+ {
+ 'ext': 'mp3',
+ 'title': 'Young Thug ft Lil Wayne - Take Kare',
+ "upload_date": "20141016",
+ "description": "New track produced by London On Da Track called “Take Kare\"\n\nhttp://instagram.com/theyoungthugworld\nhttps://www.facebook.com/ThuggerThuggerCashMoney\n",
+ "uploader": "Young Thug World"
+ }
}
- }
+ ]
def _real_extract(self, url):
- # TODO more code goes here, for example ...
- #webpage = self._download_webpage(url, video_id)
- #title = self._html_search_regex(r'<h1>(.*?)</h1>', webpage, 'title')
-
- assert("/song/" in url)
- songurl = url[url.index("/song/")+5:]
- title = songurl[songurl.rindex("/")+1:]
- video_id = title
- t = int(time.mktime(datetime.datetime.now().timetuple()))
- s = "http://www.audiomack.com/api/music/url/song"+songurl+"?_="+str(t)
- f = urllib.request.urlopen(s)
- j = f.read(1000).decode("utf-8")
- data = json.loads(j)
+ #id is what follows /song/ in url, usually the uploader name + title
+ id = url[url.index("/song/")+5:]
- return {
- 'id': video_id,
- 'title': title,
- 'url' : data["url"],
- 'ext' : 'mp3'
- # TODO more properties (see youtube_dl/extractor/common.py)
- }
+ #Call the api, which gives us a json doc with the real url inside
+ rightnow = int(time.mktime(datetime.datetime.now().timetuple()))
+ apiresponse = self._download_json("http://www.audiomack.com/api/music/url/song"+id+"?_="+str(rightnow), id)
+ if not url in apiresponse:
+ raise Exception("Unable to deduce api url of song")
+ realurl = apiresponse["url"]
+
+ #Audiomack wraps a lot of soundcloud tracks in their branded wrapper
+ # - if so, pass the work off to the soundcloud extractor
+ if SoundcloudIE.suitable(realurl):
+ sc = SoundcloudIE(downloader=self._downloader)
+ return sc._real_extract(realurl)
+ else:
+ #Pull out metadata
+ page = self._download_webpage(url, id)
+ artist = self._html_search_regex(r'<span class="artist">(.*)</span>', page, "artist")
+ songtitle = self._html_search_regex(r'<h1 class="profile-title song-title"><span class="artist">.*</span>(.*)</h1>', page, "title")
+ title = artist+" - "+songtitle
+ return {
+ 'id': title, # ignore id, which is not useful in song name
+ 'title': title,
+ 'url': realurl,
+ 'ext': 'mp3'
+ }