[bandcamp] Add support for subdomains (Fixes #2850)

author: Philipp Hagemeister <[email protected]> 2014-05-05 02:44:44 +0200
committer: Philipp Hagemeister <[email protected]> 2014-05-05 02:44:44 +0200
commit: b48f147d5a36b16e421b9b91fcc72b62e695c948 (patch)
tree: d193368fdb53fe757b4df9565697c296191c0266
parent: 4f3e943080f3381213ee979647f68eee43af4bb8 (diff)
download: youtube-dl-b48f147d5a36b16e421b9b91fcc72b62e695c948.tar.gz
youtube-dl-b48f147d5a36b16e421b9b91fcc72b62e695c948.zip
1 files changed, 7 insertions, 3 deletions
diff --git a/youtube_dl/extractor/bandcamp.py b/youtube_dl/extractor/bandcamp.py
index 886b0dfab..929aafdff 100644
--- a/youtube_dl/extractor/bandcamp.py
+++ b/youtube_dl/extractor/bandcamp.py
@@ -12,7 +12,7 @@ from ..utils import (
 
 
 class BandcampIE(InfoExtractor):
-    _VALID_URL = r'http://.*?\.bandcamp\.com/track/(?P<title>.*)'
+    _VALID_URL = r'https?://.*?\.bandcamp\.com/track/(?P<title>.*)'
     _TESTS = [{
         'url': 'http://youtube-dl.bandcamp.com/track/youtube-dl-test-song',
         'file': '1812978515.mp3',
@@ -100,7 +100,7 @@ class BandcampIE(InfoExtractor):
 
 class BandcampAlbumIE(InfoExtractor):
     IE_NAME = 'Bandcamp:album'
-    _VALID_URL = r'http://.*?\.bandcamp\.com/album/(?P<title>.*)'
+    _VALID_URL = r'https?://(?:(?P<subdomain>[^.]+)\.)?bandcamp\.com(?:/album/(?P<title>[^?#]+))?'
 
     _TEST = {
         'url': 'http://blazo.bandcamp.com/album/jazz-format-mixtape-vol-1',
@@ -128,8 +128,10 @@ class BandcampAlbumIE(InfoExtractor):
 
     def _real_extract(self, url):
         mobj = re.match(self._VALID_URL, url)
+        playlist_id = mobj.group('subdomain')
         title = mobj.group('title')
-        webpage = self._download_webpage(url, title)
+        display_id = title or playlist_id
+        webpage = self._download_webpage(url, display_id)
         tracks_paths = re.findall(r'<a href="(.*?)" itemprop="url">', webpage)
         if not tracks_paths:
             raise ExtractorError('The page doesn\'t contain any tracks')
@@ -139,6 +141,8 @@ class BandcampAlbumIE(InfoExtractor):
         title = self._search_regex(r'album_title : "(.*?)"', webpage, 'title')
         return {
             '_type': 'playlist',
+            'id': playlist_id,
+            'display_id': display_id,
             'title': title,
             'entries': entries,
         }
author	Philipp Hagemeister <[email protected]>	2014-05-05 02:44:44 +0200
committer	Philipp Hagemeister <[email protected]>	2014-05-05 02:44:44 +0200
commit	b48f147d5a36b16e421b9b91fcc72b62e695c948 (patch)
tree	d193368fdb53fe757b4df9565697c296191c0266
parent	4f3e943080f3381213ee979647f68eee43af4bb8 (diff)
download	youtube-dl-b48f147d5a36b16e421b9b91fcc72b62e695c948.tar.gz youtube-dl-b48f147d5a36b16e421b9b91fcc72b62e695c948.zip