summaryrefslogtreecommitdiffhomepage
path: root/youtube_dl/extractor/roxwel.py
blob: d339e6cb532223e271a5c762ceb1ff58c6071ee2 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
import re
import json

from .common import InfoExtractor
from ..utils import unified_strdate, determine_ext


class RoxwelIE(InfoExtractor):
    _VALID_URL = r'https?://www\.roxwel\.com/player/(?P<filename>.+?)(\.|\?|$)'

    _TEST = {
        u'url': u'http://www.roxwel.com/player/passionpittakeawalklive.html',
        u'file': u'passionpittakeawalklive.flv',
        u'md5': u'd9dea8360a1e7d485d2206db7fe13035',
        u'info_dict': {
            u'title': u'Take A Walk (live)',
            u'uploader': u'Passion Pit',
            u'description': u'Passion Pit performs "Take A Walk\" live at The Backyard in Austin, Texas. ',
        },
        u'skip': u'Requires rtmpdump',
    }

    def _real_extract(self, url):
        mobj = re.match(self._VALID_URL, url)
        filename = mobj.group('filename')
        info_url = 'http://www.roxwel.com/api/videos/%s' % filename
        info_page = self._download_webpage(info_url, filename,
                                           u'Downloading video info')

        self.report_extraction(filename)
        info = json.loads(info_page)
        rtmp_rates = sorted([int(r.replace('flv_', '')) for r in info['media_rates'] if r.startswith('flv_')])
        best_rate = rtmp_rates[-1]
        url_page_url = 'http://roxwel.com/pl_one_time.php?filename=%s&quality=%s' % (filename, best_rate)
        rtmp_url = self._download_webpage(url_page_url, filename, u'Downloading video url')
        ext = determine_ext(rtmp_url)
        if ext == 'f4v':
            rtmp_url = rtmp_url.replace(filename, 'mp4:%s' % filename)

        return {'id': filename,
                'title': info['title'],
                'url': rtmp_url,
                'ext': 'flv',
                'description': info['description'],
                'thumbnail': info.get('player_image_url') or info.get('image_url_large'),
                'uploader': info['artist'],
                'uploader_id': info['artistname'],
                'upload_date': unified_strdate(info['dbdate']),
                }