summaryrefslogtreecommitdiffhomepage
path: root/youtube_dl/postprocessor/metadatafromtitle.py
blob: 4c9d3aafec43ec12be9dcb4eba991274d8dbe849 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# -*- coding: utf-8 -*-

import re

from .common import PostProcessor
from ..utils import PostProcessingError


class MetadataFromTitlePPError(PostProcessingError):
    """Raised when a video title does not match the requested title format."""


class MetadataFromTitlePP(PostProcessor):
    """Post-processor that derives metadata fields from the video title.

    The title format contains placeholders of the form '%(name)s', e.g.
    '%(title)s - %(artist)s'.  Each placeholder is turned into a named regex
    group, and whatever that group captures from info['title'] is written
    back into the info dict under the placeholder's name.
    """

    def __init__(self, downloader, titleformat):
        """
        downloader:  object used for reporting; run() calls its to_screen()
        titleformat: format string with '%(name)s' placeholders
        """
        # Let the base class record the downloader; this class never sets
        # self._downloader itself, yet run() relies on it.
        super(MetadataFromTitlePP, self).__init__(downloader)
        self._titleformat = titleformat
        self._titleregex = self.fmtToRegex(titleformat)

    def fmtToRegex(self, fmt):
        r"""
        Converts a string like
           '%(title)s - %(artist)s'
        to a regex like
           '(?P<title>.+)\ \-\ (?P<artist>.+)'
        and returns that regex as a string.

        Every '%(name)s' placeholder becomes a named group matching one or
        more characters; all text between placeholders is escaped so that it
        is matched literally.
        """
        parts = []
        lastpos = 0
        # replace %(..)s with regex group and escape other string parts
        for match in re.finditer(r'%\((\w+)\)s', fmt):
            parts.append(re.escape(fmt[lastpos:match.start()]))
            parts.append(r'(?P<' + match.group(1) + '>.+)')
            lastpos = match.end()
        # literal text after the last placeholder (empty when there is none)
        parts.append(re.escape(fmt[lastpos:]))
        return ''.join(parts)

    def run(self, info):
        """
        Parse info['title'] with the configured format and store every
        captured field in info.

        Returns the tuple (True, info).
        Raises MetadataFromTitlePPError if the title does not match.
        """
        title = info['title']
        # re.match anchors at the start of the title only
        match = re.match(self._titleregex, title)
        if match is None:
            raise MetadataFromTitlePPError('Could not interpret title of video as "%s"' % self._titleformat)
        for attribute, value in match.groupdict().items():
            info[attribute] = value
            self._downloader.to_screen('[fromtitle] parsed %s: %s' % (attribute, value))

        return True, info