summaryrefslogtreecommitdiff
path: root/youtube_dl/postprocessor/metadatafromtitle.py
blob: f5c14d974f4b44c9a5c014a536a0b2f72c65b2db (plain)
    1 from __future__ import unicode_literals
    2 
    3 import re
    4 
    5 from .common import PostProcessor
    6 
    7 
    8 class MetadataFromTitlePP(PostProcessor):
    9     def __init__(self, downloader, titleformat):
   10         super(MetadataFromTitlePP, self).__init__(downloader)
   11         self._titleformat = titleformat
   12         self._titleregex = (self.format_to_regex(titleformat)
   13                             if re.search(r'%\(\w+\)s', titleformat)
   14                             else titleformat)
   15 
   16     def format_to_regex(self, fmt):
   17         r"""
   18         Converts a string like
   19            '%(title)s - %(artist)s'
   20         to a regex like
   21            '(?P<title>.+)\ \-\ (?P<artist>.+)'
   22         """
   23         lastpos = 0
   24         regex = ''
   25         # replace %(..)s with regex group and escape other string parts
   26         for match in re.finditer(r'%\((\w+)\)s', fmt):
   27             regex += re.escape(fmt[lastpos:match.start()])
   28             regex += r'(?P<' + match.group(1) + '>.+)'
   29             lastpos = match.end()
   30         if lastpos < len(fmt):
   31             regex += re.escape(fmt[lastpos:])
   32         return regex
   33 
   34     def run(self, info):
   35         title = info['title']
   36         match = re.match(self._titleregex, title)
   37         if match is None:
   38             self._downloader.to_screen(
   39                 '[fromtitle] Could not interpret title of video as "%s"'
   40                 % self._titleformat)
   41             return [], info
   42         for attribute, value in match.groupdict().items():
   43             info[attribute] = value
   44             self._downloader.to_screen(
   45                 '[fromtitle] parsed %s: %s'
   46                 % (attribute, value if value is not None else 'NA'))
   47 
   48         return [], info

Generated by cgit