metadatafromtitle.py (1652B)
1 from __future__ import unicode_literals 2 3 import re 4 5 from .common import PostProcessor 6 7 8 class MetadataFromTitlePP(PostProcessor): 9 def __init__(self, downloader, titleformat): 10 super(MetadataFromTitlePP, self).__init__(downloader) 11 self._titleformat = titleformat 12 self._titleregex = (self.format_to_regex(titleformat) 13 if re.search(r'%\(\w+\)s', titleformat) 14 else titleformat) 15 16 def format_to_regex(self, fmt): 17 r""" 18 Converts a string like 19 '%(title)s - %(artist)s' 20 to a regex like 21 '(?P<title>.+)\ \-\ (?P<artist>.+)' 22 """ 23 lastpos = 0 24 regex = '' 25 # replace %(..)s with regex group and escape other string parts 26 for match in re.finditer(r'%\((\w+)\)s', fmt): 27 regex += re.escape(fmt[lastpos:match.start()]) 28 regex += r'(?P<' + match.group(1) + '>.+)' 29 lastpos = match.end() 30 if lastpos < len(fmt): 31 regex += re.escape(fmt[lastpos:]) 32 return regex 33 34 def run(self, info): 35 title = info['title'] 36 match = re.match(self._titleregex, title) 37 if match is None: 38 self._downloader.to_screen( 39 '[fromtitle] Could not interpret title of video as "%s"' 40 % self._titleformat) 41 return [], info 42 for attribute, value in match.groupdict().items(): 43 info[attribute] = value 44 self._downloader.to_screen( 45 '[fromtitle] parsed %s: %s' 46 % (attribute, value if value is not None else 'NA')) 47 48 return [], info