id: Video identifier.
url: Final video URL.
- uploader: Nickname of the video uploader.
+ uploader: Nickname of the video uploader, unescaped.
upload_date: Video upload date (YYYYMMDD).
title: Video title, unescaped.
ext: Video filename extension.
description: One-line video description.
player_url: SWF Player URL (used for rtmpdump).
+ The fields should all be Unicode strings.
+
Subclasses should override the _real_initialize() and _real_extract()
methods and define a _VALID_URL regexp. In most cases they should also
be added to the list of extractors.
'ext': video_extension.decode('utf-8'),
'thumbnail': video_thumbnail.decode('utf-8'),
'description': video_description,
- 'thumbnail': video_thumbnail,
}]
info = {
'id': title,
'url': url,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
'title': title,
'ext': ext,
'urlhandle': urlh
'id': videoId,
'url': videoUrl,
'uploader': showName,
- 'upload_date': None,
+ 'upload_date': u'NA',
'title': showName,
'ext': 'flv',
'thumbnail': imgUrl,
info = {
'id': video_id,
'internal_id': internal_video_id,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
}
self.report_extraction(video_id)
info = {
'id': video_id,
'url': video_url,
- 'uploader': None,
- 'upload_date': None,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
'title': video_title,
'ext': 'flv',
'thumbnail': video_thumbnail,
description = mobj.group(1)
# upload date
- upload_date = None
+ upload_date = u'NA'
mobj = re.search("pretty-date'>on ([\w]+ [\d]+, [\d]+ \d+:\d+)</abbr></h2>", webpage)
if mobj:
try:
info = {
'id': video_id,
'url': video_url,
- 'uploader': None,
- 'upload_date': None,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
'title': video_title,
'ext': extension, # Extension is always(?) mp4, but seems to be flv
'thumbnail': None,
video = mobj.group('video')
info = {
'id': course + '_' + video,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
}
self.report_extraction(info['id'])
info = {
'id': course,
'type': 'playlist',
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
}
self.report_download_webpage(info['id'])
info = {
'id': 'Stanford OpenClassroom',
'type': 'playlist',
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
}
self.report_download_webpage(info['id'])
'id': video_id,
'url': video_url,
'uploader': performer,
+ 'upload_date': u'NA',
'title': video_title,
'ext': ext,
'format': format,
info = {
'id': '%s_part%02d' % (video_id, index),
'url': download_url,
- 'uploader': None,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
'title': video_title,
'ext': ext,
}
return [{
'id': video_id,
'url': video_url,
- 'uploader': None,
- 'upload_date': None,
+ 'uploader': u'NA',
+ 'upload_date': u'NA',
'title': video_title,
'ext': 'flv',
'thumbnail': video_thumbnail,