1
0
mirror of https://github.com/l1ving/youtube-dl synced 2025-01-22 17:53:00 +08:00
youtube-dl/youtube_dl/extractor/dump.py

40 lines
1.0 KiB
Python
Raw Normal View History

2014-08-22 04:30:49 +08:00
# encoding: utf-8
from __future__ import unicode_literals
import re
from .common import InfoExtractor
2014-08-22 07:43:19 +08:00
2014-08-22 04:30:49 +08:00
class DumpIE(InfoExtractor):
    """Information extractor for video pages hosted on dump.com."""

    # The ``id`` group captures the alphanumeric path segment after the host.
    _VALID_URL = r'^https?://(?:www\.)?dump\.com/(?P<id>[a-zA-Z0-9]+)/'

    _TEST = {
        'url': 'http://www.dump.com/oneus/',
        'md5': 'ad71704d1e67dfd9e81e3e8b42d69d99',
        'info_dict': {
            'id': 'oneus',
            'ext': 'flv',
            'title': "He's one of us.",
            # Raw string: ``\.`` is a regex escape, not a Python string
            # escape, and would otherwise trigger an invalid-escape warning.
            'thumbnail': r're:^https?://.*\.jpg$',
        },
    }

    def _real_extract(self, url):
        """Build the info dict for a single dump.com page.

        Args:
            url: Page URL. NOTE(review): assumed to match ``_VALID_URL``;
                a non-matching URL makes ``re.match`` return ``None`` and
                the ``group`` call below raise ``AttributeError``.

        Returns:
            A dict with the keys ``id``, ``title``, ``url`` and
            ``thumbnail``.
        """
        m = re.match(self._VALID_URL, url)
        video_id = m.group('id')

        webpage = self._download_webpage(url, video_id)

        # The media URL is the second argument of the page's
        # ``s1.addVariable("file", "...")`` call. The dot is escaped so that
        # only the literal ``s1.addVariable`` matches.
        video_url = self._search_regex(
            r's1\.addVariable\("file",\s*"([^"]+)"', webpage, 'video URL')

        thumb = self._og_search_thumbnail(webpage)
        # NOTE(review): ``[^"]+`` is greedy and may run past the first
        # ``</b>`` when no double quote intervenes; confirm against the
        # live page markup before tightening.
        title = self._search_regex(r'<b>([^"]+)</b>', webpage, 'title')

        return {
            'id': video_id,
            'title': title,
            'url': video_url,
            'thumbnail': thumb,
        }