From dea421f3937ce3ab9392b0086bdcbc20edcbf7fe Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?D=C3=A9stin=20Reed?= Date: Mon, 9 Jan 2017 19:04:52 +0100 Subject: [PATCH] [BlogTalkRadio] Add new extractor --- youtube_dl/extractor/blogtalkradio.py | 33 +++++++++++++++++++++++++++ youtube_dl/extractor/extractors.py | 1 + 2 files changed, 34 insertions(+) create mode 100644 youtube_dl/extractor/blogtalkradio.py diff --git a/youtube_dl/extractor/blogtalkradio.py b/youtube_dl/extractor/blogtalkradio.py new file mode 100644 index 000000000..1ffe77471 --- /dev/null +++ b/youtube_dl/extractor/blogtalkradio.py @@ -0,0 +1,33 @@ +from __future__ import unicode_literals + +from .common import InfoExtractor + + +class BlogTalkRadioIE(InfoExtractor): + _VALID_URL = r'https?://(?:www\.)?blogtalkradio\.com/(?:[^/]+/)+(?P[^.]+)' + _TEST = { + 'url': 'http://www.blogtalkradio.com/ghost/2008/02/20/true-conservative-radio-hosted-by-ghost', + 'md5': '733fdaef2a328f7c8884ac6a33ca0097', + 'info_dict': { + 'id': 'true-conservative-radio-hosted-by-ghost', + 'ext': 'mp3', + 'title': 'True Conservative Radio hosted by Ghost', + 'description': 'free format (political chat)', + 'thumbnail': r're:^https?://.*\.jpg$', + } + } + + def _real_extract(self, url): + display_id = self._match_id(url) + webpage = self._download_webpage(url, display_id) + + title = self._og_search_title(webpage) + audio_url = self._html_search_meta('twitter:player:stream', webpage, 'audio url') + + return { + 'id': display_id, + 'title': title, + 'url': audio_url, + 'description': self._og_search_description(webpage), + 'thumbnail': self._og_search_thumbnail(webpage), + } diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py index fcfe87f6f..638796193 100644 --- a/youtube_dl/extractor/extractors.py +++ b/youtube_dl/extractor/extractors.py @@ -106,6 +106,7 @@ from .bleacherreport import ( BleacherReportCMSIE, ) from .blinkx import BlinkxIE +from .blogtalkradio import BlogTalkRadioIE from .bloomberg import BloombergIE from .bokecc import BokeCCIE from .bpb import BpbIE