[idf1_extractor] Add new extractor (fulfilling support request #25671)

2025-01-21 06:22:51 +08:00 · 2020-06-19 17:08:13 -04:00 · 2020-06-19 17:08:13 -04:00 · acb0f56569
commit acb0f56569
parent 2391941f28
2 changed files with 45 additions and 0 deletions
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@ -451,6 +451,7 @@ from .hungama import (
    HungamaSongIE,
 )
 from .hypem import HypemIE
+from .idf1_extractor import IDF1IE
 from .ign import (
    IGNIE,
    OneUPIE,
@ -1516,3 +1517,4 @@ from .zattoo import (
 from .zdf import ZDFIE, ZDFChannelIE
 from .zingmp3 import ZingMp3IE
 from .zype import ZypeIE
+
--- a/youtube_dl/extractor/idf1_extractor.py
+++ b/youtube_dl/extractor/idf1_extractor.py
@ -0,0 +1,43 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+from ..utils import (
+    ExtractorError,
+    url_or_none,
+)
+
+
+class IDF1IE(InfoExtractor):
+    """Extractor for replay pages at idf1.fr/videos/<show>/<episode>.html.
+
+    NOTE(review): the tests below expect ``ext`` to be ``js`` and ``url`` to
+    be Dacast's ``player.js`` script, so the result looks like the embed
+    script rather than a media stream -- TODO confirm this is intended.
+    """
+
+    IE_NAME = 'IDF1'
+    # Show and episode slugs are any run of characters other than '/' and
+    # '.'; the episode slug (without the ``.html`` suffix) is the video id.
+    _VALID_URL = r'https?://(?:www\.)?idf1\.fr/videos/(?:[^/.]+)/(?P<id>[^/.]+)\.html'
+    _TESTS = [{
+        'url': 'https://www.idf1.fr/videos/jlpp/2020-05-29-partie-1.html',
+        'info_dict': {
+            'id': '2020-05-29-partie-1',
+            'ext': 'js',
+            'title': 'JLPP - 2020/05/29 - partie 1 sur le replay IDF1 - IDF1',
+            'description': '"Jacky lave plus propre, votre nouvelle &eacute;mission culte, tous les jours du lundi au vendredi &agrave; 17h00 sur IDF1&nbsp;!"',
+            'url': 'https://player.dacast.com/js/player.js?contentId=15863_f_890022',
+        },
+    }, {
+        'url': 'https://www.idf1.fr/videos/id-voyance/2020-03-13-partie-3.html',
+        'info_dict': {
+            'id': '2020-03-13-partie-3',
+            'ext': 'js',
+            'title': 'ID Voyance Île-de-France - 2020/03/13 - partie 3 sur le replay IDF1 - IDF1',
+            'description': '"Isabelle et nos voyants en direct tous les vendredis d&egrave;s 20h50 sur IDF1 pour l\'&eacute;mission ID Voyance &Icirc;le-de-France."',
+            'url': 'https://player.dacast.com/js/player.js?contentId=15863_f_827665',
+        },
+    }]
+
+    def _real_extract(self, url):
+        """Scrape the title, description and player script URL from the page.
+
+        Returns an info dict with ``id``, ``title``, ``description`` and
+        ``url``.  Raises ExtractorError when the ``src`` of the matched
+        ``<script>`` tag is not a usable URL.
+        """
+        video_id = self._match_id(url)
+        webpage = self._download_webpage(url, video_id)
+        # The page <title> doubles as the video title; a placeholder is used
+        # when the tag is missing so extraction does not fail on it.
+        title = self._html_search_regex(
+            r'<title[^>]*>(.+?)</title>', webpage, 'title',
+            default='(no title available)')
+        # The capture starts right after ``content=`` and runs up to ``/>``,
+        # so the attribute's surrounding quotes remain part of the value (the
+        # expected descriptions in _TESTS include them).
+        description = self._html_search_regex(
+            r'<meta[^>]*\sname=["\']description["\'][^>]*\scontent=(.+?)/>',
+            webpage, 'description', fatal=False)
+        # Take the ``src`` of the first ``<script src=...></script>`` tag and
+        # drop the double quotes around the attribute value.
+        dacast_link = self._html_search_regex(
+            r'<script\ssrc=([^\>]+)></script>', webpage, 'link')
+        dacast_link = url_or_none(dacast_link.replace('"', ''))
+        if not dacast_link:
+            # Fail with a clear extractor error instead of handing back a
+            # result whose 'url' is None.
+            raise ExtractorError('Unable to extract a valid player URL')
+        return {
+            'id': video_id,
+            'title': title,
+            'description': description,
+            'url': dacast_link,
+        }