1
mirror of https://github.com/yt-dlp/yt-dlp synced 2024-12-11 04:43:55 +01:00
yt-dlp/yt_dlp/extractor/daystar.py
Ha Tien Loi 761fba6d22
[daystar] Add extractor (#2924)
Closes #2887
Authored by: hatienl0i261299
2022-03-04 03:19:57 -08:00

49 lines
2.0 KiB
Python

from .common import InfoExtractor
from ..utils import js_to_json, urljoin
class DaystarClipIE(InfoExtractor):
    """Extractor for single clips served from player.daystar.tv."""

    IE_NAME = 'daystar:clip'
    _VALID_URL = r'https?://player\.daystar\.tv/(?P<id>\w+)'
    _TESTS = [{
        'url': 'https://player.daystar.tv/0MTO2ITM',
        'info_dict': {
            'id': '0MTO2ITM',
            'ext': 'mp4',
            'title': 'The Dark World of COVID Pt. 1 | Aaron Siri',
            # NOTE(review): this value looks like an MD5 digest; if so it
            # presumably needs an 'md5:' prefix to be compared as a hash
            # rather than as the literal description text - confirm.
            'description': 'a420d320dda734e5f29458df3606c5f4',
            'thumbnail': r're:^https?://.+\.jpg',
        },
    }]

    def _real_extract(self, url):
        """Build the info dict for the clip at *url*.

        The clip page is fetched for its title/description meta tags and for
        the URL of the embedded player iframe. A second page, derived from
        the iframe URL, supplies the list of sources and the thumbnail.

        Returns a dict with 'id', 'title', 'description', 'thumbnail',
        'formats' and 'subtitles'. A missing iframe or sources list is fatal;
        a missing thumbnail is not.
        """
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        # The clip page wraps the real player in an iframe.
        src_iframe = self._search_regex(
            r'\<iframe[^>]+src="([^"]+)"', webpage, 'src iframe')

        # Same URL with config2.php in place of player.php; the iframe URL is
        # sent as Referer on this request and on the manifest requests below.
        referer_headers = {'Referer': src_iframe}
        webpage_iframe = self._download_webpage(
            src_iframe.replace('player.php', 'config2.php'), video_id,
            headers=referer_headers)

        # `sources` is a JavaScript array literal, hence js_to_json.
        sources = self._parse_json(
            self._search_regex(
                r'sources\:\s*(\[.*?\])', webpage_iframe, 'm3u8 source'),
            video_id, transform_source=js_to_json)

        formats, subtitles = [], {}
        for source in sources:
            manifest_path = source.get('file')
            # Only HLS entries that actually carry a file are usable here.
            if not manifest_path or source.get('type') != 'm3u8':
                continue
            # urljoin resolves `file` against the lightcast embed base URL.
            fmts, subs = self._extract_m3u8_formats_and_subtitles(
                urljoin('https://www.lightcast.com/embed/', manifest_path),
                video_id, 'mp4', fatal=False, headers=referer_headers)
            formats.extend(fmts)
            subtitles = self._merge_subtitles(subtitles, subs)
        self._sort_formats(formats)

        return {
            'id': video_id,
            'title': self._html_search_meta(['og:title', 'twitter:title'], webpage),
            'description': self._html_search_meta(['og:description', 'twitter:description'], webpage),
            # The thumbnail is optional metadata: do not abort the whole
            # extraction when the `image:` entry is absent.
            'thumbnail': self._search_regex(
                r'image:\s*"([^"]+)', webpage_iframe, 'thumbnail', fatal=False),
            'formats': formats,
            'subtitles': subtitles,
        }