1
mirror of https://github.com/yt-dlp/yt-dlp synced 2025-01-06 16:46:25 +01:00
yt-dlp/youtube_dl/extractor/anitube.py

60 lines
1.7 KiB
Python
Raw Normal View History

2014-07-02 14:24:01 +02:00
from __future__ import unicode_literals
2013-11-16 15:26:34 +01:00
import re
from .common import InfoExtractor
class AnitubeIE(InfoExtractor):
    """Extractor for videos hosted on anitube.se.

    The watch page embeds a player whose URL carries a key; that key is
    used to fetch an XML configuration document from which the title,
    thumbnail, duration and the media URLs are read.
    """

    IE_NAME = 'anitube.se'

    _VALID_URL = r'https?://(?:www\.)?anitube\.se/video/(?P<id>\d+)'

    _TEST = {
        'url': 'http://www.anitube.se/video/36621',
        'md5': '59d0eeae28ea0bc8c05e7af429998d43',
        'info_dict': {
            'id': '36621',
            'ext': 'mp4',
            'title': 'Recorder to Randoseru 01',
            'duration': 180.19,
        },
        'skip': 'Blocked in the US',
    }

    # (XML element name, format_id) pairs, in the order the formats are
    # emitted: 'sd' first, then 'hd'.
    _FORMAT_ELEMENTS = (
        ('file', 'sd'),
        ('filehd', 'hd'),
    )

    def _real_extract(self, url):
        """Build the info dict for the video page at ``url``.

        Returns a dict with the keys ``id``, ``title``, ``thumbnail``,
        ``duration`` and ``formats``.  ``thumbnail`` and ``duration`` are
        ``None`` when the configuration document does not provide a usable
        value; ``formats`` holds one entry per non-empty media URL found.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        webpage = self._download_webpage(url, video_id)

        # '+' rather than '*': an empty key would only lead to a pointless
        # request for 'econfig.php?key=' further down.
        key = self._html_search_regex(
            r'http://www\.anitube\.se/embed/([A-Za-z0-9_-]+)', webpage, 'key')

        # config_xml is accessed through the ElementTree-style
        # find()/findtext() API below.
        config_xml = self._download_xml(
            'http://www.anitube.se/nuevo/econfig.php?key=%s' % key, key)

        # The title is mandatory, so a missing <title> element is allowed to
        # fail loudly here exactly as before.
        video_title = config_xml.find('title').text

        # Thumbnail and duration are optional metadata: a missing or
        # malformed element must not abort the whole extraction.
        thumbnail = config_xml.findtext('image') or None
        try:
            duration = float(config_xml.findtext('duration'))
        except (TypeError, ValueError):
            # TypeError: element absent (findtext returned None);
            # ValueError: element empty or not a number.
            duration = None

        formats = []
        for element_name, format_id in self._FORMAT_ELEMENTS:
            video_url = config_xml.findtext(element_name)
            if not video_url:
                # Element missing or present without a URL: skip it instead
                # of emitting a format whose 'url' is None.
                continue
            formats.append({
                'format_id': format_id,
                'url': video_url,
            })

        return {
            'id': video_id,
            'title': video_title,
            'thumbnail': thumbnail,
            'duration': duration,
            'formats': formats,
        }