haruhi-dl/youtube_dl/extractor/dctp.py

# coding: utf-8
from __future__ import unicode_literals

from .common import InfoExtractor
from ..utils import unified_strdate


class DctpTvIE(InfoExtractor):
    """Information extractor for film pages under ``dctp.tv/filme/``.

    The film page supplies the metadata (Dublin Core and Open Graph meta
    tags) together with the path of an HLS playlist; the host serving that
    playlist is obtained from a separate JSON endpoint.
    """

    _VALID_URL = r'https?://(?:www\.)?dctp\.tv/(#/)?filme/(?P<id>.+?)/$'
    _TEST = {
        'url': 'http://www.dctp.tv/filme/videoinstallation-fuer-eine-kaufhausfassade/',
        'md5': '174dd4a8a6225cf5655952f969cfbe24',
        'info_dict': {
            'id': '95eaa4f33dad413aa17b4ee613cccc6c',
            'display_id': 'videoinstallation-fuer-eine-kaufhausfassade',
            'ext': 'mp4',
            'title': 'Videoinstallation für eine Kaufhausfassade',
            'description': 'Kurzfilm',
            'upload_date': '20110407',
            'thumbnail': r're:^https?://.*\.jpg$',
        },
    }

    def _real_extract(self, url):
        """Build the info dict for the film page at ``url``.

        The URL slug captured by ``_VALID_URL`` is reported as
        ``display_id``; the ``id`` field is taken from the page's
        ``DC.identifier`` meta tag.
        """
        slug = self._match_id(url)
        page = self._download_webpage(url, slug)

        def dublin_core(name):
            # Shorthand for reading a single meta tag from the film page.
            return self._html_search_meta(name, page)

        film_id = dublin_core('DC.identifier')

        # The page only carries the playlist path; the host is taken from
        # the first entry of the streaming server list.
        server_list = self._download_json(
            'http://www.dctp.tv/elastic_streaming_client/get_streaming_server/',
            slug, note='Downloading server list')
        streaming_host = server_list[0]['server']
        playlist_path = self._search_regex(
            r'\'([^\'"]+/playlist\.m3u8)"', page, 'm3u8 path')
        playlist_url = 'http://%s%s' % (streaming_host, playlist_path)
        hls_formats = self._extract_m3u8_formats(
            playlist_url, slug, ext='mp4', entry_protocol='m3u8_native')

        film_title = self._og_search_title(page)
        film_description = dublin_core('DC.description')
        created_on = dublin_core('DC.date.created')
        film_upload_date = unified_strdate(created_on)
        film_thumbnail = self._og_search_thumbnail(page)

        return {
            'id': film_id,
            'title': film_title,
            'formats': hls_formats,
            'display_id': slug,
            'description': film_description,
            'upload_date': film_upload_date,
            'thumbnail': film_thumbnail,
        }
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`# coding: utf-8`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00			`from __future__ import unicode_literals`

			`from .common import InfoExtractor`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`from ..utils import unified_strdate`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00
added test for dctp 2015-01-28 08:59:58 +01:00
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00			`class DctpTvIE(InfoExtractor):`
Improve some _VALID_URLs 2016-09-08 13:29:05 +02:00			`_VALID_URL = r'https?://(?:www\.)?dctp\.tv/(#/)?filme/(?P<id>.+?)/$'`
added test for dctp 2015-01-28 08:59:58 +01:00			`_TEST = {`
			`'url': 'http://www.dctp.tv/filme/videoinstallation-fuer-eine-kaufhausfassade/',`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`'md5': '174dd4a8a6225cf5655952f969cfbe24',`
added test for dctp 2015-01-28 08:59:58 +01:00			`'info_dict': {`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`'id': '95eaa4f33dad413aa17b4ee613cccc6c',`
[dctp] fix test 2015-01-30 00:35:53 +01:00			`'display_id': 'videoinstallation-fuer-eine-kaufhausfassade',`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`'ext': 'mp4',`
			`'title': 'Videoinstallation für eine Kaufhausfassade',`
			`'description': 'Kurzfilm',`
			`'upload_date': '20110407',`
Fix "invalid escape sequences" error on Python 3.6 2017-01-02 13:08:07 +01:00			`'thumbnail': r're:^https?://.*\.jpg$',`
[dctptv] Skip rtmp download 2015-02-11 17:10:33 +01:00			`},`
[dctp] PEP8 2015-01-30 03:45:06 +01:00			`}`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00
			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`webpage = self._download_webpage(url, video_id)`

			`object_id = self._html_search_meta('DC.identifier', webpage)`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00
[dctp] Improve output (#4796) 2015-01-30 03:15:34 +01:00			`servers_json = self._download_json(`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`'http://www.dctp.tv/elastic_streaming_client/get_streaming_server/',`
[dctp] Improve output (#4796) 2015-01-30 03:15:34 +01:00			`video_id, note='Downloading server list')`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`server = servers_json[0]['server']`
			`m3u8_path = self._search_regex(`
			`r'\'([^\'"]+/playlist\.m3u8)"', webpage, 'm3u8 path')`
			`formats = self._extract_m3u8_formats(`
			`'http://%s%s' % (server, m3u8_path), video_id, ext='mp4',`
			`entry_protocol='m3u8_native')`

			`title = self._og_search_title(webpage)`
			`description = self._html_search_meta('DC.description', webpage)`
			`upload_date = unified_strdate(`
			`self._html_search_meta('DC.date.created', webpage))`
			`thumbnail = self._og_search_thumbnail(webpage)`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00
			`return {`
[dctp] follow id conventions 2015-01-29 23:34:56 +01:00			`'id': object_id,`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00			`'title': title,`
[dctp] Fix extraction (closes #10734) 2016-10-01 09:22:48 +02:00			`'formats': formats,`
			`'display_id': video_id,`
			`'description': description,`
			`'upload_date': upload_date,`
			`'thumbnail': thumbnail,`
added extractor for dctp.tv 2015-01-28 08:21:04 +01:00			`}`