yt-dlp/yt_dlp/extractor/doodstream.py

import string
import random
import time

from .common import InfoExtractor


class DoodStreamIE(InfoExtractor):
    # Matches embed (/e/) and download (/d/) pages on the dood.to, dood.watch,
    # dood.so and dood.pm hosts; the lowercase alphanumeric path segment is
    # captured as the video id.
    _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch|so|pm)/[ed]/(?P<id>[a-z0-9]+)'
    _TESTS = [{
        # Embed-style URL
        'url': 'http://dood.to/e/5s1wmbdacezb',
        'md5': '4568b83b31e13242b3f1ff96c55f0595',
        'info_dict': {
            'id': '5s1wmbdacezb',
            'ext': 'mp4',
            'title': 'Kat Wonders - Monthly May 2020',
            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
        },
    }, {
        # Same video through the download-style path on another host
        'url': 'http://dood.watch/d/5s1wmbdacezb',
        'md5': '4568b83b31e13242b3f1ff96c55f0595',
        'info_dict': {
            'id': '5s1wmbdacezb',
            'ext': 'mp4',
            'title': 'Kat Wonders - Monthly May 2020',
            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
        },
    }, {
        'url': 'https://dood.to/d/jzrxn12t2s7n',
        'md5': '3207e199426eca7c2aa23c2872e6728a',
        'info_dict': {
            'id': 'jzrxn12t2s7n',
            'ext': 'mp4',
            'title': 'Stacy Cruz Cute ALLWAYSWELL',
            'description': 'Stacy Cruz Cute ALLWAYSWELL | DoodStream.com',
            'thumbnail': 'https://img.doodcdn.com/snaps/8edqd5nppkac3x8u.jpg',
        },
    }, {
        'url': 'https://dood.so/d/jzrxn12t2s7n',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return the info dict for the video referenced by ``url``.

        Whatever host or path style ``url`` uses, the page that is actually
        downloaded is ``https://dood.to/e/<id>``. The title, thumbnail and
        description are read from that page's meta tags, and the media URL
        is assembled from the body returned by the page's ``/pass_md5...``
        endpoint, ten random alphanumeric characters, the page token and a
        millisecond timestamp.
        """
        video_id = self._match_id(url)
        embed_url = f'https://dood.to/e/{video_id}'
        webpage = self._download_webpage(embed_url, video_id)

        # Prefer the social meta tags for the title; fall back to <title>.
        title = self._html_search_meta(
            ('og:title', 'twitter:title'), webpage, default=None)
        if not title:
            title = self._html_extract_title(webpage)

        thumbnail = self._html_search_meta(
            ['og:image', 'twitter:image'], webpage, default=None)
        token = self._html_search_regex(
            r'[?&]token=([a-z0-9]+)[&\']', webpage, 'token')
        description = self._html_search_meta(
            ['og:description', 'description', 'twitter:description'],
            webpage, default=None)

        # The same headers are sent to the pass_md5 endpoint and handed back
        # in the result as 'http_headers'.
        request_headers = {
            'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',
            'referer': embed_url,
        }

        pass_md5_path = self._html_search_regex(
            r'(/pass_md5.*?)\'', webpage, 'pass_md5')

        # Order matters here: fetch the URL prefix first, then draw the random
        # characters, then take the timestamp.
        media_url_prefix = self._download_webpage(
            f'https://dood.to{pass_md5_path}', video_id, headers=request_headers)
        alphabet = string.ascii_letters + string.digits
        random_suffix = ''.join(random.choice(alphabet) for _ in range(10))
        expiry_ms = int(time.time() * 1000)
        query = f'?token={token}&expiry={expiry_ms}'
        final_url = ''.join((media_url_prefix, random_suffix, query))

        info = {
            'id': video_id,
            'title': title,
            'url': final_url,
            'http_headers': request_headers,
            'ext': 'mp4',
            'description': description,
            'thumbnail': thumbnail,
        }
        return info
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`import string`
			`import random`
			`import time`

			`from .common import InfoExtractor`


			`class DoodStreamIE(InfoExtractor):`
[extractor/doodstream] Support more domains (#4493) Authored by: Galiley 2022-07-30 08:06:58 -04:00			`_VALID_URL = r'https?://(?:www\.)?dood\.(?:to\|watch\|so\|pm)/[ed]/(?P<id>[a-z0-9]+)'`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`_TESTS = [{`
			`'url': 'http://dood.to/e/5s1wmbdacezb',`
			`'md5': '4568b83b31e13242b3f1ff96c55f0595',`
			`'info_dict': {`
			`'id': '5s1wmbdacezb',`
			`'ext': 'mp4',`
			`'title': 'Kat Wonders - Monthly May 2020',`
			`'description': 'Kat Wonders - Monthly May 2020 \| DoodStream.com',`
			`'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',`
			`}`
[doodstream] Fix extractor Closes #2584 2022-02-01 20:09:46 -05:00			`}, {`
			`'url': 'http://dood.watch/d/5s1wmbdacezb',`
			`'md5': '4568b83b31e13242b3f1ff96c55f0595',`
			`'info_dict': {`
			`'id': '5s1wmbdacezb',`
			`'ext': 'mp4',`
			`'title': 'Kat Wonders - Monthly May 2020',`
			`'description': 'Kat Wonders - Monthly May 2020 \| DoodStream.com',`
			`'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',`
			`}`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`}, {`
			`'url': 'https://dood.to/d/jzrxn12t2s7n',`
			`'md5': '3207e199426eca7c2aa23c2872e6728a',`
			`'info_dict': {`
			`'id': 'jzrxn12t2s7n',`
			`'ext': 'mp4',`
			`'title': 'Stacy Cruz Cute ALLWAYSWELL',`
			`'description': 'Stacy Cruz Cute ALLWAYSWELL \| DoodStream.com',`
			`'thumbnail': 'https://img.doodcdn.com/snaps/8edqd5nppkac3x8u.jpg',`
			`}`
[extractor/doodstream] Support more domains (#4493) Authored by: Galiley 2022-07-30 08:06:58 -04:00			`}, {`
			`'url': 'https://dood.so/d/jzrxn12t2s7n',`
			`'only_matching': True`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`}]`

			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`
[doodstream] Fix extractor Closes #2584 2022-02-01 20:09:46 -05:00			`url = f'https://dood.to/e/{video_id}'`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`webpage = self._download_webpage(url, video_id)`

[extractor/doodstream] Support more domains (#4493) Authored by: Galiley 2022-07-30 08:06:58 -04:00			`title = self._html_search_meta(`
			`('og:title', 'twitter:title'), webpage, default=None) or self._html_extract_title(webpage)`
[doodstream] Fix extractor Closes #2584 2022-02-01 20:09:46 -05:00			`thumb = self._html_search_meta(['og:image', 'twitter:image'], webpage, default=None)`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00			`token = self._html_search_regex(r'[?&]token=([a-z0-9]+)[&\']', webpage, 'token')`
Styling changes 2020-08-17 11:07:22 -04:00			`description = self._html_search_meta(`
[doodstream] Fix extractor Closes #2584 2022-02-01 20:09:46 -05:00			`['og:description', 'description', 'twitter:description'], webpage, default=None)`

Styling changes 2020-08-17 11:07:22 -04:00			`headers = {`
[doodstream] flake8 compliance 2020-08-17 18:12:14 -04:00			`'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',`
Styling changes 2020-08-17 11:07:22 -04:00			`'referer': url`
			`}`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00
[doodstream] Fix extractor Closes #2584 2022-02-01 20:09:46 -05:00			`pass_md5 = self._html_search_regex(r'(/pass_md5.*?)\'', webpage, 'pass_md5')`
			`final_url = ''.join((`
			`self._download_webpage(f'https://dood.to{pass_md5}', video_id, headers=headers),`
			`*(random.choice(string.ascii_letters + string.digits) for _ in range(10)),`
			`f'?token={token}&expiry={int(time.time() * 1000)}',`
			`))`
[doodstream] new extractor 2020-08-16 09:40:59 -04:00
			`return {`
			`'id': video_id,`
			`'title': title,`
			`'url': final_url,`
			`'http_headers': headers,`
			`'ext': 'mp4',`
			`'description': description,`
			`'thumbnail': thumb,`
			`}`