From 3687a4f9bdb025855acd2a4e782748c8e3810765 Mon Sep 17 00:00:00 2001
From: dirkf <fieldhouse@gmx.net>
Date: Sat, 4 Jun 2022 08:07:54 +0100
Subject: [PATCH 1/5] [DoodStream] Add extractor back-ported from yt-dlp,
 with improvements

---
 youtube_dl/extractor/doodstream.py | 119 +++++++++++++++++++++++++++++
 youtube_dl/extractor/extractors.py |   1 +
 2 files changed, 120 insertions(+)
 create mode 100644 youtube_dl/extractor/doodstream.py
diff --git a/youtube_dl/extractor/doodstream.py b/youtube_dl/extractor/doodstream.py
new file mode 100644
index 000000000..70bf4e512
--- /dev/null
+++ b/youtube_dl/extractor/doodstream.py
@@ -0,0 +1,119 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+import random
+import string
+import time
+
+from ..compat import compat_filter as filter
+from ..utils import (
+    clean_html,
+    ExtractorError,
+    get_element_by_class,
+    parse_duration,
+    parse_filesize,
+    update_url_query,
+    unified_strdate,
+    url_or_none,
+)
+
+from .common import InfoExtractor
+
+
+class DoodStreamIE(InfoExtractor):
+    _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch)/[ed]/(?P<id>[a-z0-9]+)'
+    _TESTS = [{
+        'url': 'http://dood.to/e/5s1wmbdacezb',
+        'md5': '4568b83b31e13242b3f1ff96c55f0595',
+        'info_dict': {
+            'id': '5s1wmbdacezb',
+            'ext': 'mp4',
+            'title': 'Kat Wonders - Monthly May 2020',
+            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
+            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
+        },
+        'skip': 'Video not found',
+    }, {
+        'url': 'http://dood.watch/d/5s1wmbdacezb',
+        'md5': '4568b83b31e13242b3f1ff96c55f0595',
+        'info_dict': {
+            'id': '5s1wmbdacezb',
+            'ext': 'mp4',
+            'title': 'Kat Wonders - Monthly May 2020',
+            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
+            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
+        },
+        'skip': 'Video not found',
+    }, {
+        'url': 'https://dood.to/d/jzrxn12t2s7n',
+        'md5': '3207e199426eca7c2aa23c2872e6728a',
+        'info_dict': {
+            'id': 'jzrxn12t2s7n',
+            'ext': 'mp4',
+            'title': 'Stacy Cruz Cute ALLWAYSWELL',
+            'description': 'Stacy Cruz Cute ALLWAYSWELL | DoodStream.com',
+            'thumbnail': 'https://img.doodcdn.com/snaps/8edqd5nppkac3x8u.jpg',
+        },
+        'skip': 'Video not found',
+    }, {
+        'url': 'https://dood.to/d/is34uy8wvaet',
+        'md5': '04740d3ba93bcd638aa7a097d9226710',
+        'info_dict': {
+            'id': 'is34uy8wvaet',
+            'ext': 'mp4',
+            'title': 'Akhanda (2021) Telugu DVDScr MP3 700MB - DoodStream',
+            'upload_date': '20211202',
+            'filesize_approx': int,
+            'duration': 9886,
+        }
+    }]
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+        url = 'https://dood.to/e/' + video_id
+        headers = {
+            'User-Agent': 'Mozilla/5.0',  # (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',
+        }
+        webpage = self._download_webpage(url, video_id, headers=headers)
+
+        title = self._html_search_meta(('og:title', 'twitter:title'), webpage, default=None)
+        if not title:
+            title = self._html_search_regex(r'<title\b[^>]*>([^<]+?)(?:\|\s+DoodStream\s*)?</title', webpage, 'title')
+            if title == 'Video not found':
+                raise ExtractorError(title, expected=True)
+        token = self._html_search_regex(r'''[?&]token=([a-z0-9]+)[&']''', webpage, 'token')
+
+        headers.update({
+            # 'User-Agent': 'Mozilla/5.0',  # (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',
+            'referer': url
+        })
+
+        pass_md5 = self._html_search_regex(r'(/pass_md5.*?)\'', webpage, 'pass_md5')
+        final_url = (
+            self._download_webpage('https://dood.to' + pass_md5, video_id, headers=headers, note='Downloading final URL')
+            + ''.join((random.choice(string.ascii_letters + string.digits) for _ in range(10)))
+        )
+        final_url = update_url_query(final_url, {'token': token, 'expiry': int(time.time() * 1000), })
+
+        thumb = next(filter(None, (url_or_none(self._html_search_meta(x, webpage, default=None))
+                                   for x in ('og:image', 'twitter:image'))), None)
+        description = self._html_search_meta(
+            ('og:description', 'description', 'twitter:description'), webpage, default=None)
+
+        webpage = self._download_webpage('https://dood.to/d/' + video_id, video_id, headers=headers, fatal=False)
+
+        def get_class_text(x):
+            return clean_html(get_element_by_class(x, webpage))
+
+        return {
+            'id': video_id,
+            'title': title,
+            'url': final_url,
+            'http_headers': headers,
+            'ext': 'mp4',
+            'upload_date': unified_strdate(get_class_text('uploadate')),
+            'duration': parse_duration(get_class_text('length')),
+            'filesize_approx': parse_filesize(get_class_text('size')),
+            'description': description,
+            'thumbnail': thumb,
+        }
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index 452caeade..3d1d9375e 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -299,6 +299,7 @@ from .democracynow import DemocracynowIE
 from .dfb import DFBIE
 from .dhm import DHMIE
 from .digg import DiggIE
+from .doodstream import DoodStreamIE
 from .dotsub import DotsubIE
 from .douyutv import (
     DouyuShowIE,

From 9dd91758aea6b3427662cac1efde1c5b5c1de6c3 Mon Sep 17 00:00:00 2001
From: dirkf <fieldhouse@gmx.net>
Date: Sat, 4 Jun 2022 09:26:41 +0100
Subject: [PATCH 2/5] [DoodStream] Support more TLDs; also fix title
 extraction

---
 youtube_dl/extractor/doodstream.py | 35 +++++++++++++++++++++++-------
 1 file changed, 27 insertions(+), 8 deletions(-)

diff --git a/youtube_dl/extractor/doodstream.py b/youtube_dl/extractor/doodstream.py
index 70bf4e512..94411ebb0 100644
--- a/youtube_dl/extractor/doodstream.py
+++ b/youtube_dl/extractor/doodstream.py
@@ -21,7 +21,7 @@ from .common import InfoExtractor
 
 
 class DoodStreamIE(InfoExtractor):
-    _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch)/[ed]/(?P<id>[a-z0-9]+)'
+    _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch|so|la|pm|sh|ws|one)/[ed]/(?P<id>[a-z0-9]+)'
     _TESTS = [{
         'url': 'http://dood.to/e/5s1wmbdacezb',
         'md5': '4568b83b31e13242b3f1ff96c55f0595',
@@ -61,11 +61,24 @@ class DoodStreamIE(InfoExtractor):
         'info_dict': {
             'id': 'is34uy8wvaet',
             'ext': 'mp4',
-            'title': 'Akhanda (2021) Telugu DVDScr MP3 700MB - DoodStream',
+            'title': 'Akhanda (2021) Telugu DVDScr MP3 700MB',
             'upload_date': '20211202',
+            'thumbnail': r're:https?://img\.doodcdn\.com?/[\w/]+\.jpg',
             'filesize_approx': int,
             'duration': 9886,
         }
+    }, {
+        'url': 'https://dood.so/d/wlihoael8uog',
+        'md5': '2c14444c89788cc309738c1560abe278',
+        'info_dict': {
+            'id': 'wlihoael8uog',
+            'ext': 'mp4',
+            'title': 'VID 20220319 161659',
+            'thumbnail': r're:https?://img\.doodcdn\.com?/splash/rmpnhb8ckkk79cge\.jpg',
+            'upload_date': '20220319',
+            'filesize_approx': int,
+            'duration': 12.0,
+        }
     }]
 
     def _real_extract(self, url):
@@ -76,11 +89,12 @@ class DoodStreamIE(InfoExtractor):
         }
         webpage = self._download_webpage(url, video_id, headers=headers)
 
-        title = self._html_search_meta(('og:title', 'twitter:title'), webpage, default=None)
-        if not title:
-            title = self._html_search_regex(r'<title\b[^>]*>([^<]+?)(?:\|\s+DoodStream\s*)?</title', webpage, 'title')
-            if title == 'Video not found':
-                raise ExtractorError(title, expected=True)
+        def get_title(html, fatal=False):
+            return self._html_search_regex(r'<title\b[^>]*>([^<]+?)(?:[|-]\s+DoodStream\s*)?</title', html, 'title', fatal=fatal)
+
+        title = get_title(webpage)
+        if title == 'Video not found':
+            raise ExtractorError(title, expected=True)
         token = self._html_search_regex(r'''[?&]token=([a-z0-9]+)[&']''', webpage, 'token')
 
         headers.update({
@@ -100,7 +114,12 @@ class DoodStreamIE(InfoExtractor):
         description = self._html_search_meta(
             ('og:description', 'description', 'twitter:description'), webpage, default=None)
 
-        webpage = self._download_webpage('https://dood.to/d/' + video_id, video_id, headers=headers, fatal=False)
+        webpage = self._download_webpage('https://dood.to/d/' + video_id, video_id, headers=headers, fatal=False) or ''
+
+        title = (
+            self._html_search_meta(('og:title', 'twitter:title'), webpage, default=None)
+            or get_title(webpage, fatal=(title is None))  # fatal only when the "/e/" page gave no title to fall back on
+            or title)
 
         def get_class_text(x):
             return clean_html(get_element_by_class(x, webpage))

From ab9ad567d8d1fe15be74b1eaf176cab3211aa343 Mon Sep 17 00:00:00 2001
From: dirkf <fieldhouse@gmx.net>
Date: Fri, 29 Nov 2024 14:11:41 +0000
Subject: [PATCH 3/5] Incorporate changes from PR #32979

* update tests
* send `Referer` when fetching media link

Co-authored-by: mp3butcher <julienvalentin51@gmail.com>
---
 youtube_dl/extractor/doodstream.py | 87 ++++++++++++++----------------
 1 file changed, 40 insertions(+), 47 deletions(-)

diff --git a/youtube_dl/extractor/doodstream.py b/youtube_dl/extractor/doodstream.py
index 94411ebb0..8dd54a0ab 100644
--- a/youtube_dl/extractor/doodstream.py
+++ b/youtube_dl/extractor/doodstream.py
@@ -1,9 +1,9 @@
 # coding: utf-8
 from __future__ import unicode_literals
 
-import random
-import string
-import time
+from random import choice as random_choice
+from string import ascii_letters, digits
+from time import time as time_time
 
 from ..compat import compat_filter as filter
 from ..utils import (
@@ -21,40 +21,20 @@ from .common import InfoExtractor
 
 
 class DoodStreamIE(InfoExtractor):
-    _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch|so|la|pm|sh|ws|one)/[ed]/(?P<id>[a-z0-9]+)'
+    # dood.* redirects
+    # .watch -> .re (but HEAD request fails in GenericIE)
+    # .so -> .li
+    _VALID_URL = r'https?://(?:www\.)?(?P<host>dood\.(?:to|la|li|pm|re|sh|watch|ws|one)|ds2play\.com)/[ed]/(?P<id>[a-z\d]+)'
     _TESTS = [{
-        'url': 'http://dood.to/e/5s1wmbdacezb',
-        'md5': '4568b83b31e13242b3f1ff96c55f0595',
+        'url': 'https://dood.li/e/h7ecgw5oqn8k',
+        'md5': '90f2af170551c17fc78bee7426890054',
         'info_dict': {
-            'id': '5s1wmbdacezb',
+            'id': 'h7ecgw5oqn8k',
             'ext': 'mp4',
-            'title': 'Kat Wonders - Monthly May 2020',
-            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
-            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
+            'title': 'Free-Slow-Music',
+            'upload_date': '20230814',
+            'thumbnail': 'https://img.doodcdn.co/splash/7mbnwydhb6kb7xyk.jpg',
         },
-        'skip': 'Video not found',
-    }, {
-        'url': 'http://dood.watch/d/5s1wmbdacezb',
-        'md5': '4568b83b31e13242b3f1ff96c55f0595',
-        'info_dict': {
-            'id': '5s1wmbdacezb',
-            'ext': 'mp4',
-            'title': 'Kat Wonders - Monthly May 2020',
-            'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com',
-            'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg',
-        },
-        'skip': 'Video not found',
-    }, {
-        'url': 'https://dood.to/d/jzrxn12t2s7n',
-        'md5': '3207e199426eca7c2aa23c2872e6728a',
-        'info_dict': {
-            'id': 'jzrxn12t2s7n',
-            'ext': 'mp4',
-            'title': 'Stacy Cruz Cute ALLWAYSWELL',
-            'description': 'Stacy Cruz Cute ALLWAYSWELL | DoodStream.com',
-            'thumbnail': 'https://img.doodcdn.com/snaps/8edqd5nppkac3x8u.jpg',
-        },
-        'skip': 'Video not found',
     }, {
         'url': 'https://dood.to/d/is34uy8wvaet',
         'md5': '04740d3ba93bcd638aa7a097d9226710',
@@ -66,9 +46,10 @@ class DoodStreamIE(InfoExtractor):
             'thumbnail': r're:https?://img\.doodcdn\.com?/[\w/]+\.jpg',
             'filesize_approx': int,
             'duration': 9886,
-        }
+        },
+        'skip': 'Video not found',
     }, {
-        'url': 'https://dood.so/d/wlihoael8uog',
+        'url': 'https://dood.sh/d/wlihoael8uog',
         'md5': '2c14444c89788cc309738c1560abe278',
         'info_dict': {
             'id': 'wlihoael8uog',
@@ -78,16 +59,20 @@ class DoodStreamIE(InfoExtractor):
             'upload_date': '20220319',
             'filesize_approx': int,
             'duration': 12.0,
-        }
+        },
+    }, {
+        'url': 'http://dood.ws /d/h7ecgw5oqn8k',
+        'only_matching': True,
+    }, {
+        'url': 'https://dood.li/d/wlihoael8uog',
+        'only_matching': True,
     }]
 
     def _real_extract(self, url):
         video_id = self._match_id(url)
-        url = 'https://dood.to/e/' + video_id
-        headers = {
-            'User-Agent': 'Mozilla/5.0',  # (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',
-        }
-        webpage = self._download_webpage(url, video_id, headers=headers)
+        host = 'dood.li'
+        url = 'https://%s/e/%s' % (host, video_id)
+        webpage = self._download_webpage(url, video_id, note='Downloading "/e/" webpage')
 
         def get_title(html, fatal=False):
             return self._html_search_regex(r'<title\b[^>]*>([^<]+?)(?:[|-]\s+DoodStream\s*)?</title', html, 'title', fatal=fatal)
@@ -103,18 +88,26 @@ class DoodStreamIE(InfoExtractor):
         })
 
         pass_md5 = self._html_search_regex(r'(/pass_md5.*?)\'', webpage, 'pass_md5')
-        final_url = (
-            self._download_webpage('https://dood.to' + pass_md5, video_id, headers=headers, note='Downloading final URL')
-            + ''.join((random.choice(string.ascii_letters + string.digits) for _ in range(10)))
-        )
-        final_url = update_url_query(final_url, {'token': token, 'expiry': int(time.time() * 1000), })
+        # construct the media link
+        final_url = self._download_webpage(
+            'https://%s/%s' % (host, pass_md5), video_id, headers={
+                'Referer': url,
+            }, note='Downloading authpage URL')
+        final_url += ''.join((random_choice(ascii_letters + digits)
+                                        for _ in range(10)))
+        final_url = update_url_query(final_url, {
+            'token': token,
+            'expiry': int(time_time() * 1000),
+        })
 
         thumb = next(filter(None, (url_or_none(self._html_search_meta(x, webpage, default=None))
                                    for x in ('og:image', 'twitter:image'))), None)
         description = self._html_search_meta(
             ('og:description', 'description', 'twitter:description'), webpage, default=None)
 
-        webpage = self._download_webpage('https://dood.to/d/' + video_id, video_id, headers=headers, fatal=False) or ''
+        webpage = self._download_webpage(
+            'https://%s/d/%s' % (host, video_id), video_id, fatal=False,
+            note='Downloading alternative "/d/" page') or ''
 
         title = (
             self._html_search_meta(('og:title', 'twitter:title'), webpage, default=None)

From 98e6231a255b3f5751f9553d0f2283ccb1d2ae82 Mon Sep 17 00:00:00 2001
From: dirkf <fieldhouse@gmx.net>
Date: Fri, 29 Nov 2024 14:17:10 +0000
Subject: [PATCH 4/5] Further small improvements

---
 youtube_dl/extractor/doodstream.py | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/youtube_dl/extractor/doodstream.py b/youtube_dl/extractor/doodstream.py
index 8dd54a0ab..0d3271186 100644
--- a/youtube_dl/extractor/doodstream.py
+++ b/youtube_dl/extractor/doodstream.py
@@ -78,16 +78,16 @@ class DoodStreamIE(InfoExtractor):
             return self._html_search_regex(r'<title\b[^>]*>([^<]+?)(?:[|-]\s+DoodStream\s*)?</title', html, 'title', fatal=fatal)
 
         title = get_title(webpage)
-        if title == 'Video not found':
+        if title == 'Video not found' or (
+                title == '' and 'Not Found' == self._html_search_regex(r'<h1\b[^>]*>([^<]+?)</h1', webpage, 'heading1', default=None)):
             raise ExtractorError(title, expected=True)
-        token = self._html_search_regex(r'''[?&]token=([a-z0-9]+)[&']''', webpage, 'token')
 
-        headers.update({
-            # 'User-Agent': 'Mozilla/5.0',  # (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0',
-            'referer': url
-        })
-
-        pass_md5 = self._html_search_regex(r'(/pass_md5.*?)\'', webpage, 'pass_md5')
+        pass_md5, token = self._search_regex(
+            r'["\']/(?P<pm>pass_md5/[\da-f-]+/(?P<tok>[\da-z]+))', webpage, 'tokens',
+            group=('pm', 'tok'))
+        headers = {
+            'Referer': url,
+        }
         # construct the media link
         final_url = self._download_webpage(
             'https://%s/%s' % (host, pass_md5), video_id, headers={
@@ -100,6 +100,7 @@ class DoodStreamIE(InfoExtractor):
             'expiry': int(time_time() * 1000),
         })
 
+        # get additional metadata
         thumb = next(filter(None, (url_or_none(self._html_search_meta(x, webpage, default=None))
                                    for x in ('og:image', 'twitter:image'))), None)
         description = self._html_search_meta(

From da90df06c3b8e7e6cc66a124c196aef4eb856a89 Mon Sep 17 00:00:00 2001
From: dirkf <fieldhouse@gmx.net>
Date: Fri, 29 Nov 2024 14:27:29 +0000
Subject: [PATCH 5/5] Linty

---
 youtube_dl/extractor/doodstream.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/youtube_dl/extractor/doodstream.py b/youtube_dl/extractor/doodstream.py
index 0d3271186..9350dee9c 100644
--- a/youtube_dl/extractor/doodstream.py
+++ b/youtube_dl/extractor/doodstream.py
@@ -61,7 +61,7 @@ class DoodStreamIE(InfoExtractor):
             'duration': 12.0,
         },
     }, {
-        'url': 'http://dood.ws /d/h7ecgw5oqn8k',
+        'url': 'http://dood.ws/d/h7ecgw5oqn8k',
         'only_matching': True,
     }, {
         'url': 'https://dood.li/d/wlihoael8uog',
@@ -94,7 +94,7 @@ class DoodStreamIE(InfoExtractor):
                 'Referer': url,
             }, note='Downloading authpage URL')
         final_url += ''.join((random_choice(ascii_letters + digits)
-                                        for _ in range(10)))
+                              for _ in range(10)))
         final_url = update_url_query(final_url, {
             'token': token,
             'expiry': int(time_time() * 1000),