# coding: utf-8 from __future__ import unicode_literals import random import string import time from ..compat import compat_filter as filter from ..utils import ( clean_html, ExtractorError, get_element_by_class, parse_duration, parse_filesize, update_url_query, unified_strdate, url_or_none, ) from .common import InfoExtractor class DoodStreamIE(InfoExtractor): _VALID_URL = r'https?://(?:www\.)?dood\.(?:to|watch)/[ed]/(?P[a-z0-9]+)' _TESTS = [{ 'url': 'http://dood.to/e/5s1wmbdacezb', 'md5': '4568b83b31e13242b3f1ff96c55f0595', 'info_dict': { 'id': '5s1wmbdacezb', 'ext': 'mp4', 'title': 'Kat Wonders - Monthly May 2020', 'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com', 'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg', }, 'skip': 'Video not found', }, { 'url': 'http://dood.watch/d/5s1wmbdacezb', 'md5': '4568b83b31e13242b3f1ff96c55f0595', 'info_dict': { 'id': '5s1wmbdacezb', 'ext': 'mp4', 'title': 'Kat Wonders - Monthly May 2020', 'description': 'Kat Wonders - Monthly May 2020 | DoodStream.com', 'thumbnail': 'https://img.doodcdn.com/snaps/flyus84qgl2fsk4g.jpg', }, 'skip': 'Video not found', }, { 'url': 'https://dood.to/d/jzrxn12t2s7n', 'md5': '3207e199426eca7c2aa23c2872e6728a', 'info_dict': { 'id': 'jzrxn12t2s7n', 'ext': 'mp4', 'title': 'Stacy Cruz Cute ALLWAYSWELL', 'description': 'Stacy Cruz Cute ALLWAYSWELL | DoodStream.com', 'thumbnail': 'https://img.doodcdn.com/snaps/8edqd5nppkac3x8u.jpg', }, 'skip': 'Video not found', }, { 'url': 'https://dood.to/d/is34uy8wvaet', 'md5': '04740d3ba93bcd638aa7a097d9226710', 'info_dict': { 'id': 'is34uy8wvaet', 'ext': 'mp4', 'title': 'Akhanda (2021) Telugu DVDScr MP3 700MB - DoodStream', 'upload_date': '20211202', 'filesize_approx': int, 'duration': 9886, } }] def _real_extract(self, url): video_id = self._match_id(url) url = 'https://dood.to/e/' + video_id headers = { 'User-Agent': 'Mozilla/5.0', # (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/66.0', } webpage = self._download_webpage(url, video_id, headers=headers) title = self._html_search_meta(('og:title', 'twitter:title'), webpage, default=None) if not title: title = self._html_search_regex(r']*>([^<]+?)(?:\|\s+DoodStream\s*)?