added speedrun author and timer

The time-and-author lookup is optional (fatal=False) because the website's layout forced me into an unreliable regex.
2024-11-22 02:01:50 +00:00 · 2020-12-31 23:02:26 -05:00 · 2020-12-31 23:02:26 -05:00 · 9addbadd33
commit 9addbadd33
parent 14834bf977
1 changed files with 15 additions and 5 deletions
--- a/youtube_dl/extractor/tasvideos.py
+++ b/youtube_dl/extractor/tasvideos.py
@@ -27,8 +27,13 @@ class TASVideosIE(InfoExtractor):
            r'<a [^>]+(?P<URL>archive\.org\/download[^<]+\.(?:mkv|mp4|avi))[^<]+<\/a>',
            webpage)
        title = self._search_regex(
-            r'<span title="Movie[^"]+">(?P<TITLE>[^<]+)<\/span>', webpage,
+            r'<span title="Movie[^"]+">(?P<TITLE>[^<]+)<\/span>',
-            'title')
+            webpage, 'title')
        time_and_author = self._html_search_regex(
            r'<th.*<\/span>(?P<time_and_author>.*)<\/th>', webpage,
            'title: speedrun timer and credit', fatal=False)
        if time_and_author is not None:
            title = title + time_and_author
        formats = []
        for url in video_urls:
@@ -60,15 +65,20 @@ class TASVideosPlaylistIE(InfoExtractor):
        playlist_title = self._search_regex(
            r'<title>(?P<title>[^<]*)</title>', webpage, 'title')
        video_entries = get_elements_by_class('item', webpage)
-        
+
        entries = []
        for entry in video_entries:
            video_urls = re.findall(
                r'<a [^>]+(?P<URL>archive\.org\/download[^<]+\.(?:mkv|mp4|avi))[^<]+<\/a>',
                entry)
            title = self._search_regex(
-                r'<span title="Movie[^"]+">(?P<title>[^<]+)<\/span>', entry,
+                r'<span title="Movie[^"]+">(?P<title>[^<]+)<\/span>',
-                'title')
+                entry, 'title')
            time_and_author = self._html_search_regex(
                r'<th.*<\/span>(?P<time_and_author>.*)<\/th>', entry,
                'time_and_author', fatal=False)
            if time_and_author is not None:
                title = title + time_and_author
            video_id = self._search_regex(
                r'id="movie_(?P<id>\d+)', entry, 'video id') + 'M'