download all pages before starting to extract info

2024-11-30 03:33:02 +00:00 · 2015-06-27 10:55:25 +01:00 · 2015-06-27 10:55:25 +01:00 · f39eb98bab
commit f39eb98bab
parent 7d7d469025
1 changed files with 4 additions and 5 deletions
--- a/youtube_dl/extractor/snagfilms.py
+++ b/youtube_dl/extractor/snagfilms.py
@ -34,7 +34,6 @@ def _real_extract(self, url):
        display_id, video_id = match(self._VALID_URL,url).groups()
        if display_id is None:
            embed_webpage = self._download_webpage('http://www.snagfilms.com/embed/player?filmId=' + video_id, video_id)
            display_id = self._html_search_regex(
                r"snagfilms\.com/films/title/(?P<display_id>.+?)(?:/|')",
                embed_webpage,
@ -48,16 +47,16 @@ def _real_extract(self, url):
            'data'
        ), display_id)
        if video_id is None:
            video_id = json_data['id']
            embed_webpage = self._download_webpage('http://www.snagfilms.com/embed/player?filmId=' + video_id, video_id)
        title = json_data['title']
        duration = int(json_data['duration'])
        description = json_data['synopsis']
        categories = [category['title'] for category in json_data['categories']]
        thumbnail = json_data['image']
        if video_id is None:
            video_id = json_data['id']
            embed_webpage = self._download_webpage('http://www.snagfilms.com/embed/player?filmId=' + video_id, video_id)
        sources = self._parse_json(js_to_json(self._html_search_regex(
            r'sources: (?P<sources>\[.*?\])',
            embed_webpage,