yt-dlp/yt_dlp/extractor/nebula.py

import itertools
import json

from .art19 import Art19IE
from .common import InfoExtractor
from ..networking.exceptions import HTTPError
from ..utils import (
    ExtractorError,
    int_or_none,
    make_archive_id,
    parse_iso8601,
    smuggle_url,
    try_call,
    unsmuggle_url,
    update_url_query,
    url_or_none,
    urljoin,
)
from ..utils.traversal import traverse_obj

# Shared URL prefix used to build every extractor's _VALID_URL in this module:
# http or https, an optional `www.` or `beta.` subdomain, and any of the
# watchnebula.com, nebula.app or nebula.tv domains.
_BASE_URL_RE = r'https?://(?:www\.|beta\.)?(?:watchnebula\.com|nebula\.app|nebula\.tv)'


class NebulaBaseIE(InfoExtractor):
    """Common login, authorization and metadata helpers for the Nebula extractors."""

    _NETRC_MACHINE = 'watchnebula'
    # Key returned by the login endpoint, or read from the `nebula_auth.apiToken` cookie
    _api_token = None
    # Token returned by the authorization endpoint; sent as `Bearer` header and manifest query
    _token = None

    def _perform_login(self, username, password):
        """Log in with email/password and remember the returned API key.

        Raises ExtractorError (expected) on HTTP 400, and ExtractorError when
        the response carries no string `key`.
        """
        credentials = json.dumps({'email': username, 'password': password}).encode()
        try:
            login_response = self._download_json(
                'https://nebula.tv/auth/login/', None,
                note='Logging in to Nebula', errnote='Login failed',
                data=credentials, headers={'content-type': 'application/json'})
        except ExtractorError as err:
            rejected = isinstance(err.cause, HTTPError) and err.cause.status == 400
            if not rejected:
                raise
            raise ExtractorError('Login failed: Invalid username or password', expected=True)

        api_token = traverse_obj(login_response, ('key', {str}))
        self._api_token = api_token
        if not api_token:
            raise ExtractorError('Login failed: No token')

    def _call_api(self, *args, **kwargs):
        """Download JSON with the bearer token attached, reauthorizing once on HTTP 401/403.

        Positional and keyword arguments are forwarded to `_download_json`.
        """
        def attach_bearer_token():
            # Only set the header when a token is available
            if self._token:
                kwargs.setdefault('headers', {})['Authorization'] = f'Bearer {self._token}'

        attach_bearer_token()
        try:
            return self._download_json(*args, **kwargs)
        except ExtractorError as err:
            auth_rejected = isinstance(err.cause, HTTPError) and err.cause.status in (401, 403)
            if not auth_rejected:
                raise
            self.to_screen(
                f'Reauthorizing with Nebula and retrying, because last API call resulted in error {err.cause.status}')
            self._real_initialize()
            attach_bearer_token()
            return self._download_json(*args, **kwargs)

    def _real_initialize(self):
        """Fetch a fresh authorization token, using the API key from login or cookies if present."""
        if not self._api_token:
            def read_cookie_token():
                return self._get_cookies('https://nebula.tv')['nebula_auth.apiToken'].value

            # try_call yields None when the cookie is not available
            self._api_token = try_call(read_cookie_token)

        auth_headers = None
        if self._api_token:
            auth_headers = {'Authorization': f'Token {self._api_token}'}
        authorization = self._download_json(
            'https://users.api.nebula.app/api/v1/authorization/', None,
            note='Authorizing to Nebula', data=b'', headers=auth_headers)
        self._token = authorization['token']

    def _extract_formats(self, content_id, slug):
        """Return `{'formats': ..., 'subtitles': ...}` from the content's HLS manifest.

        HTTP 401 triggers `raise_login_required`; the first HTTP 403 triggers a
        reauthorization followed by a single retry. Any other failure is re-raised.
        """
        content_kind = content_id.split(':')[0]
        manifest_url = f'https://content.api.nebula.app/{content_kind}s/{content_id}/manifest.m3u8'
        for is_retry in (False, True):
            try:
                formats, subtitles = self._extract_m3u8_formats_and_subtitles(
                    manifest_url, slug, 'mp4', query={
                        # Read on every attempt so a refreshed token is picked up
                        'token': self._token,
                        'app_version': '23.10.0',
                        'platform': 'ios',
                    })
            except ExtractorError as err:
                status = err.cause.status if isinstance(err.cause, HTTPError) else None
                if status == 401:
                    self.raise_login_required()
                if status == 403 and not is_retry:
                    self.to_screen('Reauthorizing with Nebula and retrying, because fetching video resulted in error')
                    self._real_initialize()
                    continue
                raise
            else:
                return {'formats': formats, 'subtitles': subtitles}

    def _extract_video_metadata(self, episode):
        """Map an API episode/lesson object to info-dict metadata fields."""
        def to_channel_url(channel_slug):
            return urljoin('https://nebula.tv/', channel_slug)

        def legacy_archive_ids(zype_id):
            # Old code was wrongly setting extractor_key from NebulaSubscriptionsIE
            if not zype_id:
                return None
            return [make_archive_id(NebulaIE, zype_id), make_archive_id(NebulaSubscriptionsIE, zype_id)]

        # First of `channel_slug` / `class_slug` that produces a URL
        channel_url = traverse_obj(
            episode, (('channel_slug', 'class_slug'), {to_channel_url}), get_all=False)

        # The ID is whatever follows the first ':' in the API's `id` value
        info = {'id': episode['id'].partition(':')[2]}
        info.update(traverse_obj(episode, {
            'display_id': 'slug',
            'title': 'title',
            'description': 'description',
            'timestamp': ('published_at', {parse_iso8601}),
            'duration': ('duration', {int_or_none}),
            'channel_id': 'channel_slug',
            'uploader_id': 'channel_slug',
            'channel': 'channel_title',
            'uploader': 'channel_title',
            'series': 'channel_title',
            'creator': 'channel_title',
            'thumbnail': ('images', 'thumbnail', 'src', {url_or_none}),
            'episode_number': ('order', {int_or_none}),
            '_old_archive_ids': ('zype_id', {legacy_archive_ids}),
        }))
        info['channel_url'] = channel_url
        info['uploader_url'] = channel_url
        return info


class NebulaIE(NebulaBaseIE):
    """Extractor for single Nebula videos under `/videos/<slug>`."""

    IE_NAME = 'nebula:video'
    _VALID_URL = rf'{_BASE_URL_RE}/videos/(?P<id>[\w-]+)'
    _TESTS = [{
        'url': 'https://nebula.tv/videos/that-time-disney-remade-beauty-and-the-beast',
        'info_dict': {
            'id': '84ed544d-4afd-4723-8cd5-2b95261f0abf',
            'ext': 'mp4',
            'title': 'That Time Disney Remade Beauty and the Beast',
            'description': 'md5:2aae3c4cfc5ee09a1ecdff0909618cf4',
            'upload_date': '20180731',
            'timestamp': 1533009600,
            'channel': 'Lindsay Ellis',
            'channel_id': 'lindsayellis',
            'uploader': 'Lindsay Ellis',
            'uploader_id': 'lindsayellis',
            'uploader_url': r're:https://nebula\.(tv|app)/lindsayellis',
            'series': 'Lindsay Ellis',
            'display_id': 'that-time-disney-remade-beauty-and-the-beast',
            'channel_url': r're:https://nebula\.(tv|app)/lindsayellis',
            'creator': 'Lindsay Ellis',
            'duration': 2212,
            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
            '_old_archive_ids': ['nebula 5c271b40b13fd613090034fd', 'nebulasubscriptions 5c271b40b13fd613090034fd'],
        },
        'params': {'skip_download': 'm3u8'},
    }, {
        'url': 'https://nebula.tv/videos/the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
        'md5': 'd05739cf6c38c09322422f696b569c23',
        'info_dict': {
            'id': '7e623145-1b44-4ca3-aa0b-ed25a247ea34',
            'ext': 'mp4',
            'title': 'Landing Craft - How The Allies Got Ashore',
            'description': r're:^In this episode we explore the unsung heroes of D-Day, the landing craft.',
            'upload_date': '20200327',
            'timestamp': 1585348140,
            'channel': 'Real Engineering — The Logistics of D-Day',
            'channel_id': 'd-day',
            'uploader': 'Real Engineering — The Logistics of D-Day',
            'uploader_id': 'd-day',
            'series': 'Real Engineering — The Logistics of D-Day',
            'display_id': 'the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
            'creator': 'Real Engineering — The Logistics of D-Day',
            'duration': 841,
            'channel_url': 'https://nebula.tv/d-day',
            'uploader_url': 'https://nebula.tv/d-day',
            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
            '_old_archive_ids': ['nebula 5e7e78171aaf320001fbd6be', 'nebulasubscriptions 5e7e78171aaf320001fbd6be'],
        },
        'params': {'skip_download': 'm3u8'},
    }, {
        'url': 'https://nebula.tv/videos/money-episode-1-the-draw',
        'md5': 'ebe28a7ad822b9ee172387d860487868',
        'info_dict': {
            'id': 'b96c5714-9e2b-4ec3-b3f1-20f6e89cc553',
            'ext': 'mp4',
            'title': 'Episode 1: The Draw',
            'description': r'contains:There’s free money on offer… if the players can all work together.',
            'upload_date': '20200323',
            'timestamp': 1584980400,
            'channel': 'Tom Scott Presents: Money',
            'channel_id': 'tom-scott-presents-money',
            'uploader': 'Tom Scott Presents: Money',
            'uploader_id': 'tom-scott-presents-money',
            'uploader_url': 'https://nebula.tv/tom-scott-presents-money',
            'duration': 825,
            'channel_url': 'https://nebula.tv/tom-scott-presents-money',
            'series': 'Tom Scott Presents: Money',
            'display_id': 'money-episode-1-the-draw',
            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
            'creator': 'Tom Scott Presents: Money',
            '_old_archive_ids': ['nebula 5e779ebdd157bc0001d1c75a', 'nebulasubscriptions 5e779ebdd157bc0001d1c75a'],
        },
        'params': {'skip_download': 'm3u8'},
    }, {
        'url': 'https://watchnebula.com/videos/money-episode-1-the-draw',
        'only_matching': True,
    }, {
        'url': 'https://nebula.tv/videos/tldrnewseu-did-the-us-really-blow-up-the-nordstream-pipelines',
        'info_dict': {
            'id': 'e389af9d-1dab-44f2-8788-ee24deb7ff0d',
            'ext': 'mp4',
            'display_id': 'tldrnewseu-did-the-us-really-blow-up-the-nordstream-pipelines',
            'title': 'Did the US Really Blow Up the NordStream Pipelines?',
            'description': 'md5:b4e2a14e3ff08f546a3209c75261e789',
            'upload_date': '20230223',
            'timestamp': 1677144070,
            'channel': 'TLDR News EU',
            'channel_id': 'tldrnewseu',
            'uploader': 'TLDR News EU',
            'uploader_id': 'tldrnewseu',
            'uploader_url': r're:https://nebula\.(tv|app)/tldrnewseu',
            'duration': 524,
            'channel_url': r're:https://nebula\.(tv|app)/tldrnewseu',
            'series': 'TLDR News EU',
            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
            'creator': 'TLDR News EU',
            '_old_archive_ids': ['nebula 63f64c74366fcd00017c1513', 'nebulasubscriptions 63f64c74366fcd00017c1513'],
        },
        'params': {'skip_download': 'm3u8'},
    }, {
        'url': 'https://beta.nebula.tv/videos/money-episode-1-the-draw',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Extract one video, skipping the metadata request when a content ID was smuggled in."""
        video_slug = self._match_id(url)
        _, smuggled = unsmuggle_url(url, {})

        content_id = smuggled.get('id')
        if content_id:
            # A playlist extractor already supplied the content ID; only formats are needed here
            info = {
                'id': content_id,
                'display_id': video_slug,
                'title': '',
            }
            info.update(self._extract_formats(content_id, video_slug))
            return info

        video = self._call_api(
            f'https://content.api.nebula.app/content/videos/{video_slug}',
            video_slug, note='Fetching video metadata')
        info = self._extract_video_metadata(video)
        info.update(self._extract_formats(video['id'], video_slug))
        return info


class NebulaClassIE(NebulaBaseIE):
    """Extractor for `/<collection>/<episode>` URLs: class lessons and podcast episodes."""

    IE_NAME = 'nebula:media'
    _VALID_URL = rf'{_BASE_URL_RE}/(?!(?:myshows|library|videos)/)(?P<id>[\w-]+)/(?P<ep>[\w-]+)/?(?:$|[?#])'
    _TESTS = [{
        'url': 'https://nebula.tv/copyright-for-fun-and-profit/14',
        'info_dict': {
            'id': 'd7432cdc-c608-474d-942c-f74345daed7b',
            'ext': 'mp4',
            'display_id': '14',
            'channel_url': 'https://nebula.tv/copyright-for-fun-and-profit',
            'episode_number': 14,
            'thumbnail': 'https://dj423fildxgac.cloudfront.net/d533718d-9307-42d4-8fb0-e283285e99c9',
            'uploader_url': 'https://nebula.tv/copyright-for-fun-and-profit',
            'duration': 646,
            'episode': 'Episode 14',
            'title': 'Photos, Sculpture, and Video',
        },
        'params': {'skip_download': 'm3u8'},
    }, {
        'url': 'https://nebula.tv/extremitiespodcast/pyramiden-the-high-arctic-soviet-ghost-town',
        'info_dict': {
            'ext': 'mp3',
            'id': '018f65f0-0033-4021-8f87-2d132beb19aa',
            'description': 'md5:05d2b23ab780c955e2511a2b9127acff',
            'series_id': '335e8159-d663-491a-888f-1732285706ac',
            'modified_timestamp': 1599091504,
            'episode_id': '018f65f0-0033-4021-8f87-2d132beb19aa',
            'series': 'Extremities',
            'modified_date': '20200903',
            'upload_date': '20200902',
            'title': 'Pyramiden: The High-Arctic Soviet Ghost Town',
            'release_timestamp': 1571237958,
            'thumbnail': r're:^https?://content\.production\.cdn\.art19\.com.*\.jpeg$',
            'duration': 1546.05714,
            'timestamp': 1599085608,
            'release_date': '20191016',
        },
    }, {
        'url': 'https://nebula.tv/thelayover/the-layover-episode-1',
        'info_dict': {
            'ext': 'mp3',
            'id': '9d74a762-00bb-45a8-9e8d-9ed47c04a1d0',
            'episode_number': 1,
            'thumbnail': r're:^https?://content\.production\.cdn\.art19\.com.*\.jpeg$',
            'release_date': '20230304',
            'modified_date': '20230403',
            'series': 'The Layover',
            'episode_id': '9d74a762-00bb-45a8-9e8d-9ed47c04a1d0',
            'modified_timestamp': 1680554566,
            'duration': 3130.46401,
            'release_timestamp': 1677943800,
            'title': 'The Layover — Episode 1',
            'series_id': '874303a5-4900-4626-a4b6-2aacac34466a',
            'upload_date': '20230303',
            'episode': 'Episode 1',
            'timestamp': 1677883672,
            'description': 'md5:002cca89258e3bc7c268d5b8c24ba482',
        },
    }]

    def _real_extract(self, url):
        """Extract a lesson or podcast episode.

        Returns the lesson's info dict, a `url_result` delegating to Art19IE,
        or an info dict pointing straight at the podcast's `episode_url`.
        Raises ExtractorError for any other content type.
        """
        slug, episode = self._match_valid_url(url).group('id', 'ep')
        url, smuggled_data = unsmuggle_url(url, {})
        if smuggled_data.get('id'):
            # A playlist extractor already supplied the content ID; only formats are needed here
            return {
                'id': smuggled_data['id'],
                'display_id': slug,
                'title': '',
                **self._extract_formats(smuggled_data['id'], slug),
            }

        metadata = self._call_api(
            f'https://content.api.nebula.app/content/{slug}/{episode}/?include=lessons',
            slug, note='Fetching class/podcast metadata')
        content_type = metadata.get('type')
        if content_type == 'lesson':
            return {
                **self._extract_video_metadata(metadata),
                **self._extract_formats(metadata['id'], slug),
            }
        elif content_type == 'podcast_episode':
            episode_url = metadata['episode_url']
            if not episode_url and metadata.get('premium'):
                self.raise_login_required()

            # Only consult Art19IE when there is a URL to match, so the matcher is never handed None
            if episode_url and Art19IE.suitable(episode_url):
                return self.url_result(episode_url, Art19IE)
            return traverse_obj(metadata, {
                'id': ('id', {str}),
                'url': ('episode_url', {url_or_none}),
                'title': ('title', {str}),
                'description': ('description', {str}),
                'timestamp': ('published_at', {parse_iso8601}),
                'duration': ('duration', {int_or_none}),
                'channel_id': ('channel_id', {str}),
                'channel': ('channel_title', {str}),
                'thumbnail': ('assets', 'regular', {url_or_none}),
            })

        raise ExtractorError(f'Unexpected content type {content_type!r}')


class NebulaSubscriptionsIE(NebulaBaseIE):
    """Playlist extractor for the `myshows` and `library/latest-videos` pages."""

    IE_NAME = 'nebula:subscriptions'
    _VALID_URL = rf'{_BASE_URL_RE}/(?P<id>myshows|library/latest-videos)/?(?:$|[?#])'
    _TESTS = [{
        'url': 'https://nebula.tv/myshows',
        'playlist_mincount': 1,
        'info_dict': {
            'id': 'myshows',
        },
    }]

    def _generate_playlist_entries(self):
        """Yield a url_transparent entry per followed episode, following `next` links until exhausted."""
        page_url = update_url_query('https://content.api.nebula.app/video_episodes/', {
            'following': 'true',
            'include': 'engagement',
            'ordering': '-published_at',
        })
        page_num = 0
        while page_url:
            page_num += 1
            page = self._call_api(
                page_url, 'myshows', note=f'Retrieving subscriptions page {page_num}')
            for episode in page['results']:
                metadata = self._extract_video_metadata(episode)
                video_url = f'https://nebula.tv/videos/{metadata["display_id"]}'
                # Smuggle the content ID so NebulaIE can skip its own metadata request
                smuggled_url = smuggle_url(video_url, {'id': episode['id']})
                yield self.url_result(smuggled_url, NebulaIE, url_transparent=True, **metadata)
            page_url = page.get('next')

    def _real_extract(self, url):
        """Return the subscriptions playlist; the playlist ID is always 'myshows'."""
        entries = self._generate_playlist_entries()
        return self.playlist_result(entries, 'myshows')


class NebulaChannelIE(NebulaBaseIE):
    """Playlist extractor for a Nebula collection page: video channel, class or podcast channel."""

    IE_NAME = 'nebula:channel'
    _VALID_URL = rf'{_BASE_URL_RE}/(?!myshows|library|videos)(?P<id>[\w-]+)/?(?:$|[?#])'
    _TESTS = [{
        'url': 'https://nebula.tv/tom-scott-presents-money',
        'info_dict': {
            'id': 'tom-scott-presents-money',
            'title': 'Tom Scott Presents: Money',
            'description': 'Tom Scott hosts a series all about trust, negotiation and money.',
        },
        'playlist_count': 5,
    }, {
        'url': 'https://nebula.tv/lindsayellis',
        'info_dict': {
            'id': 'lindsayellis',
            'title': 'Lindsay Ellis',
            'description': 'Enjoy these hottest of takes on Disney, Transformers, and Musicals.',
        },
        'playlist_mincount': 2,
    }, {
        'url': 'https://nebula.tv/johnnyharris',
        'info_dict': {
            'id': 'johnnyharris',
            'title': 'Johnny Harris',
            'description': 'I make videos about maps and many other things.',
        },
        'playlist_mincount': 90,
    }, {
        'url': 'https://nebula.tv/copyright-for-fun-and-profit',
        'info_dict': {
            'id': 'copyright-for-fun-and-profit',
            'title': 'Copyright for Fun and Profit',
            'description': 'md5:6690248223eed044a9f11cd5a24f9742',
        },
        'playlist_count': 23,
    }, {
        'url': 'https://nebula.tv/trussissuespodcast',
        'info_dict': {
            'id': 'trussissuespodcast',
            'title': 'The TLDR News Podcast',
            'description': 'md5:a08c4483bc0b705881d3e0199e721385',
        },
        'playlist_mincount': 80,
    }]

    def _generate_playlist_entries(self, collection_id, collection_slug):
        """Yield a url_transparent NebulaIE entry per channel episode, following `next` links."""
        next_url = f'https://content.api.nebula.app/video_channels/{collection_id}/video_episodes/?ordering=-published_at'
        for page_num in itertools.count(1):
            episodes = self._call_api(next_url, collection_slug, note=f'Retrieving channel page {page_num}')
            for episode in episodes['results']:
                metadata = self._extract_video_metadata(episode)
                # Smuggle the content ID so NebulaIE can skip its own metadata request
                yield self.url_result(smuggle_url(
                    episode.get('share_url') or f'https://nebula.tv/videos/{metadata["display_id"]}',
                    {'id': episode['id']}), NebulaIE, url_transparent=True, **metadata)
            next_url = episodes.get('next')
            if not next_url:
                break

    def _generate_class_entries(self, channel):
        """Yield a url_transparent NebulaClassIE entry for every lesson in `channel['lessons']`."""
        for lesson in channel['lessons']:
            metadata = self._extract_video_metadata(lesson)
            # The fallback URL is built from the raw lesson object: the extracted
            # metadata dict carries neither a `class_slug` nor a `slug` key
            yield self.url_result(smuggle_url(
                lesson.get('share_url') or f'https://nebula.tv/{lesson["class_slug"]}/{lesson["slug"]}',
                {'id': lesson['id']}), NebulaClassIE, url_transparent=True, **metadata)

    def _generate_podcast_entries(self, collection_id, collection_slug):
        """Yield a NebulaClassIE url_result per podcast episode with a valid `share_url`."""
        next_url = f'https://content.api.nebula.app/podcast_channels/{collection_id}/podcast_episodes/?ordering=-published_at&premium=true'
        for page_num in itertools.count(1):
            episodes = self._call_api(next_url, collection_slug, note=f'Retrieving podcast page {page_num}')

            # Episodes without a usable share_url are skipped
            for episode in traverse_obj(episodes, ('results', lambda _, v: url_or_none(v['share_url']))):
                yield self.url_result(episode['share_url'], NebulaClassIE)
            next_url = episodes.get('next')
            if not next_url:
                break

    def _real_extract(self, url):
        """Fetch the collection and return a playlist built by the generator matching its `type`."""
        collection_slug = self._match_id(url)
        channel = self._call_api(
            f'https://content.api.nebula.app/content/{collection_slug}/?include=lessons',
            collection_slug, note='Retrieving channel')

        if channel.get('type') == 'class':
            entries = self._generate_class_entries(channel)
        elif channel.get('type') == 'podcast_channel':
            entries = self._generate_podcast_entries(channel['id'], collection_slug)
        else:
            # Any other type is treated as a regular video channel
            entries = self._generate_playlist_entries(channel['id'], collection_slug)

        return self.playlist_result(
            entries=entries,
            playlist_id=collection_slug,
            playlist_title=channel.get('title'),
            playlist_description=channel.get('description'))
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								import itertools
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
+								import json
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								from .art19 import Art19IE
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								from .common import InfoExtractor
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 07:53:02 +00:00
+								from ..networking.exceptions import HTTPError
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								from ..utils import (
 								    ExtractorError,
 								    int_or_none,
 								    make_archive_id,
 								    parse_iso8601,
 								    smuggle_url,
 								    try_call,
 								    unsmuggle_url,
 								    update_url_query,
 								    url_or_none,
 								    urljoin,
 								)
 								from ..utils.traversal import traverse_obj
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
-												[extractor/nebula] Add `beta.nebula.tv` (#6516)

Authored by: unbeatable-101
											
										
										
											2023-03-12 23:25:05 +00:00
+								_BASE_URL_RE = r'https?://(?:www\.|beta\.)?(?:watchnebula\.com|nebula\.app|nebula\.tv)'
-												[extractor/nebula] Add nebula.tv (#4918)

Closes #4917
Authored by: tannertechnology
											
										
										
											2022-09-22 01:44:07 +00:00
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
 								class NebulaBaseIE(InfoExtractor):
 								    _NETRC_MACHINE = 'watchnebula'
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    _token = _api_token = None
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _perform_login(self, username, password):
 								        try:
 								            response = self._download_json(
 								                'https://nebula.tv/auth/login/', None,
 								                'Logging in to Nebula', 'Login failed',
 								                data=json.dumps({'email': username, 'password': password}).encode(),
 								                headers={'content-type': 'application/json'})
 								        except ExtractorError as e:
 								            if isinstance(e.cause, HTTPError) and e.cause.status == 400:
 								                raise ExtractorError('Login failed: Invalid username or password', expected=True)
 								            raise
 								        self._api_token = traverse_obj(response, ('key', {str}))
 								        if not self._api_token:
 								            raise ExtractorError('Login failed: No token')
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _call_api(self, *args, **kwargs):
 								        if self._token:
 								            kwargs.setdefault('headers', {})['Authorization'] = f'Bearer {self._token}'
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								        try:
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								            return self._download_json(*args, **kwargs)
 								        except ExtractorError as e:
 								            if not isinstance(e.cause, HTTPError) or e.cause.status not in (401, 403):
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								                raise
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								            self.to_screen(
 								                f'Reauthorizing with Nebula and retrying, because last API call resulted in error {e.cause.status}')
 								            self._real_initialize()
 								            if self._token:
 								                kwargs.setdefault('headers', {})['Authorization'] = f'Bearer {self._token}'
 								            return self._download_json(*args, **kwargs)
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _real_initialize(self):
 								        if not self._api_token:
 								            self._api_token = try_call(
 								                lambda: self._get_cookies('https://nebula.tv')['nebula_auth.apiToken'].value)
 								        self._token = self._download_json(
 								            'https://users.api.nebula.app/api/v1/authorization/', None,
 								            headers={'Authorization': f'Token {self._api_token}'} if self._api_token else None,
 								            note='Authorizing to Nebula', data=b'')['token']
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _extract_formats(self, content_id, slug):
 								        for retry in (False, True):
 								            try:
 								                fmts, subs = self._extract_m3u8_formats_and_subtitles(
 								                    f'https://content.api.nebula.app/{content_id.split(":")[0]}s/{content_id}/manifest.m3u8',
 								                    slug, 'mp4', query={
 								                        'token': self._token,
 								                        'app_version': '23.10.0',
 								                        'platform': 'ios',
 								                    })
 								                return {'formats': fmts, 'subtitles': subs}
 								            except ExtractorError as e:
 								                if isinstance(e.cause, HTTPError) and e.cause.status == 401:
 								                    self.raise_login_required()
 								                if not retry and isinstance(e.cause, HTTPError) and e.cause.status == 403:
 								                    self.to_screen('Reauthorizing with Nebula and retrying, because fetching video resulted in error')
 								                    self._real_initialize()
 								                    continue
 								                raise
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _extract_video_metadata(self, episode):
 								        channel_url = traverse_obj(
 								            episode, (('channel_slug', 'class_slug'), {lambda x: urljoin('https://nebula.tv/', x)}), get_all=False)
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								        return {
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								            'id': episode['id'].partition(':')[2],
 								            **traverse_obj(episode, {
 								                'display_id': 'slug',
 								                'title': 'title',
 								                'description': 'description',
 								                'timestamp': ('published_at', {parse_iso8601}),
 								                'duration': ('duration', {int_or_none}),
 								                'channel_id': 'channel_slug',
 								                'uploader_id': 'channel_slug',
 								                'channel': 'channel_title',
 								                'uploader': 'channel_title',
 								                'series': 'channel_title',
 								                'creator': 'channel_title',
 								                'thumbnail': ('images', 'thumbnail', 'src', {url_or_none}),
 								                'episode_number': ('order', {int_or_none}),
 								                # Old code was wrongly setting extractor_key from NebulaSubscriptionsIE
 								                '_old_archive_ids': ('zype_id', {lambda x: [
 								                    make_archive_id(NebulaIE, x), make_archive_id(NebulaSubscriptionsIE, x)] if x else None}),
 								            }),
 								            'channel_url': channel_url,
 								            'uploader_url': channel_url,
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								        }
 								class NebulaIE(NebulaBaseIE):
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    IE_NAME = 'nebula:video'
 								    _VALID_URL = rf'{_BASE_URL_RE}/videos/(?P<id>[\w-]+)'
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    _TESTS = [{
 								        'url': 'https://nebula.tv/videos/that-time-disney-remade-beauty-and-the-beast',
 								        'info_dict': {
 								            'id': '84ed544d-4afd-4723-8cd5-2b95261f0abf',
 								            'ext': 'mp4',
 								            'title': 'That Time Disney Remade Beauty and the Beast',
 								            'description': 'md5:2aae3c4cfc5ee09a1ecdff0909618cf4',
 								            'upload_date': '20180731',
 								            'timestamp': 1533009600,
 								            'channel': 'Lindsay Ellis',
 								            'channel_id': 'lindsayellis',
 								            'uploader': 'Lindsay Ellis',
 								            'uploader_id': 'lindsayellis',
 								            'uploader_url': r're:https://nebula\.(tv|app)/lindsayellis',
 								            'series': 'Lindsay Ellis',
 								            'display_id': 'that-time-disney-remade-beauty-and-the-beast',
 								            'channel_url': r're:https://nebula\.(tv|app)/lindsayellis',
 								            'creator': 'Lindsay Ellis',
 								            'duration': 2212,
 								            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
 								            '_old_archive_ids': ['nebula 5c271b40b13fd613090034fd', 'nebulasubscriptions 5c271b40b13fd613090034fd'],
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
+								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        'params': {'skip_download': 'm3u8'},
 								    }, {
 								        'url': 'https://nebula.tv/videos/the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
 								        'md5': 'd05739cf6c38c09322422f696b569c23',
 								        'info_dict': {
 								            'id': '7e623145-1b44-4ca3-aa0b-ed25a247ea34',
 								            'ext': 'mp4',
 								            'title': 'Landing Craft - How The Allies Got Ashore',
 								            'description': r're:^In this episode we explore the unsung heroes of D-Day, the landing craft.',
 								            'upload_date': '20200327',
 								            'timestamp': 1585348140,
 								            'channel': 'Real Engineering — The Logistics of D-Day',
 								            'channel_id': 'd-day',
 								            'uploader': 'Real Engineering — The Logistics of D-Day',
 								            'uploader_id': 'd-day',
 								            'series': 'Real Engineering — The Logistics of D-Day',
 								            'display_id': 'the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
 								            'creator': 'Real Engineering — The Logistics of D-Day',
 								            'duration': 841,
 								            'channel_url': 'https://nebula.tv/d-day',
 								            'uploader_url': 'https://nebula.tv/d-day',
 								            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
 								            '_old_archive_ids': ['nebula 5e7e78171aaf320001fbd6be', 'nebulasubscriptions 5e7e78171aaf320001fbd6be'],
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
+								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        'params': {'skip_download': 'm3u8'},
 								    }, {
 								        'url': 'https://nebula.tv/videos/money-episode-1-the-draw',
 								        'md5': 'ebe28a7ad822b9ee172387d860487868',
 								        'info_dict': {
 								            'id': 'b96c5714-9e2b-4ec3-b3f1-20f6e89cc553',
 								            'ext': 'mp4',
 								            'title': 'Episode 1: The Draw',
 								            'description': r'contains:There’s free money on offer… if the players can all work together.',
 								            'upload_date': '20200323',
 								            'timestamp': 1584980400,
 								            'channel': 'Tom Scott Presents: Money',
 								            'channel_id': 'tom-scott-presents-money',
 								            'uploader': 'Tom Scott Presents: Money',
 								            'uploader_id': 'tom-scott-presents-money',
 								            'uploader_url': 'https://nebula.tv/tom-scott-presents-money',
 								            'duration': 825,
 								            'channel_url': 'https://nebula.tv/tom-scott-presents-money',
 								            'series': 'Tom Scott Presents: Money',
 								            'display_id': 'money-episode-1-the-draw',
 								            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
 								            'creator': 'Tom Scott Presents: Money',
 								            '_old_archive_ids': ['nebula 5e779ebdd157bc0001d1c75a', 'nebulasubscriptions 5e779ebdd157bc0001d1c75a'],
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
+								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        'params': {'skip_download': 'm3u8'},
 								    }, {
 								        'url': 'https://watchnebula.com/videos/money-episode-1-the-draw',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://nebula.tv/videos/tldrnewseu-did-the-us-really-blow-up-the-nordstream-pipelines',
 								        'info_dict': {
 								            'id': 'e389af9d-1dab-44f2-8788-ee24deb7ff0d',
 								            'ext': 'mp4',
 								            'display_id': 'tldrnewseu-did-the-us-really-blow-up-the-nordstream-pipelines',
 								            'title': 'Did the US Really Blow Up the NordStream Pipelines?',
 								            'description': 'md5:b4e2a14e3ff08f546a3209c75261e789',
 								            'upload_date': '20230223',
 								            'timestamp': 1677144070,
 								            'channel': 'TLDR News EU',
 								            'channel_id': 'tldrnewseu',
 								            'uploader': 'TLDR News EU',
 								            'uploader_id': 'tldrnewseu',
 								            'uploader_url': r're:https://nebula\.(tv|app)/tldrnewseu',
 								            'duration': 524,
 								            'channel_url': r're:https://nebula\.(tv|app)/tldrnewseu',
 								            'series': 'TLDR News EU',
 								            'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+',
 								            'creator': 'TLDR News EU',
 								            '_old_archive_ids': ['nebula 63f64c74366fcd00017c1513', 'nebulasubscriptions 63f64c74366fcd00017c1513'],
-												[extractor/nebula] Add `beta.nebula.tv` (#6516)

Authored by: unbeatable-101
											
										
										
											2023-03-12 23:25:05 +00:00
+								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        'params': {'skip_download': 'm3u8'},
 								    }, {
 								        'url': 'https://beta.nebula.tv/videos/money-episode-1-the-draw',
 								        'only_matching': True,
 								    }]
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								    def _real_extract(self, url):
 								        slug = self._match_id(url)
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        url, smuggled_data = unsmuggle_url(url, {})
 								        if smuggled_data.get('id'):
 								            return {
 								                'id': smuggled_data['id'],
 								                'display_id': slug,
 								                'title': '',
 								                **self._extract_formats(smuggled_data['id'], slug),
 								            }
 								        metadata = self._call_api(
 								            f'https://content.api.nebula.app/content/videos/{slug}',
 								            slug, note='Fetching video metadata')
 								        return {
 								            **self._extract_video_metadata(metadata),
 								            **self._extract_formats(metadata['id'], slug),
 								        }
 								class NebulaClassIE(NebulaBaseIE):
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    IE_NAME = 'nebula:media'
 								    _VALID_URL = rf'{_BASE_URL_RE}/(?!(?:myshows|library|videos)/)(?P<id>[\w-]+)/(?P<ep>[\w-]+)/?(?:$|[?#])'
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    _TESTS = [{
 								        'url': 'https://nebula.tv/copyright-for-fun-and-profit/14',
 								        'info_dict': {
 								            'id': 'd7432cdc-c608-474d-942c-f74345daed7b',
 								            'ext': 'mp4',
 								            'display_id': '14',
 								            'channel_url': 'https://nebula.tv/copyright-for-fun-and-profit',
 								            'episode_number': 14,
 								            'thumbnail': 'https://dj423fildxgac.cloudfront.net/d533718d-9307-42d4-8fb0-e283285e99c9',
 								            'uploader_url': 'https://nebula.tv/copyright-for-fun-and-profit',
 								            'duration': 646,
 								            'episode': 'Episode 14',
 								            'title': 'Photos, Sculpture, and Video',
 								        },
 								        'params': {'skip_download': 'm3u8'},
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    }, {
 								        'url': 'https://nebula.tv/extremitiespodcast/pyramiden-the-high-arctic-soviet-ghost-town',
 								        'info_dict': {
 								            'ext': 'mp3',
 								            'id': '018f65f0-0033-4021-8f87-2d132beb19aa',
 								            'description': 'md5:05d2b23ab780c955e2511a2b9127acff',
 								            'series_id': '335e8159-d663-491a-888f-1732285706ac',
 								            'modified_timestamp': 1599091504,
 								            'episode_id': '018f65f0-0033-4021-8f87-2d132beb19aa',
 								            'series': 'Extremities',
 								            'modified_date': '20200903',
 								            'upload_date': '20200902',
 								            'title': 'Pyramiden: The High-Arctic Soviet Ghost Town',
 								            'release_timestamp': 1571237958,
 								            'thumbnail': r're:^https?://content\.production\.cdn\.art19\.com.*\.jpeg$',
 								            'duration': 1546.05714,
 								            'timestamp': 1599085608,
 								            'release_date': '20191016',
 								        },
 								    }, {
 								        'url': 'https://nebula.tv/thelayover/the-layover-episode-1',
 								        'info_dict': {
 								            'ext': 'mp3',
 								            'id': '9d74a762-00bb-45a8-9e8d-9ed47c04a1d0',
 								            'episode_number': 1,
 								            'thumbnail': r're:^https?://content\.production\.cdn\.art19\.com.*\.jpeg$',
 								            'release_date': '20230304',
 								            'modified_date': '20230403',
 								            'series': 'The Layover',
 								            'episode_id': '9d74a762-00bb-45a8-9e8d-9ed47c04a1d0',
 								            'modified_timestamp': 1680554566,
 								            'duration': 3130.46401,
 								            'release_timestamp': 1677943800,
 								            'title': 'The Layover — Episode 1',
 								            'series_id': '874303a5-4900-4626-a4b6-2aacac34466a',
 								            'upload_date': '20230303',
 								            'episode': 'Episode 1',
 								            'timestamp': 1677883672,
 								            'description': 'md5:002cca89258e3bc7c268d5b8c24ba482',
 								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    }]
 								    def _real_extract(self, url):
 								        slug, episode = self._match_valid_url(url).group('id', 'ep')
 								        url, smuggled_data = unsmuggle_url(url, {})
 								        if smuggled_data.get('id'):
 								            return {
 								                'id': smuggled_data['id'],
 								                'display_id': slug,
 								                'title': '',
 								                **self._extract_formats(smuggled_data['id'], slug),
 								            }
 								        metadata = self._call_api(
 								            f'https://content.api.nebula.app/content/{slug}/{episode}/?include=lessons',
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								            slug, note='Fetching class/podcast metadata')
 								        content_type = metadata.get('type')
 								        if content_type == 'lesson':
 								            return {
 								                **self._extract_video_metadata(metadata),
 								                **self._extract_formats(metadata['id'], slug),
 								            }
 								        elif content_type == 'podcast_episode':
 								            episode_url = metadata['episode_url']
 								            if not episode_url and metadata.get('premium'):
 								                self.raise_login_required()
 								            if Art19IE.suitable(episode_url):
 								                return self.url_result(episode_url, Art19IE)
 								            return traverse_obj(metadata, {
 								                'id': ('id', {str}),
 								                'url': ('episode_url', {url_or_none}),
 								                'title': ('title', {str}),
 								                'description': ('description', {str}),
 								                'timestamp': ('published_at', {parse_iso8601}),
 								                'duration': ('duration', {int_or_none}),
 								                'channel_id': ('channel_id', {str}),
 								                'chnanel': ('channel_title', {str}),
 								                'thumbnail': ('assets', 'regular', {url_or_none}),
 								            })
 								        raise ExtractorError(f'Unexpected content type {content_type!r}')
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[nebula] Add support for subscriptions (#3719)

Closes #3609 
Authored by: hheimbuerger
											
										
										
											2022-05-15 11:55:44 +00:00
class NebulaSubscriptionsIE(NebulaBaseIE):
    """Playlist extractor for the videos of followed channels (`/myshows`)."""

    IE_NAME = 'nebula:subscriptions'
    _VALID_URL = rf'{_BASE_URL_RE}/(?P<id>myshows|library/latest-videos)/?(?:$|[?#])'
    _TESTS = [{
        'url': 'https://nebula.tv/myshows',
        'playlist_mincount': 1,
        'info_dict': {
            'id': 'myshows',
        },
    }]

    def _generate_playlist_entries(self):
        """Yield url_transparent NebulaIE results for every followed-channel video.

        Pages are requested one after another, following the `next` link of
        each API response until a response has none.
        """
        page_url = update_url_query('https://content.api.nebula.app/video_episodes/', {
            'following': 'true',
            'include': 'engagement',
            'ordering': '-published_at',
        })
        page_num = 0
        while page_url:
            page_num += 1
            page = self._call_api(
                page_url, 'myshows', note=f'Retrieving subscriptions page {page_num}')
            for episode in page['results']:
                metadata = self._extract_video_metadata(episode)
                # Smuggle the API id so NebulaIE can skip its own metadata request
                video_url = smuggle_url(
                    f'https://nebula.tv/videos/{metadata["display_id"]}',
                    {'id': episode['id']})
                yield self.url_result(video_url, NebulaIE, url_transparent=True, **metadata)
            page_url = page.get('next')

    def _real_extract(self, url):
        """Return the subscriptions feed as a lazily generated playlist with id `myshows`."""
        entries = self._generate_playlist_entries()
        return self.playlist_result(entries, 'myshows')
 								class NebulaChannelIE(NebulaBaseIE):
 								    IE_NAME = 'nebula:channel'
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    _VALID_URL = rf'{_BASE_URL_RE}/(?!myshows|library|videos)(?P<id>[\w-]+)/?(?:$|[?#])'
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    _TESTS = [{
 								        'url': 'https://nebula.tv/tom-scott-presents-money',
 								        'info_dict': {
 								            'id': 'tom-scott-presents-money',
 								            'title': 'Tom Scott Presents: Money',
 								            'description': 'Tom Scott hosts a series all about trust, negotiation and money.',
 								        },
 								        'playlist_count': 5,
 								    }, {
 								        'url': 'https://nebula.tv/lindsayellis',
 								        'info_dict': {
 								            'id': 'lindsayellis',
 								            'title': 'Lindsay Ellis',
 								            'description': 'Enjoy these hottest of takes on Disney, Transformers, and Musicals.',
 								        },
 								        'playlist_mincount': 2,
 								    }, {
 								        'url': 'https://nebula.tv/johnnyharris',
 								        'info_dict': {
 								            'id': 'johnnyharris',
 								            'title': 'Johnny Harris',
 								            'description': 'I make videos about maps and many other things.',
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								        },
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        'playlist_mincount': 90,
 								    }, {
 								        'url': 'https://nebula.tv/copyright-for-fun-and-profit',
 								        'info_dict': {
 								            'id': 'copyright-for-fun-and-profit',
 								            'title': 'Copyright for Fun and Profit',
 								            'description': 'md5:6690248223eed044a9f11cd5a24f9742',
 								        },
 								        'playlist_count': 23,
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    }, {
 								        'url': 'https://nebula.tv/trussissuespodcast',
 								        'info_dict': {
 								            'id': 'trussissuespodcast',
 								            'title': 'The TLDR News Podcast',
 								            'description': 'md5:a08c4483bc0b705881d3e0199e721385',
 								        },
 								        'playlist_mincount': 80,
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    }]
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								    def _generate_playlist_entries(self, collection_id, collection_slug):
 								        next_url = f'https://content.api.nebula.app/video_channels/{collection_id}/video_episodes/?ordering=-published_at'
 								        for page_num in itertools.count(1):
 								            episodes = self._call_api(next_url, collection_slug, note=f'Retrieving channel page {page_num}')
 								            for episode in episodes['results']:
 								                metadata = self._extract_video_metadata(episode)
 								                yield self.url_result(smuggle_url(
 								                    episode.get('share_url') or f'https://nebula.tv/videos/{metadata["display_id"]}',
 								                    {'id': episode['id']}), NebulaIE, url_transparent=True, **metadata)
 								            next_url = episodes.get('next')
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								            if not next_url:
 								                break
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
 								    def _generate_class_entries(self, channel):
 								        for lesson in channel['lessons']:
 								            metadata = self._extract_video_metadata(lesson)
 								            yield self.url_result(smuggle_url(
 								                lesson.get('share_url') or f'https://nebula.tv/{metadata["class_slug"]}/{metadata["slug"]}',
 								                {'id': lesson['id']}), NebulaClassIE, url_transparent=True, **metadata)
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								    def _generate_podcast_entries(self, collection_id, collection_slug):
 								        next_url = f'https://content.api.nebula.app/podcast_channels/{collection_id}/podcast_episodes/?ordering=-published_at&premium=true'
 								        for page_num in itertools.count(1):
 								            episodes = self._call_api(next_url, collection_slug, note=f'Retrieving podcast page {page_num}')
 								            for episode in traverse_obj(episodes, ('results', lambda _, v: url_or_none(v['share_url']))):
 								                yield self.url_result(episode['share_url'], NebulaClassIE)
 								            next_url = episodes.get('next')
 								            if not next_url:
 								                break
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
+								    def _real_extract(self, url):
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        collection_slug = self._match_id(url)
 								        channel = self._call_api(
 								            f'https://content.api.nebula.app/content/{collection_slug}/?include=lessons',
 								            collection_slug, note='Retrieving channel')
 								        if channel.get('type') == 'class':
 								            entries = self._generate_class_entries(channel)
-												[ie/nebula] Support podcasts (#9140)

Closes #8838
Authored by: seproDev, c-basalt

Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-02-24 16:08:47 +00:00
+								        elif channel.get('type') == 'podcast_channel':
 								            entries = self._generate_podcast_entries(channel['id'], collection_slug)
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								        else:
 								            entries = self._generate_playlist_entries(channel['id'], collection_slug)
-												[cleanup] Fix line endings for `nebula.py` (#1064)

:ci skip
Authored by: glenn-slayden
											
										
										
											2021-09-23 09:05:01 +00:00
-												[nebula] Add NebulaCollectionIE and rewrite extractor (#1694)

Closes #1690
Authored by: hheimbuerger
											
										
										
											2021-11-27 06:51:32 +00:00
+								        return self.playlist_result(
-												[ie/nebula] Overhaul extractors (#8566)

Closes #4300, Closes #5814, Closes #7588, Closes #6334, Closes #6538
Authored by: elyse0, pukkandan, seproDev

Co-authored-by: Elyse <26639800+elyse0@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2023-11-20 01:03:33 +00:00
+								            entries=entries,
 								            playlist_id=collection_slug,
 								            playlist_title=channel.get('title'),
 								            playlist_description=channel.get('description'))