2021-11-27 06:51:32 +00:00
import itertools
2021-09-23 09:05:01 +00:00
import json
2021-11-27 06:51:32 +00:00
from . common import InfoExtractor
2023-07-09 07:53:02 +00:00
from . . networking . exceptions import HTTPError
2023-06-21 08:29:34 +00:00
from . . utils import ExtractorError , make_archive_id , parse_iso8601 , remove_start
2021-11-27 06:51:32 +00:00
2023-03-12 23:25:05 +00:00
# Scheme + host prefix shared by every Nebula `_VALID_URL` in this module:
# http or https, an optional "www." or "beta." subdomain, then one of the
# three domains the patterns below accept.
_BASE_URL_RE = r'https?://(?:www\.|beta\.)?(?:watchnebula\.com|nebula\.app|nebula\.tv)'
2022-09-22 01:44:07 +00:00
2021-11-27 06:51:32 +00:00
class NebulaBaseIE(InfoExtractor):
    """Shared login, API-call and metadata helpers for the Nebula extractors."""

    _NETRC_MACHINE = 'watchnebula'

    # Tokens stored by _perform_login() and read by _call_nebula_api():
    # the API token is sent as "Token <value>", the bearer token as
    # "Bearer <value>".
    _nebula_api_token = None
    _nebula_bearer_token = None

    def _perform_nebula_auth(self, username, password):
        """Log in with email/password and return the 'key' from the response.

        raise_login_required() is invoked when either credential is missing,
        or when the login request yields no response or no 'key'.
        """
        if not username or not password:
            self.raise_login_required(method='password')

        data = json.dumps({'email': username, 'password': password}).encode('utf8')
        response = self._download_json(
            'https://api.watchnebula.com/api/v1/auth/login/',
            data=data, fatal=False, video_id=None,
            headers={
                'content-type': 'application/json',
                # Submitting the 'sessionid' cookie always causes a 403 on auth endpoint
                'cookie': ''
            },
            note='Logging in to Nebula with supplied credentials',
            errnote='Authentication failed or rejected')
        if not response or not response.get('key'):
            self.raise_login_required(method='password')

        return response['key']

    def _call_nebula_api(self, url, video_id=None, method='GET', auth_type='api', note=''):
        """Download JSON from `url` with a Nebula Authorization header.

        `method` must be 'GET' or 'POST' (a POST sends an empty body) and
        `auth_type` must be 'api' (Token header) or 'bearer' (Bearer header).
        On an HTTP 401 or 403 the login is re-run once and the request is
        retried; any other ExtractorError is re-raised unchanged.
        """
        assert method in ('GET', 'POST',)
        assert auth_type in ('api', 'bearer',)

        def inner_call():
            # Built on every call so a retry picks up tokens refreshed by _perform_login()
            if auth_type == 'api':
                authorization = f'Token {self._nebula_api_token}'
            else:
                authorization = f'Bearer {self._nebula_bearer_token}'
            return self._download_json(
                url, video_id, note=note, headers={'Authorization': authorization},
                data=b'' if method == 'POST' else None)

        try:
            return inner_call()
        except ExtractorError as exc:
            cause = exc.cause
            # Only 401/403 are treated as "stale credentials"; everything else propagates
            if not isinstance(cause, HTTPError) or cause.status not in (401, 403):
                raise
            self.to_screen(
                f'Reauthenticating to Nebula and retrying, because last {auth_type} call '
                f'resulted in error {cause.status}')
            # NOTE(review): _perform_login() is called without credentials here, so
            # username/password default to None and _perform_nebula_auth() goes straight
            # to raise_login_required() - confirm whether the stored credentials should
            # be passed instead.
            self._perform_login()
            return inner_call()

    def _fetch_nebula_bearer_token(self):
        """
        Get a Bearer token for the Nebula API. This will be required to fetch video meta data.
        """
        response = self._call_nebula_api(
            'https://api.watchnebula.com/api/v1/authorization/',
            method='POST',
            note='Authorizing to Nebula')
        return response['token']

    def _fetch_video_formats(self, slug):
        """Fetch the stream info for `slug` and extract formats and subtitles from its manifest."""
        stream_info = self._call_nebula_api(
            f'https://content.api.nebula.app/video/{slug}/stream/',
            video_id=slug,
            auth_type='bearer',
            note='Fetching video stream info')
        manifest_url = stream_info['manifest']
        return self._extract_m3u8_formats_and_subtitles(manifest_url, slug, 'mp4')

    def _build_video_info(self, episode):
        """Turn an episode dict from the content API into an info dict.

        The result is always attributed to NebulaIE (extractor / extractor_key),
        regardless of which subclass built it.
        """
        fmts, subs = self._fetch_video_formats(episode['slug'])
        channel_slug = episode['channel_slug']
        channel_title = episode['channel_title']
        zype_id = episode.get('zype_id')
        return {
            'id': remove_start(episode['id'], 'video_episode:'),
            'display_id': episode['slug'],
            'formats': fmts,
            'subtitles': subs,
            'webpage_url': f'https://nebula.tv/{episode["slug"]}',
            'title': episode['title'],
            'description': episode['description'],
            'timestamp': parse_iso8601(episode['published_at']),
            'thumbnails': [{
                # 'id': tn.get('name'),  # this appears to be null
                'url': tn['original'],
                'height': key,
            } for key, tn in episode['assets']['thumbnail'].items()],
            'duration': episode['duration'],
            'channel': channel_title,
            'channel_id': channel_slug,
            'channel_url': f'https://nebula.tv/{channel_slug}',
            'uploader': channel_title,
            'uploader_id': channel_slug,
            'uploader_url': f'https://nebula.tv/{channel_slug}',
            'series': channel_title,
            'creator': channel_title,
            'extractor_key': NebulaIE.ie_key(),
            'extractor': NebulaIE.IE_NAME,
            # Archive id built from the zype_id, only when the episode has one
            '_old_archive_ids': [make_archive_id(NebulaIE, zype_id)] if zype_id else None,
        }

    def _perform_login(self, username=None, password=None):
        """Authenticate and store both the API token and the bearer token on the instance."""
        self._nebula_api_token = self._perform_nebula_auth(username, password)
        # Must come second: the bearer request is authorized with the API token set above
        self._nebula_bearer_token = self._fetch_nebula_bearer_token()
class NebulaIE(NebulaBaseIE):
    """Extractor for a single Nebula video page (`/videos/<slug>`)."""

    _VALID_URL = rf'{_BASE_URL_RE}/videos/(?P<id>[-\w]+)'
    _TESTS = [
        {
            'url': 'https://nebula.tv/videos/that-time-disney-remade-beauty-and-the-beast',
            'md5': '14944cfee8c7beeea106320c47560efc',
            'info_dict': {
                'id': '84ed544d-4afd-4723-8cd5-2b95261f0abf',
                'ext': 'mp4',
                'title': 'That Time Disney Remade Beauty and the Beast',
                'description': 'Note: this video was originally posted on YouTube with the sponsor read included. We weren’t able to remove it without reducing video quality, so it’s presented here in its original context.',
                'upload_date': '20180731',
                'timestamp': 1533009600,
                'channel': 'Lindsay Ellis',
                'channel_id': 'lindsayellis',
                'uploader': 'Lindsay Ellis',
                'uploader_id': 'lindsayellis',
                'uploader_url': 'https://nebula.tv/lindsayellis',
                'series': 'Lindsay Ellis',
                'display_id': 'that-time-disney-remade-beauty-and-the-beast',
                'channel_url': 'https://nebula.tv/lindsayellis',
                'creator': 'Lindsay Ellis',
                'duration': 2212,
                'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+\.jpeg?.*',
            },
        },
        {
            'url': 'https://nebula.tv/videos/the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
            'md5': 'd05739cf6c38c09322422f696b569c23',
            'info_dict': {
                'id': '7e623145-1b44-4ca3-aa0b-ed25a247ea34',
                'ext': 'mp4',
                'title': 'Landing Craft - How The Allies Got Ashore',
                'description': r're:^In this episode we explore the unsung heroes of D-Day, the landing craft.',
                'upload_date': '20200327',
                'timestamp': 1585348140,
                'channel': 'Real Engineering — The Logistics of D-Day',
                'channel_id': 'd-day',
                'uploader': 'Real Engineering — The Logistics of D-Day',
                'uploader_id': 'd-day',
                'series': 'Real Engineering — The Logistics of D-Day',
                'display_id': 'the-logistics-of-d-day-landing-craft-how-the-allies-got-ashore',
                'creator': 'Real Engineering — The Logistics of D-Day',
                'duration': 841,
                'channel_url': 'https://nebula.tv/d-day',
                'uploader_url': 'https://nebula.tv/d-day',
                'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+\.jpeg?.*',
            },
        },
        {
            'url': 'https://nebula.tv/videos/money-episode-1-the-draw',
            'md5': 'ebe28a7ad822b9ee172387d860487868',
            'info_dict': {
                'id': 'b96c5714-9e2b-4ec3-b3f1-20f6e89cc553',
                'ext': 'mp4',
                'title': 'Episode 1: The Draw',
                'description': r'contains:There’s free money on offer… if the players can all work together.',
                'upload_date': '20200323',
                'timestamp': 1584980400,
                'channel': 'Tom Scott Presents: Money',
                'channel_id': 'tom-scott-presents-money',
                'uploader': 'Tom Scott Presents: Money',
                'uploader_id': 'tom-scott-presents-money',
                'uploader_url': 'https://nebula.tv/tom-scott-presents-money',
                'duration': 825,
                'channel_url': 'https://nebula.tv/tom-scott-presents-money',
                'series': 'Tom Scott Presents: Money',
                'display_id': 'money-episode-1-the-draw',
                'thumbnail': r're:https://\w+\.cloudfront\.net/[\w-]+\.jpeg?.*',
                'creator': 'Tom Scott Presents: Money',
            },
        },
        {
            'url': 'https://watchnebula.com/videos/money-episode-1-the-draw',
            'only_matching': True,
        },
        {
            'url': 'https://beta.nebula.tv/videos/money-episode-1-the-draw',
            'only_matching': True,
        },
    ]

    def _fetch_video_metadata(self, slug):
        """Return the content API's metadata JSON for the video identified by `slug`."""
        return self._call_nebula_api(
            f'https://content.api.nebula.app/video/{slug}/',
            video_id=slug,
            auth_type='bearer',
            note='Fetching video meta data')

    def _real_extract(self, url):
        """Resolve the slug from `url`, fetch its metadata and build the info dict."""
        slug = self._match_id(url)
        video = self._fetch_video_metadata(slug)
        return self._build_video_info(video)
2021-09-23 09:05:01 +00:00
2022-05-15 11:55:44 +00:00
class NebulaSubscriptionsIE(NebulaBaseIE):
    """Extractor for the `/myshows` page, returned as one playlist."""

    IE_NAME = 'nebula:subscriptions'
    _VALID_URL = rf'{_BASE_URL_RE}/myshows'
    _TESTS = [
        {
            'url': 'https://nebula.tv/myshows',
            'playlist_mincount': 1,
            'info_dict': {
                'id': 'myshows',
            },
        },
    ]

    def _generate_playlist_entries(self):
        """Yield an info dict per episode, following each page's 'next' link until it is empty."""
        next_url = 'https://content.watchnebula.com/library/video/?page_size=100'
        page_num = 1
        while next_url:
            channel = self._call_nebula_api(
                next_url, 'myshows', auth_type='bearer',
                note=f'Retrieving subscriptions page {page_num}')
            for episode in channel['results']:
                yield self._build_video_info(episode)
            # A falsy 'next' ends the loop
            next_url = channel['next']
            page_num += 1

    def _real_extract(self, url):
        """Return the library as a playlist with the fixed id 'myshows'."""
        return self.playlist_result(self._generate_playlist_entries(), 'myshows')
class NebulaChannelIE(NebulaBaseIE):
    """Extractor for a Nebula channel page, returned as a playlist of its episodes."""

    IE_NAME = 'nebula:channel'
    # The negative lookahead keeps this pattern off URLs handled by the
    # subscriptions (/myshows) and single-video (/videos/...) extractors.
    _VALID_URL = rf'{_BASE_URL_RE}/(?!myshows|videos/)(?P<id>[-\w]+)'
    _TESTS = [
        {
            'url': 'https://nebula.tv/tom-scott-presents-money',
            'info_dict': {
                'id': 'tom-scott-presents-money',
                'title': 'Tom Scott Presents: Money',
                'description': 'Tom Scott hosts a series all about trust, negotiation and money.',
            },
            'playlist_count': 5,
        }, {
            'url': 'https://nebula.tv/lindsayellis',
            'info_dict': {
                'id': 'lindsayellis',
                'title': 'Lindsay Ellis',
                'description': 'Enjoy these hottest of takes on Disney, Transformers, and Musicals.',
            },
            'playlist_mincount': 2,
        },
    ]

    def _generate_playlist_entries(self, collection_id, channel):
        """Yield an info dict per episode, starting from the already-fetched first page.

        `channel` is the first page's JSON; further pages are fetched through
        its episodes' 'next' link until that link is empty.
        """
        episodes = channel['episodes']['results']
        # Counting starts at 2 because page 1 was passed in by the caller
        for page_num in itertools.count(2):
            for episode in episodes:
                yield self._build_video_info(episode)
            next_url = channel['episodes']['next']
            if not next_url:
                break
            channel = self._call_nebula_api(
                next_url, collection_id, auth_type='bearer',
                note=f'Retrieving channel page {page_num}')
            episodes = channel['episodes']['results']

    def _real_extract(self, url):
        """Fetch the channel's first page and return a playlist with its title and description."""
        collection_id = self._match_id(url)
        channel_url = f'https://content.watchnebula.com/video/channels/{collection_id}/'
        channel = self._call_nebula_api(
            channel_url, collection_id, auth_type='bearer', note='Retrieving channel')
        channel_details = channel['details']

        return self.playlist_result(
            entries=self._generate_playlist_entries(collection_id, channel),
            playlist_id=collection_id,
            playlist_title=channel_details['title'],
            playlist_description=channel_details['description']
        )