0
0
Fork 0
mirror of https://github.com/yt-dlp/yt-dlp.git synced 2024-12-01 03:43:02 +00:00

Allow downloading videos whose titles contain characters outside the previously whitelisted set

Especially HTML entities, which are now unescaped in the extracted title.
This commit is contained in:
Jaime Marquínez Ferrándiz 2013-01-03 21:05:04 +01:00
parent f5ebb61495
commit 9cf98a2bcc

View file

@ -3694,9 +3694,10 @@ def _real_extract(self, url):
videourl = 'http://store.steampowered.com/video/%s/' % gameID videourl = 'http://store.steampowered.com/video/%s/' % gameID
webpage = self._download_webpage(videourl, gameID) webpage = self._download_webpage(videourl, gameID)
mweb = re.finditer(urlRE, webpage) mweb = re.finditer(urlRE, webpage)
namesRE = r'<span class=\"title\">(?P<videoName>[\w:/\.\?=\+\s-]+)</span>' namesRE = r'<span class="title">(?P<videoName>.+)</span>'
titles = list(re.finditer(namesRE, webpage)) titles = list(re.finditer(namesRE, webpage))
videos = [] videos = []
unescaper = compat_html_parser.HTMLParser()
for vid,vtitle in zip(mweb,titles): for vid,vtitle in zip(mweb,titles):
video_id = vid.group('videoID') video_id = vid.group('videoID')
title = vtitle.group('videoName') title = vtitle.group('videoName')
@ -3707,7 +3708,7 @@ def _real_extract(self, url):
'id':video_id, 'id':video_id,
'url':video_url, 'url':video_url,
'ext': 'flv', 'ext': 'flv',
'title': title 'title': unescaper.unescape(title)
} }
videos.append(info) videos.append(info)
return videos return videos