stv.py 3.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788
  1. from .common import InfoExtractor
  2. from ..utils import (
  3. float_or_none,
  4. int_or_none,
  5. smuggle_url,
  6. str_or_none,
  7. try_get,
  8. )
  9. class STVPlayerIE(InfoExtractor):
  10. IE_NAME = 'stv:player'
  11. _VALID_URL = r'https?://player\.stv\.tv/(?P<type>episode|video)/(?P<id>[a-z0-9]{4})'
  12. _TESTS = [{
  13. # shortform
  14. 'url': 'https://player.stv.tv/video/4gwd/emmerdale/60-seconds-on-set-with-laura-norton/',
  15. 'md5': '5adf9439c31d554f8be0707c7abe7e0a',
  16. 'info_dict': {
  17. 'id': '5333973339001',
  18. 'ext': 'mp4',
  19. 'upload_date': '20170301',
  20. 'title': '60 seconds on set with Laura Norton',
  21. 'description': "How many questions can Laura - a.k.a Kerry Wyatt - answer in 60 seconds? Let's find out!",
  22. 'timestamp': 1488388054,
  23. 'uploader_id': '1486976045',
  24. },
  25. 'skip': 'this resource is unavailable outside of the UK',
  26. }, {
  27. # episodes
  28. 'url': 'https://player.stv.tv/episode/4125/jennifer-saunders-memory-lane',
  29. 'only_matching': True,
  30. }]
  31. BRIGHTCOVE_URL_TEMPLATE = 'http://players.brightcove.net/1486976045/default_default/index.html?videoId=%s'
  32. _PTYPE_MAP = {
  33. 'episode': 'episodes',
  34. 'video': 'shortform',
  35. }
  36. def _real_extract(self, url):
  37. ptype, video_id = self._match_valid_url(url).groups()
  38. webpage = self._download_webpage(url, video_id, fatal=False) or ''
  39. props = self._search_nextjs_data(webpage, video_id, default={}).get('props') or {}
  40. player_api_cache = try_get(
  41. props, lambda x: x['initialReduxState']['playerApiCache']) or {}
  42. api_path, resp = None, {}
  43. for k, v in player_api_cache.items():
  44. if k.startswith(('/episodes/', '/shortform/')):
  45. api_path, resp = k, v
  46. break
  47. else:
  48. episode_id = str_or_none(try_get(
  49. props, lambda x: x['pageProps']['episodeId']))
  50. api_path = f'/{self._PTYPE_MAP[ptype]}/{episode_id or video_id}'
  51. result = resp.get('results')
  52. if not result:
  53. resp = self._download_json(
  54. 'https://player.api.stv.tv/v1' + api_path, video_id)
  55. result = resp['results']
  56. video = result['video']
  57. video_id = str(video['id'])
  58. subtitles = {}
  59. _subtitles = result.get('_subtitles') or {}
  60. for ext, sub_url in _subtitles.items():
  61. subtitles.setdefault('en', []).append({
  62. 'ext': 'vtt' if ext == 'webvtt' else ext,
  63. 'url': sub_url,
  64. })
  65. programme = result.get('programme') or {}
  66. if programme.get('drmEnabled'):
  67. self.report_drm(video_id)
  68. return {
  69. '_type': 'url_transparent',
  70. 'id': video_id,
  71. 'url': smuggle_url(self.BRIGHTCOVE_URL_TEMPLATE % video_id, {'geo_countries': ['GB']}),
  72. 'description': result.get('summary'),
  73. 'duration': float_or_none(video.get('length'), 1000),
  74. 'subtitles': subtitles,
  75. 'view_count': int_or_none(result.get('views')),
  76. 'series': programme.get('name') or programme.get('shortName'),
  77. 'ie_key': 'BrightcoveNew',
  78. }