tennistv.py 7.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155
  1. import urllib.parse
  2. from .common import InfoExtractor
  3. from ..utils import (
  4. ExtractorError,
  5. random_uuidv4,
  6. unified_timestamp,
  7. urlencode_postdata,
  8. )
  9. class TennisTVIE(InfoExtractor):
  10. _VALID_URL = r'https?://(?:www\.)?tennistv\.com/videos/(?P<id>[-a-z0-9]+)'
  11. _TESTS = [{
  12. 'url': 'https://www.tennistv.com/videos/indian-wells-2018-verdasco-fritz',
  13. 'info_dict': {
  14. 'id': 'indian-wells-2018-verdasco-fritz',
  15. 'ext': 'mp4',
  16. 'title': 'Fernando Verdasco v Taylor Fritz',
  17. 'description': 're:^After his stunning victory.{174}$',
  18. 'thumbnail': 'https://atp-prod.akamaized.net/api/images/v1/images/112831/landscape/1242/0',
  19. 'timestamp': 1521017381,
  20. 'upload_date': '20180314',
  21. },
  22. 'params': {
  23. 'skip_download': True,
  24. },
  25. 'skip': 'Requires email and password of a subscribed account',
  26. }, {
  27. 'url': 'https://www.tennistv.com/videos/2650480/best-matches-of-2022-part-5',
  28. 'info_dict': {
  29. 'id': '2650480',
  30. 'ext': 'mp4',
  31. 'title': 'Best Matches of 2022 - Part 5',
  32. 'description': 'md5:36dec3bfae7ed74bd79e48045b17264c',
  33. 'thumbnail': 'https://open.http.mp.streamamg.com/p/3001482/sp/300148200/thumbnail/entry_id/0_myef18pd/version/100001/height/1920',
  34. },
  35. 'params': {'skip_download': 'm3u8'},
  36. 'skip': 'Requires email and password of a subscribed account',
  37. }]
  38. _NETRC_MACHINE = 'tennistv'
  39. access_token, refresh_token = None, None
  40. _PARTNER_ID = 3001482
  41. _FORMAT_URL = 'https://open.http.mp.streamamg.com/p/{partner}/sp/{partner}00/playManifest/entryId/{entry}/format/applehttp/protocol/https/a.m3u8?ks={session}'
  42. _AUTH_BASE_URL = 'https://sso.tennistv.com/auth/realms/TennisTV/protocol/openid-connect'
  43. _HEADERS = {
  44. 'origin': 'https://www.tennistv.com',
  45. 'referer': 'https://www.tennistv.com/',
  46. 'content-Type': 'application/x-www-form-urlencoded',
  47. }
  48. def _perform_login(self, username, password):
  49. login_page = self._download_webpage(
  50. f'{self._AUTH_BASE_URL}/auth', None, 'Downloading login page',
  51. query={
  52. 'client_id': 'tennis-tv-web',
  53. 'redirect_uri': 'https://tennistv.com',
  54. 'response_mode': 'fragment',
  55. 'response_type': 'code',
  56. 'scope': 'openid',
  57. })
  58. post_url = self._html_search_regex(r'action=["\']([^"\']+?)["\']\s+method=["\']post["\']', login_page, 'login POST url')
  59. temp_page = self._download_webpage(
  60. post_url, None, 'Sending login data', 'Unable to send login data',
  61. headers=self._HEADERS, data=urlencode_postdata({
  62. 'username': username,
  63. 'password': password,
  64. 'submitAction': 'Log In',
  65. }))
  66. if 'Your username or password was incorrect' in temp_page:
  67. raise ExtractorError('Your username or password was incorrect', expected=True)
  68. handle = self._request_webpage(
  69. f'{self._AUTH_BASE_URL}/auth', None, 'Logging in', headers=self._HEADERS,
  70. query={
  71. 'client_id': 'tennis-tv-web',
  72. 'redirect_uri': 'https://www.tennistv.com/resources/v1.1.10/html/silent-check-sso.html',
  73. 'state': random_uuidv4(),
  74. 'response_mode': 'fragment',
  75. 'response_type': 'code',
  76. 'scope': 'openid',
  77. 'nonce': random_uuidv4(),
  78. 'prompt': 'none',
  79. })
  80. self.get_token(None, {
  81. 'code': urllib.parse.parse_qs(handle.url)['code'][-1],
  82. 'grant_type': 'authorization_code',
  83. 'client_id': 'tennis-tv-web',
  84. 'redirect_uri': 'https://www.tennistv.com/resources/v1.1.10/html/silent-check-sso.html',
  85. })
  86. def get_token(self, video_id, payload):
  87. res = self._download_json(
  88. f'{self._AUTH_BASE_URL}/token', video_id, 'Fetching tokens',
  89. 'Unable to fetch tokens', headers=self._HEADERS, data=urlencode_postdata(payload))
  90. self.access_token = res.get('access_token') or self.access_token
  91. self.refresh_token = res.get('refresh_token') or self.refresh_token
  92. def _real_initialize(self):
  93. if self.access_token and self.refresh_token:
  94. return
  95. cookies = self._get_cookies('https://www.tennistv.com/')
  96. if not cookies.get('access_token') or not cookies.get('refresh_token'):
  97. self.raise_login_required()
  98. self.access_token, self.refresh_token = cookies['access_token'].value, cookies['refresh_token'].value
  99. def _download_session_json(self, video_id, entryid):
  100. return self._download_json(
  101. f'https://atppayments.streamamg.com/api/v1/session/ksession/?lang=en&apijwttoken={self.access_token}&entryId={entryid}',
  102. video_id, 'Downloading ksession token', 'Failed to download ksession token', headers=self._HEADERS)
  103. def _real_extract(self, url):
  104. video_id = self._match_id(url)
  105. webpage = self._download_webpage(url, video_id)
  106. entryid = self._search_regex(r'data-entry-id=["\']([^"\']+)', webpage, 'entryID')
  107. session_json = self._download_session_json(video_id, entryid)
  108. k_session = session_json.get('KSession')
  109. if k_session is None:
  110. self.get_token(video_id, {
  111. 'grant_type': 'refresh_token',
  112. 'refresh_token': self.refresh_token,
  113. 'client_id': 'tennis-tv-web',
  114. })
  115. k_session = self._download_session_json(video_id, entryid).get('KSession')
  116. if k_session is None:
  117. raise ExtractorError('Failed to get KSession, possibly a premium video', expected=True)
  118. if session_json.get('ErrorMessage'):
  119. self.report_warning(session_json['ErrorMessage'])
  120. formats, subtitles = self._extract_m3u8_formats_and_subtitles(
  121. self._FORMAT_URL.format(partner=self._PARTNER_ID, entry=entryid, session=k_session), video_id)
  122. return {
  123. 'id': video_id,
  124. 'title': self._generic_title('', webpage),
  125. 'description': self._html_search_regex(
  126. (r'<span itemprop="description" content=["\']([^"\']+)["\']>', *self._og_regexes('description')),
  127. webpage, 'description', fatal=False),
  128. 'thumbnail': f'https://open.http.mp.streamamg.com/p/{self._PARTNER_ID}/sp/{self._PARTNER_ID}00/thumbnail/entry_id/{entryid}/version/100001/height/1920',
  129. 'timestamp': unified_timestamp(self._html_search_regex(
  130. r'<span itemprop="uploadDate" content=["\']([^"\']+)["\']>', webpage, 'upload time', fatal=False)),
  131. 'series': self._html_search_regex(r'data-series\s*?=\s*?"(.*?)"', webpage, 'series', fatal=False) or None,
  132. 'season': self._html_search_regex(r'data-tournament-city\s*?=\s*?"(.*?)"', webpage, 'season', fatal=False) or None,
  133. 'episode': self._html_search_regex(r'data-round\s*?=\s*?"(.*?)"', webpage, 'round', fatal=False) or None,
  134. 'formats': formats,
  135. 'subtitles': subtitles,
  136. }