foxsports.py 2.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152
  1. from .common import InfoExtractor
  2. from .uplynk import UplynkPreplayIE
  3. from ..networking import HEADRequest
  4. from ..utils import float_or_none, make_archive_id, smuggle_url
  5. class FoxSportsIE(InfoExtractor):
  6. _VALID_URL = r'https?://(?:www\.)?foxsports\.com/watch/(?P<id>[\w-]+)'
  7. _TESTS = [{
  8. 'url': 'https://www.foxsports.com/watch/play-612168c6700004b',
  9. 'info_dict': {
  10. 'id': 'b72f5bd8658140baa5791bb676433733',
  11. 'ext': 'mp4',
  12. 'display_id': 'play-612168c6700004b',
  13. 'title': 'md5:e0c4ecac3a1f25295b4fae22fb5c126a',
  14. 'description': 'md5:371bc43609708ae2b9e1a939229762af',
  15. 'uploader_id': '06b4a36349624051a9ba52ac3a91d268',
  16. 'upload_date': '20221205',
  17. 'timestamp': 1670262586,
  18. 'duration': 31.7317,
  19. 'thumbnail': r're:^https?://.*\.jpg$',
  20. 'extra_param_to_segment_url': str,
  21. },
  22. 'params': {
  23. 'skip_download': 'm3u8',
  24. },
  25. }]
  26. def _real_extract(self, url):
  27. video_id = self._match_id(url)
  28. webpage = self._download_webpage(url, video_id)
  29. json_ld = self._search_json_ld(webpage, video_id, expected_type='VideoObject', default={})
  30. data = self._download_json(
  31. f'https://api3.fox.com/v2.0/vodplayer/sportsclip/{video_id}',
  32. video_id, note='Downloading API JSON', headers={
  33. 'x-api-key': 'cf289e299efdfa39fb6316f259d1de93',
  34. })
  35. preplay_url = self._request_webpage(
  36. HEADRequest(data['url']), video_id, 'Fetching preplay URL').url
  37. return {
  38. '_type': 'url_transparent',
  39. 'ie_key': UplynkPreplayIE.ie_key(),
  40. 'url': smuggle_url(preplay_url, {'Origin': 'https://www.foxsports.com'}),
  41. 'display_id': video_id,
  42. 'title': data.get('name') or json_ld.get('title'),
  43. 'description': data.get('description') or json_ld.get('description'),
  44. 'duration': float_or_none(data.get('durationInSeconds')),
  45. 'timestamp': json_ld.get('timestamp'),
  46. 'thumbnails': json_ld.get('thumbnails'),
  47. '_old_archive_ids': [make_archive_id(self, video_id)],
  48. }