# mirrorcouk.py (4.3 KB)

from .common import InfoExtractor
from ..utils import unescapeHTML
  3. class MirrorCoUKIE(InfoExtractor):
  4. _VALID_URL = r'https?://(?:www\.)?mirror\.co\.uk/[/+[\w-]+-(?P<id>\d+)'
  5. _TESTS = [{
  6. 'url': 'https://www.mirror.co.uk/tv/tv-news/love-island-fans-baffled-after-27163139',
  7. 'info_dict': {
  8. 'id': 'voyyS7SV',
  9. 'ext': 'mp4',
  10. 'title': 'Love Island: Gemma Owen enters the villa',
  11. 'description': 'Love Island: Michael Owen\'s daughter Gemma Owen enters the villa.',
  12. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/voyyS7SV/poster.jpg?width=720',
  13. 'display_id': '27163139',
  14. 'timestamp': 1654547895,
  15. 'duration': 57.0,
  16. 'upload_date': '20220606',
  17. },
  18. }, {
  19. 'url': 'https://www.mirror.co.uk/3am/celebrity-news/michael-jacksons-son-blankets-new-25344890',
  20. 'info_dict': {
  21. 'id': 'jyXpdvxp',
  22. 'ext': 'mp4',
  23. 'title': 'Michael Jackson’s son Bigi calls for action on climate change',
  24. 'description': 'md5:d39ceaba2b7a615b4ca6557e7bc40222',
  25. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/jyXpdvxp/poster.jpg?width=720',
  26. 'display_id': '25344890',
  27. 'timestamp': 1635749907,
  28. 'duration': 56.0,
  29. 'upload_date': '20211101',
  30. },
  31. }, {
  32. 'url': 'https://www.mirror.co.uk/sport/football/news/antonio-conte-next-tottenham-manager-25346042',
  33. 'info_dict': {
  34. 'id': 'q6FkKa4p',
  35. 'ext': 'mp4',
  36. 'title': 'Nuno sacked by Tottenham after fifth Premier League defeat of the season',
  37. 'description': 'Nuno Espirito Santo has been sacked as Tottenham boss after only four months in charge.',
  38. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/q6FkKa4p/poster.jpg?width=720',
  39. 'display_id': '25346042',
  40. 'timestamp': 1635763157,
  41. 'duration': 40.0,
  42. 'upload_date': '20211101',
  43. },
  44. }, {
  45. 'url': 'https://www.mirror.co.uk/3am/celebrity-news/johnny-depp-splashes-50k-curry-27160737',
  46. 'info_dict': {
  47. 'id': 'IT0oa1nH',
  48. 'ext': 'mp4',
  49. 'title': 'Johnny Depp Leaves The Grand Hotel in Birmingham',
  50. 'description': 'Johnny Depp Leaves The Grand Hotel in Birmingham.',
  51. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/IT0oa1nH/poster.jpg?width=720',
  52. 'display_id': '27160737',
  53. 'timestamp': 1654524120,
  54. 'duration': 65.0,
  55. 'upload_date': '20220606',
  56. },
  57. }, {
  58. 'url': 'https://www.mirror.co.uk/tv/tv-news/love-islands-liam-could-first-27162602',
  59. 'info_dict': {
  60. 'id': 'EaPr5Z2j',
  61. 'ext': 'mp4',
  62. 'title': 'Love Island: Davide reveals plot twist after receiving text',
  63. 'description': 'Love Island: Davide reveals plot twist after receiving text',
  64. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/EaPr5Z2j/poster.jpg?width=720',
  65. 'display_id': '27162602',
  66. 'timestamp': 1654552597,
  67. 'duration': 23.0,
  68. 'upload_date': '20220606',
  69. },
  70. }, {
  71. 'url': 'https://www.mirror.co.uk/news/uk-news/william-kate-sent-message-george-27160572',
  72. 'info_dict': {
  73. 'id': 'ygtceXIu',
  74. 'ext': 'mp4',
  75. 'title': 'Prince William and Kate arrive in Wales with George and Charlotte',
  76. 'description': 'Prince William and Kate Middleton arrive in Wales with children Prince George and Princess Charlotte.',
  77. 'thumbnail': 'https://cdn.jwplayer.com/v2/media/ygtceXIu/poster.jpg?width=720',
  78. 'display_id': '27160572',
  79. 'timestamp': 1654349678,
  80. 'duration': 106.0,
  81. 'upload_date': '20220604',
  82. },
  83. }]
  84. def _real_extract(self, url):
  85. display_id = self._match_id(url)
  86. webpage = self._download_webpage(url, display_id)
  87. data = self._search_json(r'div\s+class="json-placeholder"\s+data-json="',
  88. webpage, 'data', display_id, transform_source=unescapeHTML)['videoData']
  89. return {
  90. '_type': 'url_transparent',
  91. 'url': f'jwplatform:{data["videoId"]}',
  92. 'ie_key': 'JWPlatform',
  93. 'display_id': display_id,
  94. }