prankcast.py 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137
  1. import json
  2. from .common import InfoExtractor
  3. from ..utils import float_or_none, parse_iso8601, str_or_none, try_call
  4. from ..utils.traversal import traverse_obj
  5. class PrankCastIE(InfoExtractor):
  6. _VALID_URL = r'https?://(?:www\.)?prankcast\.com/[^/?#]+/showreel/(?P<id>\d+)-(?P<display_id>[^/?#]+)'
  7. _TESTS = [{
  8. 'url': 'https://prankcast.com/Devonanustart/showreel/1561-Beverly-is-back-like-a-heart-attack-',
  9. 'info_dict': {
  10. 'id': '1561',
  11. 'ext': 'mp3',
  12. 'title': 'Beverly is back like a heart attack!',
  13. 'display_id': 'Beverly-is-back-like-a-heart-attack-',
  14. 'timestamp': 1661391575,
  15. 'uploader': 'Devonanustart',
  16. 'channel_id': '4',
  17. 'duration': 7918,
  18. 'cast': ['Devonanustart', 'Phonelosers'],
  19. 'description': '',
  20. 'categories': ['prank'],
  21. 'tags': ['prank call', 'prank', 'live show'],
  22. 'upload_date': '20220825',
  23. },
  24. }, {
  25. 'url': 'https://prankcast.com/phonelosers/showreel/2048-NOT-COOL',
  26. 'info_dict': {
  27. 'id': '2048',
  28. 'ext': 'mp3',
  29. 'title': 'NOT COOL',
  30. 'display_id': 'NOT-COOL',
  31. 'timestamp': 1665028364,
  32. 'uploader': 'phonelosers',
  33. 'channel_id': '6',
  34. 'duration': 4044,
  35. 'cast': ['phonelosers'],
  36. 'description': '',
  37. 'categories': ['prank'],
  38. 'tags': ['prank call', 'prank', 'live show'],
  39. 'upload_date': '20221006',
  40. },
  41. }]
  42. def _real_extract(self, url):
  43. video_id, display_id = self._match_valid_url(url).group('id', 'display_id')
  44. webpage = self._download_webpage(url, video_id)
  45. json_info = self._search_nextjs_data(webpage, video_id)['props']['pageProps']['ssr_data_showreel']
  46. uploader = json_info.get('user_name')
  47. guests_json = self._parse_json(json_info.get('guests_json') or '{}', video_id)
  48. start_date = parse_iso8601(json_info.get('start_date'))
  49. return {
  50. 'id': video_id,
  51. 'title': json_info.get('broadcast_title') or self._og_search_title(webpage),
  52. 'display_id': display_id,
  53. 'url': f'{json_info["broadcast_url"]}{json_info["recording_hash"]}.mp3',
  54. 'timestamp': start_date,
  55. 'uploader': uploader,
  56. 'channel_id': str_or_none(json_info.get('user_id')),
  57. 'duration': try_call(lambda: parse_iso8601(json_info['end_date']) - start_date),
  58. 'cast': list(filter(None, [uploader, *traverse_obj(guests_json, (..., 'name'))])),
  59. 'description': json_info.get('broadcast_description'),
  60. 'categories': [json_info.get('broadcast_category')],
  61. 'tags': try_call(lambda: json_info['broadcast_tags'].split(',')),
  62. }
  63. class PrankCastPostIE(InfoExtractor):
  64. _VALID_URL = r'https?://(?:www\.)?prankcast\.com/[^/?#]+/posts/(?P<id>\d+)-(?P<display_id>[^/?#]+)'
  65. _TESTS = [{
  66. 'url': 'https://prankcast.com/devonanustart/posts/6214-happy-national-rachel-day-',
  67. 'info_dict': {
  68. 'id': '6214',
  69. 'ext': 'mp3',
  70. 'title': 'Happy National Rachel Day!',
  71. 'display_id': 'happy-national-rachel-day-',
  72. 'timestamp': 1704333938,
  73. 'uploader': 'Devonanustart',
  74. 'channel_id': '4',
  75. 'duration': 13175,
  76. 'cast': ['Devonanustart'],
  77. 'description': '',
  78. 'categories': ['prank call'],
  79. 'upload_date': '20240104',
  80. },
  81. }, {
  82. 'url': 'https://prankcast.com/despicabledogs/posts/6217-jake-the-work-crow-',
  83. 'info_dict': {
  84. 'id': '6217',
  85. 'ext': 'mp3',
  86. 'title': 'Jake the Work Crow!',
  87. 'display_id': 'jake-the-work-crow-',
  88. 'timestamp': 1704346592,
  89. 'uploader': 'despicabledogs',
  90. 'channel_id': '957',
  91. 'duration': 263.287,
  92. 'cast': ['despicabledogs'],
  93. 'description': 'https://imgur.com/a/vtxLvKU',
  94. 'categories': [],
  95. 'upload_date': '20240104',
  96. },
  97. }]
  98. def _real_extract(self, url):
  99. video_id, display_id = self._match_valid_url(url).group('id', 'display_id')
  100. webpage = self._download_webpage(url, video_id)
  101. post = self._search_nextjs_data(webpage, video_id)['props']['pageProps']['ssr_data_posts']
  102. content = self._parse_json(post['post_contents_json'], video_id)[0]
  103. uploader = post.get('user_name')
  104. guests_json = traverse_obj(content, ('guests_json', {json.loads}, {dict})) or {}
  105. return {
  106. 'id': video_id,
  107. 'title': post.get('post_title') or self._og_search_title(webpage),
  108. 'display_id': display_id,
  109. 'url': content.get('url'),
  110. 'timestamp': parse_iso8601(content.get('start_date') or content.get('crdate'), ' '),
  111. 'uploader': uploader,
  112. 'channel_id': str_or_none(post.get('user_id')),
  113. 'duration': float_or_none(content.get('duration')),
  114. 'cast': list(filter(None, [uploader, *traverse_obj(guests_json, (..., 'name'))])),
  115. 'description': post.get('post_body'),
  116. 'categories': list(filter(None, [content.get('category')])),
  117. 'tags': try_call(lambda: list(filter('', post['post_tags'].split(',')))),
  118. 'subtitles': {
  119. 'live_chat': [{
  120. 'url': f'https://prankcast.com/api/private/chat/select-broadcast?id={post["content_id"]}&cache=',
  121. 'ext': 'json',
  122. }],
  123. } if post.get('content_id') else None,
  124. }