fathom.py 1.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354
  1. import json
  2. from .common import InfoExtractor
  3. from ..utils import (
  4. extract_attributes,
  5. float_or_none,
  6. get_element_html_by_id,
  7. parse_iso8601,
  8. )
  9. from ..utils.traversal import traverse_obj
  10. class FathomIE(InfoExtractor):
  11. _VALID_URL = r'https?://(?:www\.)?fathom\.video/share/(?P<id>[^/?#&]+)'
  12. _TESTS = [{
  13. 'url': 'https://fathom.video/share/G9mkjkspnohVVZ_L5nrsoPycyWcB8y7s',
  14. 'md5': '0decd5343b8f30ae268625e79a02b60f',
  15. 'info_dict': {
  16. 'id': '47200596',
  17. 'ext': 'mp4',
  18. 'title': 'eCom Inucbator - Coaching Session',
  19. 'duration': 8125.380507,
  20. 'timestamp': 1699048914,
  21. 'upload_date': '20231103',
  22. },
  23. }, {
  24. 'url': 'https://fathom.video/share/mEws3bybftHL2QLymxYEDeE21vtLxGVm',
  25. 'md5': '4f5cb382126c22d1aba8a939f9c49690',
  26. 'info_dict': {
  27. 'id': '46812957',
  28. 'ext': 'mp4',
  29. 'title': 'Jon, Lawrence, Neman chat about practice',
  30. 'duration': 3571.517847,
  31. 'timestamp': 1698933600,
  32. 'upload_date': '20231102',
  33. },
  34. }]
  35. def _real_extract(self, url):
  36. display_id = self._match_id(url)
  37. webpage = self._download_webpage(url, display_id)
  38. props = traverse_obj(
  39. get_element_html_by_id('app', webpage), ({extract_attributes}, 'data-page', {json.loads}, 'props'))
  40. video_id = str(props['call']['id'])
  41. return {
  42. 'id': video_id,
  43. 'formats': self._extract_m3u8_formats(props['call']['video_url'], video_id, 'mp4'),
  44. **traverse_obj(props, {
  45. 'title': ('head', 'title', {str}),
  46. 'duration': ('duration', {float_or_none}),
  47. 'timestamp': ('call', 'started_at', {parse_iso8601}),
  48. }),
  49. }