brilliantpala.py 5.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136
  1. import hashlib
  2. from .common import InfoExtractor
  3. from ..utils import (
  4. ExtractorError,
  5. traverse_obj,
  6. urlencode_postdata,
  7. )
  8. class BrilliantpalaBaseIE(InfoExtractor):
  9. _NETRC_MACHINE = 'brilliantpala'
  10. _DOMAIN = '{subdomain}.brilliantpala.org'
  11. def _initialize_pre_login(self):
  12. self._HOMEPAGE = f'https://{self._DOMAIN}'
  13. self._LOGIN_API = f'{self._HOMEPAGE}/login/'
  14. self._LOGOUT_DEVICES_API = f'{self._HOMEPAGE}/logout_devices/?next=/'
  15. self._CONTENT_API = f'{self._HOMEPAGE}/api/v2.4/contents/{{content_id}}/'
  16. self._HLS_AES_URI = f'{self._HOMEPAGE}/api/v2.5/video_contents/{{content_id}}/key/'
  17. def _get_logged_in_username(self, url, video_id):
  18. webpage, urlh = self._download_webpage_handle(url, video_id)
  19. if urlh.url.startswith(self._LOGIN_API):
  20. self.raise_login_required()
  21. return self._html_search_regex(
  22. r'"username"\s*:\s*"(?P<username>[^"]+)"', webpage, 'logged-in username')
  23. def _perform_login(self, username, password):
  24. login_page, urlh = self._download_webpage_handle(
  25. self._LOGIN_API, None, 'Downloading login page', expected_status=401)
  26. if urlh.status != 401 and not urlh.url.startswith(self._LOGIN_API):
  27. self.write_debug('Cookies are valid, no login required.')
  28. return
  29. if urlh.status == 401:
  30. self.write_debug('Got HTTP Error 401; cookies have been invalidated')
  31. login_page = self._download_webpage(self._LOGIN_API, None, 'Re-downloading login page')
  32. login_form = self._hidden_inputs(login_page)
  33. login_form.update({
  34. 'username': username,
  35. 'password': password,
  36. })
  37. self._set_cookie(self._DOMAIN, 'csrftoken', login_form['csrfmiddlewaretoken'])
  38. logged_page = self._download_webpage(
  39. self._LOGIN_API, None, note='Logging in', headers={'Referer': self._LOGIN_API},
  40. data=urlencode_postdata(login_form))
  41. if self._html_search_regex(
  42. r'(Your username / email and password)', logged_page, 'auth fail', default=None):
  43. raise ExtractorError('wrong username or password', expected=True)
  44. # the maximum number of logins is one
  45. if self._html_search_regex(
  46. r'(Logout Other Devices)', logged_page, 'logout devices button', default=None):
  47. logout_device_form = self._hidden_inputs(logged_page)
  48. self._download_webpage(
  49. self._LOGOUT_DEVICES_API, None, headers={'Referer': self._LOGIN_API},
  50. note='Logging out other devices', data=urlencode_postdata(logout_device_form))
  51. def _real_extract(self, url):
  52. course_id, content_id = self._match_valid_url(url).group('course_id', 'content_id')
  53. video_id = f'{course_id}-{content_id}'
  54. username = self._get_logged_in_username(url, video_id)
  55. content_json = self._download_json(
  56. self._CONTENT_API.format(content_id=content_id), video_id,
  57. note='Fetching content info', errnote='Unable to fetch content info')
  58. entries = []
  59. for stream in traverse_obj(content_json, ('video', 'streams', lambda _, v: v['id'] and v['url'])):
  60. formats = self._extract_m3u8_formats(stream['url'], video_id, fatal=False)
  61. if not formats:
  62. continue
  63. entries.append({
  64. 'id': str(stream['id']),
  65. 'title': content_json.get('title'),
  66. 'formats': formats,
  67. 'hls_aes': {'uri': self._HLS_AES_URI.format(content_id=content_id)},
  68. 'http_headers': {'X-Key': hashlib.sha256(username.encode('ascii')).hexdigest()},
  69. 'thumbnail': content_json.get('cover_image'),
  70. })
  71. return self.playlist_result(
  72. entries, playlist_id=video_id, playlist_title=content_json.get('title'))
  73. class BrilliantpalaElearnIE(BrilliantpalaBaseIE):
  74. IE_NAME = 'Brilliantpala:Elearn'
  75. IE_DESC = 'VoD on elearn.brilliantpala.org'
  76. _VALID_URL = r'https?://elearn\.brilliantpala\.org/courses/(?P<course_id>\d+)/contents/(?P<content_id>\d+)/?'
  77. _TESTS = [{
  78. 'url': 'https://elearn.brilliantpala.org/courses/42/contents/12345/',
  79. 'only_matching': True,
  80. }, {
  81. 'url': 'https://elearn.brilliantpala.org/courses/98/contents/36683/',
  82. 'info_dict': {
  83. 'id': '23577',
  84. 'ext': 'mp4',
  85. 'title': 'Physical World, Units and Measurements - 1',
  86. 'thumbnail': 'https://d1j3vi2u94ebt0.cloudfront.net/institute/brilliantpalalms/chapter_contents/26237/e657f81b90874be19795c7ea081f8d5c.png',
  87. 'live_status': 'not_live',
  88. },
  89. 'params': {
  90. 'skip_download': True,
  91. },
  92. }]
  93. _DOMAIN = BrilliantpalaBaseIE._DOMAIN.format(subdomain='elearn')
  94. class BrilliantpalaClassesIE(BrilliantpalaBaseIE):
  95. IE_NAME = 'Brilliantpala:Classes'
  96. IE_DESC = 'VoD on classes.brilliantpala.org'
  97. _VALID_URL = r'https?://classes\.brilliantpala\.org/courses/(?P<course_id>\d+)/contents/(?P<content_id>\d+)/?'
  98. _TESTS = [{
  99. 'url': 'https://classes.brilliantpala.org/courses/42/contents/12345/',
  100. 'only_matching': True,
  101. }, {
  102. 'url': 'https://classes.brilliantpala.org/courses/416/contents/25445/',
  103. 'info_dict': {
  104. 'id': '9128',
  105. 'ext': 'mp4',
  106. 'title': 'Motion in a Straight Line - Class 1',
  107. 'thumbnail': 'https://d3e4y8hquds3ek.cloudfront.net/institute/brilliantpalaelearn/chapter_contents/ff5ba838d0ec43419f67387fe1a01fa8.png',
  108. 'live_status': 'not_live',
  109. },
  110. 'params': {
  111. 'skip_download': True,
  112. },
  113. }]
  114. _DOMAIN = BrilliantpalaBaseIE._DOMAIN.format(subdomain='classes')