musicdex.py 7.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174
  1. from .common import InfoExtractor
  2. from ..utils import (
  3. date_from_str,
  4. format_field,
  5. try_get,
  6. unified_strdate,
  7. )
  8. class MusicdexBaseIE(InfoExtractor):
  9. def _return_info(self, track_json, album_json, video_id):
  10. return {
  11. 'id': str(video_id),
  12. 'title': track_json.get('name'),
  13. 'track': track_json.get('name'),
  14. 'description': track_json.get('description'),
  15. 'track_number': track_json.get('number'),
  16. 'url': format_field(track_json, 'url', 'https://www.musicdex.org/%s'),
  17. 'duration': track_json.get('duration'),
  18. 'genres': [genre.get('name') for genre in track_json.get('genres') or []],
  19. 'like_count': track_json.get('likes_count'),
  20. 'view_count': track_json.get('plays'),
  21. 'artists': [artist.get('name') for artist in track_json.get('artists') or []],
  22. 'album_artists': [artist.get('name') for artist in album_json.get('artists') or []],
  23. 'thumbnail': format_field(album_json, 'image', 'https://www.musicdex.org/%s'),
  24. 'album': album_json.get('name'),
  25. 'release_year': try_get(album_json, lambda x: date_from_str(unified_strdate(x['release_date'])).year),
  26. 'extractor_key': MusicdexSongIE.ie_key(),
  27. 'extractor': 'MusicdexSong',
  28. }
  29. class MusicdexSongIE(MusicdexBaseIE):
  30. _VALID_URL = r'https?://(?:www\.)?musicdex\.org/track/(?P<id>\d+)'
  31. _TESTS = [{
  32. 'url': 'https://www.musicdex.org/track/306/dual-existence',
  33. 'info_dict': {
  34. 'id': '306',
  35. 'ext': 'mp3',
  36. 'title': 'dual existence',
  37. 'description': '#NIPPONSEI @ IRC.RIZON.NET',
  38. 'track': 'dual existence',
  39. 'track_number': 1,
  40. 'duration': 266000,
  41. 'genres': ['Anime'],
  42. 'like_count': int,
  43. 'view_count': int,
  44. 'artists': ['fripSide'],
  45. 'album_artists': ['fripSide'],
  46. 'thumbnail': 'https://www.musicdex.org/storage/album/9iDIam1DHTVqUG4UclFIEq1WAFGXfPW4y0TtZa91.png',
  47. 'album': 'To Aru Kagaku no Railgun T OP2 Single - dual existence',
  48. 'release_year': 2020,
  49. },
  50. 'params': {'skip_download': True},
  51. }]
  52. def _real_extract(self, url):
  53. video_id = self._match_id(url)
  54. data_json = self._download_json(
  55. f'https://www.musicdex.org/secure/tracks/{video_id}?defaultRelations=true', video_id)['track']
  56. return self._return_info(data_json, data_json.get('album') or {}, video_id)
  57. class MusicdexAlbumIE(MusicdexBaseIE):
  58. _VALID_URL = r'https?://(?:www\.)?musicdex\.org/album/(?P<id>\d+)'
  59. _TESTS = [{
  60. 'url': 'https://www.musicdex.org/album/56/tenmon-and-eiichiro-yanagi-minori/ef-a-tale-of-memories-original-soundtrack-2-fortissimo',
  61. 'playlist_mincount': 28,
  62. 'info_dict': {
  63. 'id': '56',
  64. 'genres': ['OST'],
  65. 'view_count': int,
  66. 'artists': ['TENMON & Eiichiro Yanagi / minori'],
  67. 'title': 'ef - a tale of memories Original Soundtrack 2 ~fortissimo~',
  68. 'release_year': 2008,
  69. 'thumbnail': 'https://www.musicdex.org/storage/album/2rSHkyYBYfB7sbvElpEyTMcUn6toY7AohOgJuDlE.jpg',
  70. },
  71. }]
  72. def _real_extract(self, url):
  73. playlist_id = self._match_id(url)
  74. data_json = self._download_json(
  75. f'https://www.musicdex.org/secure/albums/{playlist_id}?defaultRelations=true', playlist_id)['album']
  76. entries = [self._return_info(track, data_json, track['id'])
  77. for track in data_json.get('tracks') or [] if track.get('id')]
  78. return {
  79. '_type': 'playlist',
  80. 'id': playlist_id,
  81. 'title': data_json.get('name'),
  82. 'description': data_json.get('description'),
  83. 'genres': [genre.get('name') for genre in data_json.get('genres') or []],
  84. 'view_count': data_json.get('plays'),
  85. 'artists': [artist.get('name') for artist in data_json.get('artists') or []],
  86. 'thumbnail': format_field(data_json, 'image', 'https://www.musicdex.org/%s'),
  87. 'release_year': try_get(data_json, lambda x: date_from_str(unified_strdate(x['release_date'])).year),
  88. 'entries': entries,
  89. }
  90. class MusicdexPageIE(MusicdexBaseIE): # XXX: Conventionally, base classes should end with BaseIE/InfoExtractor
  91. def _entries(self, playlist_id):
  92. next_page_url = self._API_URL % playlist_id
  93. while next_page_url:
  94. data_json = self._download_json(next_page_url, playlist_id)['pagination']
  95. yield from data_json.get('data') or []
  96. next_page_url = data_json.get('next_page_url')
  97. class MusicdexArtistIE(MusicdexPageIE):
  98. _VALID_URL = r'https?://(?:www\.)?musicdex\.org/artist/(?P<id>\d+)'
  99. _API_URL = 'https://www.musicdex.org/secure/artists/%s/albums?page=1'
  100. _TESTS = [{
  101. 'url': 'https://www.musicdex.org/artist/11/fripside',
  102. 'playlist_mincount': 28,
  103. 'info_dict': {
  104. 'id': '11',
  105. 'view_count': int,
  106. 'title': 'fripSide',
  107. 'thumbnail': 'https://www.musicdex.org/storage/artist/ZmOz0lN2vsweegB660em3xWffCjLPmTQHqJls5Xx.jpg',
  108. },
  109. }]
  110. def _real_extract(self, url):
  111. playlist_id = self._match_id(url)
  112. data_json = self._download_json(f'https://www.musicdex.org/secure/artists/{playlist_id}', playlist_id)['artist']
  113. entries = []
  114. for album in self._entries(playlist_id):
  115. entries.extend(self._return_info(track, album, track['id']) for track in album.get('tracks') or [] if track.get('id'))
  116. return {
  117. '_type': 'playlist',
  118. 'id': playlist_id,
  119. 'title': data_json.get('name'),
  120. 'view_count': data_json.get('plays'),
  121. 'thumbnail': format_field(data_json, 'image_small', 'https://www.musicdex.org/%s'),
  122. 'entries': entries,
  123. }
  124. class MusicdexPlaylistIE(MusicdexPageIE):
  125. _VALID_URL = r'https?://(?:www\.)?musicdex\.org/playlist/(?P<id>\d+)'
  126. _API_URL = 'https://www.musicdex.org/secure/playlists/%s/tracks?perPage=10000&page=1'
  127. _TESTS = [{
  128. 'url': 'https://www.musicdex.org/playlist/9/test',
  129. 'playlist_mincount': 73,
  130. 'info_dict': {
  131. 'id': '9',
  132. 'view_count': int,
  133. 'title': 'Test',
  134. 'thumbnail': 'https://www.musicdex.org/storage/album/jXATI79f0IbQ2sgsKYOYRCW3zRwF3XsfHhzITCuJ.jpg',
  135. 'description': 'Test 123 123 21312 32121321321321312',
  136. },
  137. }]
  138. def _real_extract(self, url):
  139. playlist_id = self._match_id(url)
  140. data_json = self._download_json(f'https://www.musicdex.org/secure/playlists/{playlist_id}', playlist_id)['playlist']
  141. entries = [self._return_info(track, track.get('album') or {}, track['id'])
  142. for track in self._entries(playlist_id) or [] if track.get('id')]
  143. return {
  144. '_type': 'playlist',
  145. 'id': playlist_id,
  146. 'title': data_json.get('name'),
  147. 'description': data_json.get('description'),
  148. 'view_count': data_json.get('plays'),
  149. 'thumbnail': format_field(data_json, 'image', 'https://www.musicdex.org/%s'),
  150. 'entries': entries,
  151. }