# trtcocuk.py (1.9 KB)
  1. from .common import InfoExtractor
  2. from ..utils import ExtractorError, int_or_none, parse_iso8601, traverse_obj
  3. class TrtCocukVideoIE(InfoExtractor):
  4. _VALID_URL = r'https?://www\.trtcocuk\.net\.tr/video/(?P<id>[\w-]+)'
  5. _TESTS = [{
  6. 'url': 'https://www.trtcocuk.net.tr/video/kaptan-pengu-ve-arkadaslari-1',
  7. 'info_dict': {
  8. 'id': '3789738',
  9. 'ext': 'mp4',
  10. 'season_number': 1,
  11. 'series': '"Kaptan Pengu ve Arkadaşları"',
  12. 'season': 'Season 1',
  13. 'title': 'Kaptan Pengu ve Arkadaşları 1 Bölüm İzle TRT Çocuk',
  14. 'release_date': '20201209',
  15. 'release_timestamp': 1607513774,
  16. },
  17. }, {
  18. 'url': 'https://www.trtcocuk.net.tr/video/sef-rokanin-lezzet-dunyasi-17',
  19. 'info_dict': {
  20. 'id': '10260842',
  21. 'ext': 'mp4',
  22. 'series': '"Şef Roka\'nın Lezzet Dünyası"',
  23. 'title': 'Şef Roka\'nın Lezzet Dünyası 17 Bölüm İzle TRT Çocuk',
  24. },
  25. }]
  26. def _real_extract(self, url):
  27. display_id = self._match_id(url)
  28. webpage = self._download_webpage(url, display_id)
  29. nuxtjs_data = self._search_nuxt_data(webpage, display_id)['data']
  30. try:
  31. video_url = self._parse_json(nuxtjs_data['video'], display_id)
  32. except ExtractorError:
  33. video_url = nuxtjs_data['video']
  34. formats, subtitles = self._extract_m3u8_formats_and_subtitles(video_url, display_id)
  35. return {
  36. 'id': str(nuxtjs_data['id']),
  37. 'formats': formats,
  38. 'subtitles': subtitles,
  39. 'season_number': int_or_none(nuxtjs_data.get('season')),
  40. 'release_timestamp': parse_iso8601(nuxtjs_data.get('publishedDate')),
  41. 'series': traverse_obj(nuxtjs_data, ('show', 0, 'title')),
  42. 'title': self._html_extract_title(webpage), # TODO: get better title
  43. }