karaoketv.py 2.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061
  1. from .common import InfoExtractor
  2. class KaraoketvIE(InfoExtractor):
  3. _VALID_URL = r'https?://(?:www\.)?karaoketv\.co\.il/[^/]+/(?P<id>\d+)'
  4. _TEST = {
  5. 'url': 'http://www.karaoketv.co.il/%D7%A9%D7%99%D7%A8%D7%99_%D7%A7%D7%A8%D7%99%D7%95%D7%A7%D7%99/58356/%D7%90%D7%99%D7%96%D7%95%D7%9F',
  6. 'info_dict': {
  7. 'id': '58356',
  8. 'ext': 'flv',
  9. 'title': 'קריוקי של איזון',
  10. },
  11. 'params': {
  12. # rtmp download
  13. 'skip_download': True,
  14. },
  15. }
  16. def _real_extract(self, url):
  17. video_id = self._match_id(url)
  18. webpage = self._download_webpage(url, video_id)
  19. api_page_url = self._search_regex(
  20. r'<iframe[^>]+src=(["\'])(?P<url>https?://www\.karaoke\.co\.il/api_play\.php\?.+?)\1',
  21. webpage, 'API play URL', group='url')
  22. api_page = self._download_webpage(api_page_url, video_id)
  23. video_cdn_url = self._search_regex(
  24. r'<iframe[^>]+src=(["\'])(?P<url>https?://www\.video-cdn\.com/embed/iframe/.+?)\1',
  25. api_page, 'video cdn URL', group='url')
  26. video_cdn = self._download_webpage(video_cdn_url, video_id)
  27. play_path = self._parse_json(
  28. self._search_regex(
  29. r'var\s+options\s*=\s*({.+?});', video_cdn, 'options'),
  30. video_id)['clip']['url']
  31. settings = self._parse_json(
  32. self._search_regex(
  33. r'var\s+settings\s*=\s*({.+?});', video_cdn, 'servers', default='{}'),
  34. video_id, fatal=False) or {}
  35. servers = settings.get('servers')
  36. if not servers or not isinstance(servers, list):
  37. servers = ('wowzail.video-cdn.com:80/vodcdn', )
  38. formats = [{
  39. 'url': f'rtmp://{server}' if not server.startswith('rtmp') else server,
  40. 'play_path': play_path,
  41. 'app': 'vodcdn',
  42. 'page_url': video_cdn_url,
  43. 'player_url': 'http://www.video-cdn.com/assets/flowplayer/flowplayer.commercial-3.2.18.swf',
  44. 'rtmp_real_time': True,
  45. 'ext': 'flv',
  46. } for server in servers]
  47. return {
  48. 'id': video_id,
  49. 'title': self._og_search_title(webpage),
  50. 'formats': formats,
  51. }