make_lazy_extractors.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128
  1. #!/usr/bin/env python3
  2. # Allow direct execution
  3. import os
  4. import sys
  5. sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
  6. import optparse
  7. from inspect import getsource
  8. NO_ATTR = object()
  9. STATIC_CLASS_PROPERTIES = ['IE_NAME', 'IE_DESC', 'SEARCH_KEY', '_WORKING', '_NETRC_MACHINE', 'age_limit']
  10. CLASS_METHODS = [
  11. 'ie_key', 'working', 'description', 'suitable', '_match_valid_url', '_match_id', 'get_temp_id', 'is_suitable'
  12. ]
  13. IE_TEMPLATE = '''
  14. class {name}({bases}):
  15. _module = {module!r}
  16. '''
  17. with open('devscripts/lazy_load_template.py', encoding='utf-8') as f:
  18. MODULE_TEMPLATE = f.read()
  19. def main():
  20. parser = optparse.OptionParser(usage='%prog [OUTFILE.py]')
  21. args = parser.parse_args()[1] or ['yt_dlp/extractor/lazy_extractors.py']
  22. if len(args) != 1:
  23. parser.error('Expected only an output filename')
  24. lazy_extractors_filename = args[0]
  25. if os.path.exists(lazy_extractors_filename):
  26. os.remove(lazy_extractors_filename)
  27. _ALL_CLASSES = get_all_ies() # Must be before import
  28. from yt_dlp.extractor.common import InfoExtractor, SearchInfoExtractor
  29. DummyInfoExtractor = type('InfoExtractor', (InfoExtractor,), {'IE_NAME': NO_ATTR})
  30. module_src = '\n'.join((
  31. MODULE_TEMPLATE,
  32. ' _module = None',
  33. *extra_ie_code(DummyInfoExtractor),
  34. '\nclass LazyLoadSearchExtractor(LazyLoadExtractor):\n pass\n',
  35. *build_ies(_ALL_CLASSES, (InfoExtractor, SearchInfoExtractor), DummyInfoExtractor),
  36. ))
  37. with open(lazy_extractors_filename, 'wt', encoding='utf-8') as f:
  38. f.write(f'{module_src}\n')
  39. def get_all_ies():
  40. PLUGINS_DIRNAME = 'ytdlp_plugins'
  41. BLOCKED_DIRNAME = f'{PLUGINS_DIRNAME}_blocked'
  42. if os.path.exists(PLUGINS_DIRNAME):
  43. os.rename(PLUGINS_DIRNAME, BLOCKED_DIRNAME)
  44. try:
  45. from yt_dlp.extractor.extractors import _ALL_CLASSES
  46. finally:
  47. if os.path.exists(BLOCKED_DIRNAME):
  48. os.rename(BLOCKED_DIRNAME, PLUGINS_DIRNAME)
  49. return _ALL_CLASSES
  50. def extra_ie_code(ie, base=None):
  51. for var in STATIC_CLASS_PROPERTIES:
  52. val = getattr(ie, var)
  53. if val != (getattr(base, var) if base else NO_ATTR):
  54. yield f' {var} = {val!r}'
  55. yield ''
  56. for name in CLASS_METHODS:
  57. f = getattr(ie, name)
  58. if not base or f.__func__ != getattr(base, name).__func__:
  59. yield getsource(f)
  60. def build_ies(ies, bases, attr_base):
  61. names = []
  62. for ie in sort_ies(ies, bases):
  63. yield build_lazy_ie(ie, ie.__name__, attr_base)
  64. if ie in ies:
  65. names.append(ie.__name__)
  66. yield f'\n_ALL_CLASSES = [{", ".join(names)}]'
  67. def sort_ies(ies, ignored_bases):
  68. """find the correct sorting and add the required base classes so that subclasses can be correctly created"""
  69. classes, returned_classes = ies[:-1], set()
  70. assert ies[-1].__name__ == 'GenericIE', 'Last IE must be GenericIE'
  71. while classes:
  72. for c in classes[:]:
  73. bases = set(c.__bases__) - {object, *ignored_bases}
  74. restart = False
  75. for b in sorted(bases, key=lambda x: x.__name__):
  76. if b not in classes and b not in returned_classes:
  77. assert b.__name__ != 'GenericIE', 'Cannot inherit from GenericIE'
  78. classes.insert(0, b)
  79. restart = True
  80. if restart:
  81. break
  82. if bases <= returned_classes:
  83. yield c
  84. returned_classes.add(c)
  85. classes.remove(c)
  86. break
  87. yield ies[-1]
  88. def build_lazy_ie(ie, name, attr_base):
  89. bases = ', '.join({
  90. 'InfoExtractor': 'LazyLoadExtractor',
  91. 'SearchInfoExtractor': 'LazyLoadSearchExtractor',
  92. }.get(base.__name__, base.__name__) for base in ie.__bases__)
  93. s = IE_TEMPLATE.format(name=name, module=ie.__module__, bases=bases)
  94. valid_url = getattr(ie, '_VALID_URL', None)
  95. if not valid_url and hasattr(ie, '_make_valid_url'):
  96. valid_url = ie._make_valid_url()
  97. if valid_url:
  98. s += f' _VALID_URL = {valid_url!r}\n'
  99. return s + '\n'.join(extra_ie_code(ie, attr_base))
# Run the generator only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()