ism.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284
  1. import binascii
  2. import io
  3. import struct
  4. import time
  5. from .fragment import FragmentFD
  6. from ..compat import compat_urllib_error
  7. u8 = struct.Struct('>B')
  8. u88 = struct.Struct('>Bx')
  9. u16 = struct.Struct('>H')
  10. u1616 = struct.Struct('>Hxx')
  11. u32 = struct.Struct('>I')
  12. u64 = struct.Struct('>Q')
  13. s88 = struct.Struct('>bx')
  14. s16 = struct.Struct('>h')
  15. s1616 = struct.Struct('>hxx')
  16. s32 = struct.Struct('>i')
  17. unity_matrix = (s32.pack(0x10000) + s32.pack(0) * 3) * 2 + s32.pack(0x40000000)
  18. TRACK_ENABLED = 0x1
  19. TRACK_IN_MOVIE = 0x2
  20. TRACK_IN_PREVIEW = 0x4
  21. SELF_CONTAINED = 0x1
  22. def box(box_type, payload):
  23. return u32.pack(8 + len(payload)) + box_type + payload
  24. def full_box(box_type, version, flags, payload):
  25. return box(box_type, u8.pack(version) + u32.pack(flags)[1:] + payload)
  26. def write_piff_header(stream, params):
  27. track_id = params['track_id']
  28. fourcc = params['fourcc']
  29. duration = params['duration']
  30. timescale = params.get('timescale', 10000000)
  31. language = params.get('language', 'und')
  32. height = params.get('height', 0)
  33. width = params.get('width', 0)
  34. stream_type = params['stream_type']
  35. creation_time = modification_time = int(time.time())
  36. ftyp_payload = b'isml' # major brand
  37. ftyp_payload += u32.pack(1) # minor version
  38. ftyp_payload += b'piff' + b'iso2' # compatible brands
  39. stream.write(box(b'ftyp', ftyp_payload)) # File Type Box
  40. mvhd_payload = u64.pack(creation_time)
  41. mvhd_payload += u64.pack(modification_time)
  42. mvhd_payload += u32.pack(timescale)
  43. mvhd_payload += u64.pack(duration)
  44. mvhd_payload += s1616.pack(1) # rate
  45. mvhd_payload += s88.pack(1) # volume
  46. mvhd_payload += u16.pack(0) # reserved
  47. mvhd_payload += u32.pack(0) * 2 # reserved
  48. mvhd_payload += unity_matrix
  49. mvhd_payload += u32.pack(0) * 6 # pre defined
  50. mvhd_payload += u32.pack(0xffffffff) # next track id
  51. moov_payload = full_box(b'mvhd', 1, 0, mvhd_payload) # Movie Header Box
  52. tkhd_payload = u64.pack(creation_time)
  53. tkhd_payload += u64.pack(modification_time)
  54. tkhd_payload += u32.pack(track_id) # track id
  55. tkhd_payload += u32.pack(0) # reserved
  56. tkhd_payload += u64.pack(duration)
  57. tkhd_payload += u32.pack(0) * 2 # reserved
  58. tkhd_payload += s16.pack(0) # layer
  59. tkhd_payload += s16.pack(0) # alternate group
  60. tkhd_payload += s88.pack(1 if stream_type == 'audio' else 0) # volume
  61. tkhd_payload += u16.pack(0) # reserved
  62. tkhd_payload += unity_matrix
  63. tkhd_payload += u1616.pack(width)
  64. tkhd_payload += u1616.pack(height)
  65. trak_payload = full_box(b'tkhd', 1, TRACK_ENABLED | TRACK_IN_MOVIE | TRACK_IN_PREVIEW, tkhd_payload) # Track Header Box
  66. mdhd_payload = u64.pack(creation_time)
  67. mdhd_payload += u64.pack(modification_time)
  68. mdhd_payload += u32.pack(timescale)
  69. mdhd_payload += u64.pack(duration)
  70. mdhd_payload += u16.pack(((ord(language[0]) - 0x60) << 10) | ((ord(language[1]) - 0x60) << 5) | (ord(language[2]) - 0x60))
  71. mdhd_payload += u16.pack(0) # pre defined
  72. mdia_payload = full_box(b'mdhd', 1, 0, mdhd_payload) # Media Header Box
  73. hdlr_payload = u32.pack(0) # pre defined
  74. if stream_type == 'audio': # handler type
  75. hdlr_payload += b'soun'
  76. hdlr_payload += u32.pack(0) * 3 # reserved
  77. hdlr_payload += b'SoundHandler\0' # name
  78. elif stream_type == 'video':
  79. hdlr_payload += b'vide'
  80. hdlr_payload += u32.pack(0) * 3 # reserved
  81. hdlr_payload += b'VideoHandler\0' # name
  82. elif stream_type == 'text':
  83. hdlr_payload += b'subt'
  84. hdlr_payload += u32.pack(0) * 3 # reserved
  85. hdlr_payload += b'SubtitleHandler\0' # name
  86. else:
  87. assert False
  88. mdia_payload += full_box(b'hdlr', 0, 0, hdlr_payload) # Handler Reference Box
  89. if stream_type == 'audio':
  90. smhd_payload = s88.pack(0) # balance
  91. smhd_payload += u16.pack(0) # reserved
  92. media_header_box = full_box(b'smhd', 0, 0, smhd_payload) # Sound Media Header
  93. elif stream_type == 'video':
  94. vmhd_payload = u16.pack(0) # graphics mode
  95. vmhd_payload += u16.pack(0) * 3 # opcolor
  96. media_header_box = full_box(b'vmhd', 0, 1, vmhd_payload) # Video Media Header
  97. elif stream_type == 'text':
  98. media_header_box = full_box(b'sthd', 0, 0, b'') # Subtitle Media Header
  99. else:
  100. assert False
  101. minf_payload = media_header_box
  102. dref_payload = u32.pack(1) # entry count
  103. dref_payload += full_box(b'url ', 0, SELF_CONTAINED, b'') # Data Entry URL Box
  104. dinf_payload = full_box(b'dref', 0, 0, dref_payload) # Data Reference Box
  105. minf_payload += box(b'dinf', dinf_payload) # Data Information Box
  106. stsd_payload = u32.pack(1) # entry count
  107. sample_entry_payload = u8.pack(0) * 6 # reserved
  108. sample_entry_payload += u16.pack(1) # data reference index
  109. if stream_type == 'audio':
  110. sample_entry_payload += u32.pack(0) * 2 # reserved
  111. sample_entry_payload += u16.pack(params.get('channels', 2))
  112. sample_entry_payload += u16.pack(params.get('bits_per_sample', 16))
  113. sample_entry_payload += u16.pack(0) # pre defined
  114. sample_entry_payload += u16.pack(0) # reserved
  115. sample_entry_payload += u1616.pack(params['sampling_rate'])
  116. if fourcc == 'AACL':
  117. sample_entry_box = box(b'mp4a', sample_entry_payload)
  118. elif stream_type == 'video':
  119. sample_entry_payload += u16.pack(0) # pre defined
  120. sample_entry_payload += u16.pack(0) # reserved
  121. sample_entry_payload += u32.pack(0) * 3 # pre defined
  122. sample_entry_payload += u16.pack(width)
  123. sample_entry_payload += u16.pack(height)
  124. sample_entry_payload += u1616.pack(0x48) # horiz resolution 72 dpi
  125. sample_entry_payload += u1616.pack(0x48) # vert resolution 72 dpi
  126. sample_entry_payload += u32.pack(0) # reserved
  127. sample_entry_payload += u16.pack(1) # frame count
  128. sample_entry_payload += u8.pack(0) * 32 # compressor name
  129. sample_entry_payload += u16.pack(0x18) # depth
  130. sample_entry_payload += s16.pack(-1) # pre defined
  131. codec_private_data = binascii.unhexlify(params['codec_private_data'].encode())
  132. if fourcc in ('H264', 'AVC1'):
  133. sps, pps = codec_private_data.split(u32.pack(1))[1:]
  134. avcc_payload = u8.pack(1) # configuration version
  135. avcc_payload += sps[1:4] # avc profile indication + profile compatibility + avc level indication
  136. avcc_payload += u8.pack(0xfc | (params.get('nal_unit_length_field', 4) - 1)) # complete representation (1) + reserved (11111) + length size minus one
  137. avcc_payload += u8.pack(1) # reserved (0) + number of sps (0000001)
  138. avcc_payload += u16.pack(len(sps))
  139. avcc_payload += sps
  140. avcc_payload += u8.pack(1) # number of pps
  141. avcc_payload += u16.pack(len(pps))
  142. avcc_payload += pps
  143. sample_entry_payload += box(b'avcC', avcc_payload) # AVC Decoder Configuration Record
  144. sample_entry_box = box(b'avc1', sample_entry_payload) # AVC Simple Entry
  145. else:
  146. assert False
  147. elif stream_type == 'text':
  148. if fourcc == 'TTML':
  149. sample_entry_payload += b'http://www.w3.org/ns/ttml\0' # namespace
  150. sample_entry_payload += b'\0' # schema location
  151. sample_entry_payload += b'\0' # auxilary mime types(??)
  152. sample_entry_box = box(b'stpp', sample_entry_payload)
  153. else:
  154. assert False
  155. else:
  156. assert False
  157. stsd_payload += sample_entry_box
  158. stbl_payload = full_box(b'stsd', 0, 0, stsd_payload) # Sample Description Box
  159. stts_payload = u32.pack(0) # entry count
  160. stbl_payload += full_box(b'stts', 0, 0, stts_payload) # Decoding Time to Sample Box
  161. stsc_payload = u32.pack(0) # entry count
  162. stbl_payload += full_box(b'stsc', 0, 0, stsc_payload) # Sample To Chunk Box
  163. stco_payload = u32.pack(0) # entry count
  164. stbl_payload += full_box(b'stco', 0, 0, stco_payload) # Chunk Offset Box
  165. minf_payload += box(b'stbl', stbl_payload) # Sample Table Box
  166. mdia_payload += box(b'minf', minf_payload) # Media Information Box
  167. trak_payload += box(b'mdia', mdia_payload) # Media Box
  168. moov_payload += box(b'trak', trak_payload) # Track Box
  169. mehd_payload = u64.pack(duration)
  170. mvex_payload = full_box(b'mehd', 1, 0, mehd_payload) # Movie Extends Header Box
  171. trex_payload = u32.pack(track_id) # track id
  172. trex_payload += u32.pack(1) # default sample description index
  173. trex_payload += u32.pack(0) # default sample duration
  174. trex_payload += u32.pack(0) # default sample size
  175. trex_payload += u32.pack(0) # default sample flags
  176. mvex_payload += full_box(b'trex', 0, 0, trex_payload) # Track Extends Box
  177. moov_payload += box(b'mvex', mvex_payload) # Movie Extends Box
  178. stream.write(box(b'moov', moov_payload)) # Movie Box
  179. def extract_box_data(data, box_sequence):
  180. data_reader = io.BytesIO(data)
  181. while True:
  182. box_size = u32.unpack(data_reader.read(4))[0]
  183. box_type = data_reader.read(4)
  184. if box_type == box_sequence[0]:
  185. box_data = data_reader.read(box_size - 8)
  186. if len(box_sequence) == 1:
  187. return box_data
  188. return extract_box_data(box_data, box_sequence[1:])
  189. data_reader.seek(box_size - 8, 1)
  190. class IsmFD(FragmentFD):
  191. """
  192. Download segments in a ISM manifest
  193. """
  194. def real_download(self, filename, info_dict):
  195. segments = info_dict['fragments'][:1] if self.params.get(
  196. 'test', False) else info_dict['fragments']
  197. ctx = {
  198. 'filename': filename,
  199. 'total_frags': len(segments),
  200. }
  201. self._prepare_and_start_frag_download(ctx, info_dict)
  202. extra_state = ctx.setdefault('extra_state', {
  203. 'ism_track_written': False,
  204. })
  205. fragment_retries = self.params.get('fragment_retries', 0)
  206. skip_unavailable_fragments = self.params.get('skip_unavailable_fragments', True)
  207. frag_index = 0
  208. for i, segment in enumerate(segments):
  209. frag_index += 1
  210. if frag_index <= ctx['fragment_index']:
  211. continue
  212. count = 0
  213. while count <= fragment_retries:
  214. try:
  215. success = self._download_fragment(ctx, segment['url'], info_dict)
  216. if not success:
  217. return False
  218. frag_content = self._read_fragment(ctx)
  219. if not extra_state['ism_track_written']:
  220. tfhd_data = extract_box_data(frag_content, [b'moof', b'traf', b'tfhd'])
  221. info_dict['_download_params']['track_id'] = u32.unpack(tfhd_data[4:8])[0]
  222. write_piff_header(ctx['dest_stream'], info_dict['_download_params'])
  223. extra_state['ism_track_written'] = True
  224. self._append_fragment(ctx, frag_content)
  225. break
  226. except compat_urllib_error.HTTPError as err:
  227. count += 1
  228. if count <= fragment_retries:
  229. self.report_retry_fragment(err, frag_index, count, fragment_retries)
  230. if count > fragment_retries:
  231. if skip_unavailable_fragments:
  232. self.report_skip_fragment(frag_index)
  233. continue
  234. self.report_error('giving up after %s fragment retries' % fragment_retries)
  235. return False
  236. self._finish_frag_download(ctx, info_dict)
  237. return True