oggenc.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360
  1. /*
  2. * Ogg muxer
  3. * Copyright (c) 2007 Baptiste Coudurier <baptiste dot coudurier at free dot fr>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "libavutil/crc.h"
  22. #include "libavcodec/xiph.h"
  23. #include "libavcodec/bytestream.h"
  24. #include "libavcodec/flac.h"
  25. #include "avformat.h"
  26. #include "internal.h"
  /**
   * Per-stream muxer state, stored in AVStream.priv_data.
   */
  typedef struct {
      /** granule of the most recent packet handed to ogg_write_packet() */
      int64_t duration;
      /** sequence number stamped into the next page, then incremented */
      unsigned page_counter;
      /** up to three header packets emitted by ogg_write_header() */
      uint8_t *header[3];
      /** byte length of each header packet; 0 means "no such header" */
      int header_len[3];

      /** for theora granule: width of the frames-since-keyframe field */
      int kfgshift;
      /** for theora granule: timestamp of the last key frame seen */
      int64_t last_kf_pts;
      /** for theora granule: byte 9 of the first Theora header */
      int vrev;

      /** set once the final packet of the stream is being flushed */
      int eos;
  } OGGStreamContext;
  38. static void ogg_update_checksum(AVFormatContext *s, int64_t crc_offset)
  39. {
  40. int64_t pos = url_ftell(s->pb);
  41. uint32_t checksum = get_checksum(s->pb);
  42. url_fseek(s->pb, crc_offset, SEEK_SET);
  43. put_be32(s->pb, checksum);
  44. url_fseek(s->pb, pos, SEEK_SET);
  45. }
  46. static int ogg_write_page(AVFormatContext *s, const uint8_t *data, int size,
  47. int64_t granule, int stream_index, int flags)
  48. {
  49. OGGStreamContext *oggstream = s->streams[stream_index]->priv_data;
  50. int64_t crc_offset;
  51. int page_segments, i;
  52. if (size >= 255*255) {
  53. granule = -1;
  54. size = 255*255;
  55. } else if (oggstream->eos)
  56. flags |= 4;
  57. page_segments = FFMIN((size/255)+!!size, 255);
  58. init_checksum(s->pb, ff_crc04C11DB7_update, 0);
  59. put_tag(s->pb, "OggS");
  60. put_byte(s->pb, 0);
  61. put_byte(s->pb, flags);
  62. put_le64(s->pb, granule);
  63. put_le32(s->pb, stream_index);
  64. put_le32(s->pb, oggstream->page_counter++);
  65. crc_offset = url_ftell(s->pb);
  66. put_le32(s->pb, 0); // crc
  67. put_byte(s->pb, page_segments);
  68. for (i = 0; i < page_segments-1; i++)
  69. put_byte(s->pb, 255);
  70. if (size) {
  71. put_byte(s->pb, size - (page_segments-1)*255);
  72. put_buffer(s->pb, data, size);
  73. }
  74. ogg_update_checksum(s, crc_offset);
  75. put_flush_packet(s->pb);
  76. return size;
  77. }
  78. static uint8_t *ogg_write_vorbiscomment(int offset, int bitexact,
  79. int *header_len)
  80. {
  81. const char *vendor = bitexact ? "ffmpeg" : LIBAVFORMAT_IDENT;
  82. int size;
  83. uint8_t *p, *p0;
  84. size = offset + 4 + strlen(vendor) + 4;
  85. p = av_mallocz(size);
  86. if (!p)
  87. return NULL;
  88. p0 = p;
  89. p += offset;
  90. bytestream_put_le32(&p, strlen(vendor));
  91. bytestream_put_buffer(&p, vendor, strlen(vendor));
  92. bytestream_put_le32(&p, 0); // user comment list length
  93. *header_len = size;
  94. return p0;
  95. }
  96. static int ogg_build_flac_headers(AVCodecContext *avctx,
  97. OGGStreamContext *oggstream, int bitexact)
  98. {
  99. enum FLACExtradataFormat format;
  100. uint8_t *streaminfo;
  101. uint8_t *p;
  102. if (!ff_flac_is_extradata_valid(avctx, &format, &streaminfo))
  103. return -1;
  104. // first packet: STREAMINFO
  105. oggstream->header_len[0] = 51;
  106. oggstream->header[0] = av_mallocz(51); // per ogg flac specs
  107. p = oggstream->header[0];
  108. if (!p)
  109. return AVERROR_NOMEM;
  110. bytestream_put_byte(&p, 0x7F);
  111. bytestream_put_buffer(&p, "FLAC", 4);
  112. bytestream_put_byte(&p, 1); // major version
  113. bytestream_put_byte(&p, 0); // minor version
  114. bytestream_put_be16(&p, 1); // headers packets without this one
  115. bytestream_put_buffer(&p, "fLaC", 4);
  116. bytestream_put_byte(&p, 0x00); // streaminfo
  117. bytestream_put_be24(&p, 34);
  118. bytestream_put_buffer(&p, streaminfo, FLAC_STREAMINFO_SIZE);
  119. // second packet: VorbisComment
  120. p = ogg_write_vorbiscomment(4, bitexact, &oggstream->header_len[1]);
  121. if (!p)
  122. return AVERROR_NOMEM;
  123. oggstream->header[1] = p;
  124. bytestream_put_byte(&p, 0x84); // last metadata block and vorbis comment
  125. bytestream_put_be24(&p, oggstream->header_len[1] - 4);
  126. return 0;
  127. }
  128. #define SPEEX_HEADER_SIZE 80
  129. static int ogg_build_speex_headers(AVCodecContext *avctx,
  130. OGGStreamContext *oggstream, int bitexact)
  131. {
  132. uint8_t *p;
  133. if (avctx->extradata_size < SPEEX_HEADER_SIZE)
  134. return -1;
  135. // first packet: Speex header
  136. p = av_mallocz(SPEEX_HEADER_SIZE);
  137. if (!p)
  138. return AVERROR_NOMEM;
  139. oggstream->header[0] = p;
  140. oggstream->header_len[0] = SPEEX_HEADER_SIZE;
  141. bytestream_put_buffer(&p, avctx->extradata, SPEEX_HEADER_SIZE);
  142. AV_WL32(&oggstream->header[0][68], 0); // set extra_headers to 0
  143. // second packet: VorbisComment
  144. p = ogg_write_vorbiscomment(0, bitexact, &oggstream->header_len[1]);
  145. if (!p)
  146. return AVERROR_NOMEM;
  147. oggstream->header[1] = p;
  148. return 0;
  149. }
  150. static int ogg_write_header(AVFormatContext *s)
  151. {
  152. OGGStreamContext *oggstream;
  153. int i, j;
  154. for (i = 0; i < s->nb_streams; i++) {
  155. AVStream *st = s->streams[i];
  156. if (st->codec->codec_type == CODEC_TYPE_AUDIO)
  157. av_set_pts_info(st, 64, 1, st->codec->sample_rate);
  158. else if (st->codec->codec_type == CODEC_TYPE_VIDEO)
  159. av_set_pts_info(st, 64, st->codec->time_base.num, st->codec->time_base.den);
  160. if (st->codec->codec_id != CODEC_ID_VORBIS &&
  161. st->codec->codec_id != CODEC_ID_THEORA &&
  162. st->codec->codec_id != CODEC_ID_SPEEX &&
  163. st->codec->codec_id != CODEC_ID_FLAC) {
  164. av_log(s, AV_LOG_ERROR, "Unsupported codec id in stream %d\n", i);
  165. return -1;
  166. }
  167. if (!st->codec->extradata || !st->codec->extradata_size) {
  168. av_log(s, AV_LOG_ERROR, "No extradata present\n");
  169. return -1;
  170. }
  171. oggstream = av_mallocz(sizeof(*oggstream));
  172. st->priv_data = oggstream;
  173. if (st->codec->codec_id == CODEC_ID_FLAC) {
  174. int err = ogg_build_flac_headers(st->codec, oggstream,
  175. st->codec->flags & CODEC_FLAG_BITEXACT);
  176. if (err) {
  177. av_log(s, AV_LOG_ERROR, "Error writing FLAC headers\n");
  178. av_freep(&st->priv_data);
  179. return err;
  180. }
  181. } else if (st->codec->codec_id == CODEC_ID_SPEEX) {
  182. int err = ogg_build_speex_headers(st->codec, oggstream,
  183. st->codec->flags & CODEC_FLAG_BITEXACT);
  184. if (err) {
  185. av_log(s, AV_LOG_ERROR, "Error writing Speex headers\n");
  186. av_freep(&st->priv_data);
  187. return err;
  188. }
  189. } else {
  190. if (ff_split_xiph_headers(st->codec->extradata, st->codec->extradata_size,
  191. st->codec->codec_id == CODEC_ID_VORBIS ? 30 : 42,
  192. oggstream->header, oggstream->header_len) < 0) {
  193. av_log(s, AV_LOG_ERROR, "Extradata corrupted\n");
  194. av_freep(&st->priv_data);
  195. return -1;
  196. }
  197. if (st->codec->codec_id == CODEC_ID_THEORA) {
  198. /** KFGSHIFT is the width of the less significant section of the granule position
  199. The less significant section is the frame count since the last keyframe */
  200. oggstream->kfgshift = ((oggstream->header[0][40]&3)<<3)|(oggstream->header[0][41]>>5);
  201. oggstream->vrev = oggstream->header[0][9];
  202. av_log(s, AV_LOG_DEBUG, "theora kfgshift %d, vrev %d\n",
  203. oggstream->kfgshift, oggstream->vrev);
  204. }
  205. }
  206. }
  207. for (i = 0; i < 3; i++) {
  208. for (j = 0; j < s->nb_streams; j++) {
  209. AVStream *st = s->streams[j];
  210. OGGStreamContext *oggstream = st->priv_data;
  211. if (oggstream && oggstream->header_len[i]) {
  212. ogg_write_page(s, oggstream->header[i], oggstream->header_len[i],
  213. 0, st->index, i ? 0 : 2); // bos
  214. }
  215. }
  216. }
  217. return 0;
  218. }
  219. static int ogg_write_packet(AVFormatContext *s, AVPacket *pkt)
  220. {
  221. AVStream *st = s->streams[pkt->stream_index];
  222. OGGStreamContext *oggstream = st->priv_data;
  223. uint8_t *ptr = pkt->data;
  224. int ret, size = pkt->size;
  225. int64_t granule;
  226. if (st->codec->codec_id == CODEC_ID_THEORA) {
  227. int64_t pts = oggstream->vrev < 1 ? pkt->pts : pkt->pts + pkt->duration;
  228. int pframe_count;
  229. if (pkt->flags & PKT_FLAG_KEY)
  230. oggstream->last_kf_pts = pts;
  231. pframe_count = pts - oggstream->last_kf_pts;
  232. // prevent frame count from overflow if key frame flag is not set
  233. if (pframe_count >= (1<<oggstream->kfgshift)) {
  234. oggstream->last_kf_pts += pframe_count;
  235. pframe_count = 0;
  236. }
  237. granule = (oggstream->last_kf_pts<<oggstream->kfgshift) | pframe_count;
  238. } else
  239. granule = pkt->pts + pkt->duration;
  240. oggstream->duration = granule;
  241. do {
  242. ret = ogg_write_page(s, ptr, size, granule, pkt->stream_index, ptr != pkt->data);
  243. ptr += ret; size -= ret;
  244. } while (size > 0 || ret == 255*255); // need to output a last nil page
  245. return 0;
  246. }
  247. static int ogg_compare_granule(AVFormatContext *s, AVPacket *next, AVPacket *pkt)
  248. {
  249. AVStream *st2 = s->streams[next->stream_index];
  250. AVStream *st = s->streams[pkt ->stream_index];
  251. int64_t next_granule = av_rescale_q(next->pts + next->duration,
  252. st2->time_base, AV_TIME_BASE_Q);
  253. int64_t cur_granule = av_rescale_q(pkt ->pts + pkt ->duration,
  254. st ->time_base, AV_TIME_BASE_Q);
  255. return next_granule > cur_granule;
  256. }
  257. static int ogg_interleave_per_granule(AVFormatContext *s, AVPacket *out, AVPacket *pkt, int flush)
  258. {
  259. AVPacketList *pktl;
  260. int stream_count = 0;
  261. int streams[MAX_STREAMS] = {0};
  262. int interleaved = 0;
  263. if (pkt) {
  264. ff_interleave_add_packet(s, pkt, ogg_compare_granule);
  265. }
  266. pktl = s->packet_buffer;
  267. while (pktl) {
  268. if (streams[pktl->pkt.stream_index] == 0)
  269. stream_count++;
  270. streams[pktl->pkt.stream_index]++;
  271. // need to buffer at least one packet to set eos flag
  272. if (streams[pktl->pkt.stream_index] == 2)
  273. interleaved++;
  274. pktl = pktl->next;
  275. }
  276. if ((s->nb_streams == stream_count && interleaved == stream_count) ||
  277. (flush && stream_count)) {
  278. pktl= s->packet_buffer;
  279. *out= pktl->pkt;
  280. s->packet_buffer = pktl->next;
  281. if (flush && streams[out->stream_index] == 1) {
  282. OGGStreamContext *ogg = s->streams[out->stream_index]->priv_data;
  283. ogg->eos = 1;
  284. }
  285. if(!s->packet_buffer)
  286. s->packet_buffer_end= NULL;
  287. if(s->streams[out->stream_index]->last_in_packet_buffer == pktl)
  288. s->streams[out->stream_index]->last_in_packet_buffer= NULL;
  289. av_freep(&pktl);
  290. return 1;
  291. } else {
  292. av_init_packet(out);
  293. return 0;
  294. }
  295. }
  296. static int ogg_write_trailer(AVFormatContext *s)
  297. {
  298. int i;
  299. for (i = 0; i < s->nb_streams; i++) {
  300. AVStream *st = s->streams[i];
  301. OGGStreamContext *oggstream = st->priv_data;
  302. if (st->codec->codec_id == CODEC_ID_FLAC ||
  303. st->codec->codec_id == CODEC_ID_SPEEX) {
  304. av_free(oggstream->header[0]);
  305. av_free(oggstream->header[1]);
  306. }
  307. av_freep(&st->priv_data);
  308. }
  309. return 0;
  310. }
  311. AVOutputFormat ogg_muxer = {
  312. "ogg",
  313. NULL_IF_CONFIG_SMALL("Ogg"),
  314. "application/ogg",
  315. "ogg,ogv,spx",
  316. 0,
  317. CODEC_ID_FLAC,
  318. CODEC_ID_THEORA,
  319. ogg_write_header,
  320. ogg_write_packet,
  321. ogg_write_trailer,
  322. .interleave_packet = ogg_interleave_per_granule,
  323. };