dpcm.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319
  1. /*
  2. * Assorted DPCM codecs
  3. * Copyright (c) 2003 The ffmpeg Project
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file: dpcm.c
  23. * Assorted DPCM (differential pulse code modulation) audio codecs
  24. * by Mike Melanson (melanson@pcisys.net)
  25. * Xan DPCM decoder by Mario Brito (mbrito@student.dei.uc.pt)
  26. * for more information on the specific data formats, visit:
  27. * http://www.pcisys.net/~melanson/codecs/simpleaudio.html
  28. * SOL DPCMs implemented by Konstantin Shishkov
  29. *
  30. * Note about using the Xan DPCM decoder: Xan DPCM is used in AVI files
  31. * found in the Wing Commander IV computer game. These AVI files contain
  32. * WAVEFORMAT headers which report the audio format as 0x01: raw PCM.
  33. * Clearly incorrect. To detect Xan DPCM, you will probably have to
  34. * special-case your AVI demuxer to use Xan DPCM if the file uses 'Xxan'
  35. * (Xan video) for its video codec. Alternately, such AVI files also contain
  36. * the fourcc 'Axan' in the 'auds' chunk of the AVI header.
  37. */
  38. #include "libavutil/intreadwrite.h"
  39. #include "avcodec.h"
  /**
   * Private decoder state shared by every DPCM variant in this file.
   */
  typedef struct DPCMContext {
      /* channel count, copied from the codec context at init time */
      int channels;

      /* RoQ delta lookup: entries 0..127 hold i*i, entries 128..255 hold
       * the negated squares (filled in by the init function) */
      short roq_square_array[256];

      /* running sample value per channel, carried across packets (SOL_DPCM) */
      long sample[2];

      /* delta table selected for the active SOL subcodec (SOL_DPCM) */
      const int *sol_table;
  } DPCMContext;
  /*
   * Sign-extend the low 16 bits of the integer lvalue x in place: when bit 15
   * is set, 0x10000 is subtracted so the value lands in -32768..-1.
   * The expansion is a complete statement (it carries its own ';'), so call
   * sites may be written with or without a trailing semicolon. Because it
   * expands to a bare `if`, do not place it directly before an `else`.
   */
  #define SE_16BIT(x) if ((x) & 0x8000) (x) -= 0x10000;
  /*
   * Interplay DPCM: maps each encoded byte (0..255) to the signed delta that
   * is added to the channel predictor.
   */
  static const int interplay_delta_table[256] = {
      /* 0x00 */      0,      1,      2,      3,      4,      5,      6,      7,
      /* 0x08 */      8,      9,     10,     11,     12,     13,     14,     15,
      /* 0x10 */     16,     17,     18,     19,     20,     21,     22,     23,
      /* 0x18 */     24,     25,     26,     27,     28,     29,     30,     31,
      /* 0x20 */     32,     33,     34,     35,     36,     37,     38,     39,
      /* 0x28 */     40,     41,     42,     43,     47,     51,     56,     61,
      /* 0x30 */     66,     72,     79,     86,     94,    102,    112,    122,
      /* 0x38 */    133,    145,    158,    173,    189,    206,    225,    245,
      /* 0x40 */    267,    292,    318,    348,    379,    414,    452,    493,
      /* 0x48 */    538,    587,    640,    699,    763,    832,    908,    991,
      /* 0x50 */   1081,   1180,   1288,   1405,   1534,   1673,   1826,   1993,
      /* 0x58 */   2175,   2373,   2590,   2826,   3084,   3365,   3672,   4008,
      /* 0x60 */   4373,   4772,   5208,   5683,   6202,   6767,   7385,   8059,
      /* 0x68 */   8794,   9597,  10472,  11428,  12471,  13609,  14851,  16206,
      /* 0x70 */  17685,  19298,  21060,  22981,  25078,  27367,  29864,  32589,
      /* 0x78 */ -29973, -26728, -23186, -19322, -15105, -10503,  -5481,     -1,
      /* 0x80 */      1,      1,   5481,  10503,  15105,  19322,  23186,  26728,
      /* 0x88 */  29973, -32589, -29864, -27367, -25078, -22981, -21060, -19298,
      /* 0x90 */ -17685, -16206, -14851, -13609, -12471, -11428, -10472,  -9597,
      /* 0x98 */  -8794,  -8059,  -7385,  -6767,  -6202,  -5683,  -5208,  -4772,
      /* 0xA0 */  -4373,  -4008,  -3672,  -3365,  -3084,  -2826,  -2590,  -2373,
      /* 0xA8 */  -2175,  -1993,  -1826,  -1673,  -1534,  -1405,  -1288,  -1180,
      /* 0xB0 */  -1081,   -991,   -908,   -832,   -763,   -699,   -640,   -587,
      /* 0xB8 */   -538,   -493,   -452,   -414,   -379,   -348,   -318,   -292,
      /* 0xC0 */   -267,   -245,   -225,   -206,   -189,   -173,   -158,   -145,
      /* 0xC8 */   -133,   -122,   -112,   -102,    -94,    -86,    -79,    -72,
      /* 0xD0 */    -66,    -61,    -56,    -51,    -47,    -43,    -42,    -41,
      /* 0xD8 */    -40,    -39,    -38,    -37,    -36,    -35,    -34,    -33,
      /* 0xE0 */    -32,    -31,    -30,    -29,    -28,    -27,    -26,    -25,
      /* 0xE8 */    -24,    -23,    -22,    -21,    -20,    -19,    -18,    -17,
      /* 0xF0 */    -16,    -15,    -14,    -13,    -12,    -11,    -10,     -9,
      /* 0xF8 */     -8,     -7,     -6,     -5,     -4,     -3,     -2,     -1
  };
  /*
   * 4-bit SOL DPCM delta table selected for codec_tag 1: indices 0..7 hold
   * the positive steps, indices 8..15 hold the same magnitudes negated in
   * mirrored order.
   */
  static const int sol_table_old[16] = {
        0,   1,   2,   3,   6,  10,  15,  21,
      -21, -15, -10,  -6,  -3,  -2,  -1,   0
  };
  /*
   * 4-bit SOL DPCM delta table selected for codec_tag 2: indices 0..7 hold
   * the positive steps, indices 8..15 hold the same magnitudes negated in
   * the same order.
   */
  static const int sol_table_new[16] = {
      0,   1,   2,   3,   6,  10,  15,  21,
      0,  -1,  -2,  -3,  -6, -10, -15, -21
  };
  /*
   * SOL DPCM delta magnitudes selected for codec_tag 3. The decoder indexes
   * this table with the low 7 bits of each input byte and uses bit 7 to
   * choose between adding and subtracting the magnitude.
   */
  static const int sol_table_16[128] = {
      /*   0 */ 0x000, 0x008, 0x010, 0x020, 0x030, 0x040, 0x050, 0x060,
      /*   8 */ 0x070, 0x080, 0x090, 0x0A0, 0x0B0, 0x0C0, 0x0D0, 0x0E0,
      /*  16 */ 0x0F0, 0x100, 0x110, 0x120, 0x130, 0x140, 0x150, 0x160,
      /*  24 */ 0x170, 0x180, 0x190, 0x1A0, 0x1B0, 0x1C0, 0x1D0, 0x1E0,
      /*  32 */ 0x1F0, 0x200, 0x208, 0x210, 0x218, 0x220, 0x228, 0x230,
      /*  40 */ 0x238, 0x240, 0x248, 0x250, 0x258, 0x260, 0x268, 0x270,
      /*  48 */ 0x278, 0x280, 0x288, 0x290, 0x298, 0x2A0, 0x2A8, 0x2B0,
      /*  56 */ 0x2B8, 0x2C0, 0x2C8, 0x2D0, 0x2D8, 0x2E0, 0x2E8, 0x2F0,
      /*  64 */ 0x2F8, 0x300, 0x308, 0x310, 0x318, 0x320, 0x328, 0x330,
      /*  72 */ 0x338, 0x340, 0x348, 0x350, 0x358, 0x360, 0x368, 0x370,
      /*  80 */ 0x378, 0x380, 0x388, 0x390, 0x398, 0x3A0, 0x3A8, 0x3B0,
      /*  88 */ 0x3B8, 0x3C0, 0x3C8, 0x3D0, 0x3D8, 0x3E0, 0x3E8, 0x3F0,
      /*  96 */ 0x3F8, 0x400, 0x440, 0x480, 0x4C0, 0x500, 0x540, 0x580,
      /* 104 */ 0x5C0, 0x600, 0x640, 0x680, 0x6C0, 0x700, 0x740, 0x780,
      /* 112 */ 0x7C0, 0x800, 0x900, 0xA00, 0xB00, 0xC00, 0xD00, 0xE00,
      /* 120 */ 0xF00, 0x1000, 0x1400, 0x1800, 0x1C00, 0x2000, 0x3000, 0x4000
  };
  102. static av_cold int dpcm_decode_init(AVCodecContext *avctx)
  103. {
  104. DPCMContext *s = avctx->priv_data;
  105. int i;
  106. short square;
  107. s->channels = avctx->channels;
  108. s->sample[0] = s->sample[1] = 0;
  109. switch(avctx->codec->id) {
  110. case CODEC_ID_ROQ_DPCM:
  111. /* initialize square table */
  112. for (i = 0; i < 128; i++) {
  113. square = i * i;
  114. s->roq_square_array[i] = square;
  115. s->roq_square_array[i + 128] = -square;
  116. }
  117. break;
  118. case CODEC_ID_SOL_DPCM:
  119. switch(avctx->codec_tag){
  120. case 1:
  121. s->sol_table=sol_table_old;
  122. s->sample[0] = s->sample[1] = 0x80;
  123. break;
  124. case 2:
  125. s->sol_table=sol_table_new;
  126. s->sample[0] = s->sample[1] = 0x80;
  127. break;
  128. case 3:
  129. s->sol_table=sol_table_16;
  130. break;
  131. default:
  132. av_log(avctx, AV_LOG_ERROR, "Unknown SOL subcodec\n");
  133. return -1;
  134. }
  135. break;
  136. default:
  137. break;
  138. }
  139. avctx->sample_fmt = SAMPLE_FMT_S16;
  140. return 0;
  141. }
  142. static int dpcm_decode_frame(AVCodecContext *avctx,
  143. void *data, int *data_size,
  144. const uint8_t *buf, int buf_size)
  145. {
  146. DPCMContext *s = avctx->priv_data;
  147. int in, out = 0;
  148. int predictor[2];
  149. int channel_number = 0;
  150. int stereo = s->channels - 1;
  151. short *output_samples = data;
  152. int shift[2];
  153. unsigned char byte;
  154. short diff;
  155. if (!buf_size)
  156. return 0;
  157. if (stereo && (buf_size & 1))
  158. buf_size--;
  159. // almost every DPCM variant expands one byte of data into two
  160. if(*data_size/2 < buf_size)
  161. return -1;
  162. switch(avctx->codec->id) {
  163. case CODEC_ID_ROQ_DPCM:
  164. if (s->channels == 1)
  165. predictor[0] = AV_RL16(&buf[6]);
  166. else {
  167. predictor[0] = buf[7] << 8;
  168. predictor[1] = buf[6] << 8;
  169. }
  170. SE_16BIT(predictor[0]);
  171. SE_16BIT(predictor[1]);
  172. /* decode the samples */
  173. for (in = 8, out = 0; in < buf_size; in++, out++) {
  174. predictor[channel_number] += s->roq_square_array[buf[in]];
  175. predictor[channel_number] = av_clip_int16(predictor[channel_number]);
  176. output_samples[out] = predictor[channel_number];
  177. /* toggle channel */
  178. channel_number ^= s->channels - 1;
  179. }
  180. break;
  181. case CODEC_ID_INTERPLAY_DPCM:
  182. in = 6; /* skip over the stream mask and stream length */
  183. predictor[0] = AV_RL16(&buf[in]);
  184. in += 2;
  185. SE_16BIT(predictor[0])
  186. output_samples[out++] = predictor[0];
  187. if (s->channels == 2) {
  188. predictor[1] = AV_RL16(&buf[in]);
  189. in += 2;
  190. SE_16BIT(predictor[1])
  191. output_samples[out++] = predictor[1];
  192. }
  193. while (in < buf_size) {
  194. predictor[channel_number] += interplay_delta_table[buf[in++]];
  195. predictor[channel_number] = av_clip_int16(predictor[channel_number]);
  196. output_samples[out++] = predictor[channel_number];
  197. /* toggle channel */
  198. channel_number ^= s->channels - 1;
  199. }
  200. break;
  201. case CODEC_ID_XAN_DPCM:
  202. in = 0;
  203. shift[0] = shift[1] = 4;
  204. predictor[0] = AV_RL16(&buf[in]);
  205. in += 2;
  206. SE_16BIT(predictor[0]);
  207. if (s->channels == 2) {
  208. predictor[1] = AV_RL16(&buf[in]);
  209. in += 2;
  210. SE_16BIT(predictor[1]);
  211. }
  212. while (in < buf_size) {
  213. byte = buf[in++];
  214. diff = (byte & 0xFC) << 8;
  215. if ((byte & 0x03) == 3)
  216. shift[channel_number]++;
  217. else
  218. shift[channel_number] -= (2 * (byte & 3));
  219. /* saturate the shifter to a lower limit of 0 */
  220. if (shift[channel_number] < 0)
  221. shift[channel_number] = 0;
  222. diff >>= shift[channel_number];
  223. predictor[channel_number] += diff;
  224. predictor[channel_number] = av_clip_int16(predictor[channel_number]);
  225. output_samples[out++] = predictor[channel_number];
  226. /* toggle channel */
  227. channel_number ^= s->channels - 1;
  228. }
  229. break;
  230. case CODEC_ID_SOL_DPCM:
  231. in = 0;
  232. if (avctx->codec_tag != 3) {
  233. if(*data_size/4 < buf_size)
  234. return -1;
  235. while (in < buf_size) {
  236. int n1, n2;
  237. n1 = (buf[in] >> 4) & 0xF;
  238. n2 = buf[in++] & 0xF;
  239. s->sample[0] += s->sol_table[n1];
  240. if (s->sample[0] < 0) s->sample[0] = 0;
  241. if (s->sample[0] > 255) s->sample[0] = 255;
  242. output_samples[out++] = (s->sample[0] - 128) << 8;
  243. s->sample[s->channels - 1] += s->sol_table[n2];
  244. if (s->sample[s->channels - 1] < 0) s->sample[s->channels - 1] = 0;
  245. if (s->sample[s->channels - 1] > 255) s->sample[s->channels - 1] = 255;
  246. output_samples[out++] = (s->sample[s->channels - 1] - 128) << 8;
  247. }
  248. } else {
  249. while (in < buf_size) {
  250. int n;
  251. n = buf[in++];
  252. if (n & 0x80) s->sample[channel_number] -= s->sol_table[n & 0x7F];
  253. else s->sample[channel_number] += s->sol_table[n & 0x7F];
  254. s->sample[channel_number] = av_clip_int16(s->sample[channel_number]);
  255. output_samples[out++] = s->sample[channel_number];
  256. /* toggle channel */
  257. channel_number ^= s->channels - 1;
  258. }
  259. }
  260. break;
  261. }
  262. *data_size = out * sizeof(short);
  263. return buf_size;
  264. }
  265. #define DPCM_DECODER(id, name, long_name_) \
  266. AVCodec name ## _decoder = { \
  267. #name, \
  268. CODEC_TYPE_AUDIO, \
  269. id, \
  270. sizeof(DPCMContext), \
  271. dpcm_decode_init, \
  272. NULL, \
  273. NULL, \
  274. dpcm_decode_frame, \
  275. .long_name = NULL_IF_CONFIG_SMALL(long_name_), \
  276. };
  277. DPCM_DECODER(CODEC_ID_INTERPLAY_DPCM, interplay_dpcm, "DPCM Interplay");
  278. DPCM_DECODER(CODEC_ID_ROQ_DPCM, roq_dpcm, "DPCM id RoQ");
  279. DPCM_DECODER(CODEC_ID_SOL_DPCM, sol_dpcm, "DPCM Sol");
  280. DPCM_DECODER(CODEC_ID_XAN_DPCM, xan_dpcm, "DPCM Xan");