yuv2rgb.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926
  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include "libavutil/cpu.h"
  29. #include "libavutil/bswap.h"
  30. #include "config.h"
  31. #include "rgb2rgb.h"
  32. #include "swscale.h"
  33. #include "swscale_internal.h"
  34. #include "libavutil/pixdesc.h"
/*
 * Ordered-dither threshold matrices. They are only declared here; the
 * definitions live in another translation unit. The dithering converters
 * below select a row with the (masked) line number and then index it by
 * pixel column.
 */
extern const uint8_t dither_2x2_4[2][8];
extern const uint8_t dither_2x2_8[2][8];
extern const uint8_t dither_4x4_16[4][8];
extern const uint8_t dither_8x8_32[8][8];
extern const uint8_t dither_8x8_73[8][8];
extern const uint8_t dither_8x8_220[8][8];
/*
 * YUV->RGB conversion coefficients, one row of four values per colorspace.
 * sws_getCoefficients() returns a row selected by colorspace index (0..7).
 * ff_yuv2rgb_c_init_tables() interprets a 4-entry table of this shape as
 * { V->R, U->B, U->G, V->G } and negates the two green terms itself.
 */
const int32_t ff_yuv2rgb_coeffs[8][4] = {
    { 117504, 138453, 13954, 34903 }, /* no sequence_display_extension */
    { 117504, 138453, 13954, 34903 }, /* ITU-R Rec. 709 (1990) */
    { 104597, 132201, 25675, 53279 }, /* unspecified */
    { 104597, 132201, 25675, 53279 }, /* reserved */
    { 104448, 132798, 24759, 53109 }, /* FCC */
    { 104597, 132201, 25675, 53279 }, /* ITU-R Rec. 624-4 System B, G */
    { 104597, 132201, 25675, 53279 }, /* SMPTE 170M */
    { 117579, 136230, 16907, 35559 }  /* SMPTE 240M (1987) */
};
  51. const int *sws_getCoefficients(int colorspace)
  52. {
  53. if (colorspace > 7 || colorspace < 0)
  54. colorspace = SWS_CS_DEFAULT;
  55. return ff_yuv2rgb_coeffs[colorspace];
  56. }
  57. #define LOADCHROMA(i) \
  58. U = pu[i]; \
  59. V = pv[i]; \
  60. r = (void *)c->table_rV[V+YUVRGB_TABLE_HEADROOM]; \
  61. g = (void *)(c->table_gU[U+YUVRGB_TABLE_HEADROOM] + c->table_gV[V+YUVRGB_TABLE_HEADROOM]); \
  62. b = (void *)c->table_bU[U+YUVRGB_TABLE_HEADROOM];
  63. #define PUTRGB(dst, src, i) \
  64. Y = src[2 * i]; \
  65. dst[2 * i] = r[Y] + g[Y] + b[Y]; \
  66. Y = src[2 * i + 1]; \
  67. dst[2 * i + 1] = r[Y] + g[Y] + b[Y];
  68. #define PUTRGB24(dst, src, i) \
  69. Y = src[2 * i]; \
  70. dst[6 * i + 0] = r[Y]; \
  71. dst[6 * i + 1] = g[Y]; \
  72. dst[6 * i + 2] = b[Y]; \
  73. Y = src[2 * i + 1]; \
  74. dst[6 * i + 3] = r[Y]; \
  75. dst[6 * i + 4] = g[Y]; \
  76. dst[6 * i + 5] = b[Y];
  77. #define PUTBGR24(dst, src, i) \
  78. Y = src[2 * i]; \
  79. dst[6 * i + 0] = b[Y]; \
  80. dst[6 * i + 1] = g[Y]; \
  81. dst[6 * i + 2] = r[Y]; \
  82. Y = src[2 * i + 1]; \
  83. dst[6 * i + 3] = b[Y]; \
  84. dst[6 * i + 4] = g[Y]; \
  85. dst[6 * i + 5] = r[Y];
  86. #define PUTRGBA(dst, ysrc, asrc, i, s) \
  87. Y = ysrc[2 * i]; \
  88. dst[2 * i] = r[Y] + g[Y] + b[Y] + (asrc[2 * i] << s); \
  89. Y = ysrc[2 * i + 1]; \
  90. dst[2 * i + 1] = r[Y] + g[Y] + b[Y] + (asrc[2 * i + 1] << s);
  91. #define PUTRGB48(dst, src, i) \
  92. Y = src[ 2 * i]; \
  93. dst[12 * i + 0] = dst[12 * i + 1] = r[Y]; \
  94. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  95. dst[12 * i + 4] = dst[12 * i + 5] = b[Y]; \
  96. Y = src[ 2 * i + 1]; \
  97. dst[12 * i + 6] = dst[12 * i + 7] = r[Y]; \
  98. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  99. dst[12 * i + 10] = dst[12 * i + 11] = b[Y];
  100. #define PUTBGR48(dst, src, i) \
  101. Y = src[2 * i]; \
  102. dst[12 * i + 0] = dst[12 * i + 1] = b[Y]; \
  103. dst[12 * i + 2] = dst[12 * i + 3] = g[Y]; \
  104. dst[12 * i + 4] = dst[12 * i + 5] = r[Y]; \
  105. Y = src[2 * i + 1]; \
  106. dst[12 * i + 6] = dst[12 * i + 7] = b[Y]; \
  107. dst[12 * i + 8] = dst[12 * i + 9] = g[Y]; \
  108. dst[12 * i + 10] = dst[12 * i + 11] = r[Y];
/*
 * YUV2RGBFUNC opens the definition of a static slice converter called
 * func_name whose output pointers are of type dst_type. It deliberately
 * leaves three scopes open (function, row loop, 8-pixel loop); the code
 * written after the invocation becomes the body of the 8-pixel loop, and
 * ENDYUV2RGBLINE / ENDYUV2RGBFUNC close the scopes again.
 *
 * Inside the generated function:
 *  - rows are processed in pairs (y advances by 2); dst_1/py_1 address the
 *    first row of the pair and dst_2/py_2 the second;
 *  - pu/pv address chroma row y >> 1, shared by both rows;
 *  - when alpha is non-zero, pa_1/pa_2 address the two rows of src[3];
 *  - h_size counts groups of 8 output pixels (dstW >> 3);
 *  - when alpha is zero and the source is PIX_FMT_YUV422P, the chroma
 *    strides in the caller's srcStride[] array are doubled in place on
 *    every call.
 */
#define YUV2RGBFUNC(func_name, dst_type, alpha)                             \
    static int func_name(SwsContext *c, const uint8_t *src[],               \
                         int srcStride[], int srcSliceY, int srcSliceH,     \
                         uint8_t *dst[], int dstStride[])                   \
    {                                                                       \
        int y;                                                              \
                                                                            \
        if (!alpha && c->srcFormat == PIX_FMT_YUV422P) {                    \
            srcStride[1] *= 2;                                              \
            srcStride[2] *= 2;                                              \
        }                                                                   \
        for (y = 0; y < srcSliceH; y += 2) {                                \
            dst_type *dst_1 =                                               \
                (dst_type *)(dst[0] + (y + srcSliceY)     * dstStride[0]);  \
            dst_type *dst_2 =                                               \
                (dst_type *)(dst[0] + (y + srcSliceY + 1) * dstStride[0]);  \
            dst_type av_unused *r, *g, *b;                                  \
            const uint8_t *py_1 = src[0] + y * srcStride[0];                \
            const uint8_t *py_2 = py_1 + srcStride[0];                      \
            const uint8_t *pu = src[1] + (y >> 1) * srcStride[1];           \
            const uint8_t *pv = src[2] + (y >> 1) * srcStride[2];           \
            const uint8_t av_unused *pa_1, *pa_2;                           \
            unsigned int h_size = c->dstW >> 3;                             \
            if (alpha) {                                                    \
                pa_1 = src[3] + y * srcStride[3];                           \
                pa_2 = pa_1 + srcStride[3];                                 \
            }                                                               \
            while (h_size--) {                                              \
                int av_unused U, V, Y;                                      \

/*
 * ENDYUV2RGBLINE advances the chroma, luma and destination pointers
 * (each step right-shifted by ss; dst_delta is in units of dst_type),
 * closes the scope that is currently open and opens a tail block that runs
 * only when dstW has bit (4 >> ss) set. Alpha pointers are not advanced
 * here; converters that use them do so before invoking this macro.
 */
#define ENDYUV2RGBLINE(dst_delta, ss)               \
                pu    += 4 >> ss;                   \
                pv    += 4 >> ss;                   \
                py_1  += 8 >> ss;                   \
                py_2  += 8 >> ss;                   \
                dst_1 += dst_delta >> ss;           \
                dst_2 += dst_delta >> ss;           \
            }                                       \
            if (c->dstW & (4 >> ss)) {              \
                int av_unused Y, U, V;              \

/*
 * ENDYUV2RGBFUNC closes the tail block and the row loop, then returns the
 * number of source lines handled (srcSliceH) and closes the function.
 */
#define ENDYUV2RGBFUNC()                            \
            }                                       \
        }                                           \
        return srcSliceH;                           \
    }

/*
 * CLOSEYUV2RGBFUNC finishes a converter whose tail block is empty: only
 * whole groups of 8 pixels are written.
 */
#define CLOSEYUV2RGBFUNC(dst_delta)                 \
    ENDYUV2RGBLINE(dst_delta, 0)                    \
    ENDYUV2RGBFUNC()
/*
 * Slice converter producing 6 bytes per pixel in R, G, B order (see
 * PUTRGB48: every 8-bit component is written to two adjacent bytes).
 */
YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
    /* main loop body: 8 pixels on each of the two rows, one chroma sample
     * per horizontal pixel pair, shared by both rows */
    LOADCHROMA(0);
    PUTRGB48(dst_1, py_1, 0);
    PUTRGB48(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB48(dst_2, py_2, 1);
    PUTRGB48(dst_1, py_1, 1);

    LOADCHROMA(2);
    PUTRGB48(dst_1, py_1, 2);
    PUTRGB48(dst_2, py_2, 2);

    LOADCHROMA(3);
    PUTRGB48(dst_2, py_2, 3);
    PUTRGB48(dst_1, py_1, 3);
ENDYUV2RGBLINE(48, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTRGB48(dst_1, py_1, 0);
    PUTRGB48(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB48(dst_2, py_2, 1);
    PUTRGB48(dst_1, py_1, 1);
ENDYUV2RGBLINE(48, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTRGB48(dst_1, py_1, 0);
    PUTRGB48(dst_2, py_2, 0);
ENDYUV2RGBFUNC()
/*
 * Slice converter producing 6 bytes per pixel in B, G, R order (see
 * PUTBGR48: every 8-bit component is written to two adjacent bytes).
 * Same structure as yuv2rgb_c_48 with the component order reversed.
 */
YUV2RGBFUNC(yuv2rgb_c_bgr48, uint8_t, 0)
    /* main loop body: 8 pixels on each of the two rows */
    LOADCHROMA(0);
    PUTBGR48(dst_1, py_1, 0);
    PUTBGR48(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTBGR48(dst_2, py_2, 1);
    PUTBGR48(dst_1, py_1, 1);

    LOADCHROMA(2);
    PUTBGR48(dst_1, py_1, 2);
    PUTBGR48(dst_2, py_2, 2);

    LOADCHROMA(3);
    PUTBGR48(dst_2, py_2, 3);
    PUTBGR48(dst_1, py_1, 3);
ENDYUV2RGBLINE(48, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTBGR48(dst_1, py_1, 0);
    PUTBGR48(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTBGR48(dst_2, py_2, 1);
    PUTBGR48(dst_1, py_1, 1);
ENDYUV2RGBLINE(48, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTBGR48(dst_1, py_1, 0);
    PUTBGR48(dst_2, py_2, 0);
ENDYUV2RGBFUNC()
/*
 * Slice converter writing one uint32_t per pixel; each pixel is the sum of
 * the three table entries selected by its luma sample (see PUTRGB). No
 * alpha plane is read.
 */
YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
    /* main loop body: 8 pixels on each of the two rows */
    LOADCHROMA(0);
    PUTRGB(dst_1, py_1, 0);
    PUTRGB(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB(dst_2, py_2, 1);
    PUTRGB(dst_1, py_1, 1);

    LOADCHROMA(2);
    PUTRGB(dst_1, py_1, 2);
    PUTRGB(dst_2, py_2, 2);

    LOADCHROMA(3);
    PUTRGB(dst_2, py_2, 3);
    PUTRGB(dst_1, py_1, 3);
ENDYUV2RGBLINE(8, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTRGB(dst_1, py_1, 0);
    PUTRGB(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB(dst_2, py_2, 1);
    PUTRGB(dst_1, py_1, 1);
ENDYUV2RGBLINE(8, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTRGB(dst_1, py_1, 0);
    PUTRGB(dst_2, py_2, 0);
ENDYUV2RGBFUNC()
  231. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  232. LOADCHROMA(0);
  233. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  234. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  235. LOADCHROMA(1);
  236. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  237. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  238. LOADCHROMA(2);
  239. PUTRGBA(dst_1, py_1, pa_1, 2, 24);
  240. PUTRGBA(dst_2, py_2, pa_2, 2, 24);
  241. LOADCHROMA(3);
  242. PUTRGBA(dst_2, py_2, pa_1, 3, 24);
  243. PUTRGBA(dst_1, py_1, pa_2, 3, 24);
  244. pa_1 += 8; \
  245. pa_2 += 8; \
  246. ENDYUV2RGBLINE(8, 0)
  247. LOADCHROMA(0);
  248. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  249. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  250. LOADCHROMA(1);
  251. PUTRGBA(dst_2, py_2, pa_1, 1, 24);
  252. PUTRGBA(dst_1, py_1, pa_2, 1, 24);
  253. pa_1 += 4; \
  254. pa_2 += 4; \
  255. ENDYUV2RGBLINE(8, 1)
  256. LOADCHROMA(0);
  257. PUTRGBA(dst_1, py_1, pa_1, 0, 24);
  258. PUTRGBA(dst_2, py_2, pa_2, 0, 24);
  259. ENDYUV2RGBFUNC()
/*
 * Slice converter writing one uint32_t per pixel with the source alpha
 * sample added unshifted, i.e. in bits 0..7 (PUTRGBA shift of 0).
 * dst_1/py_1 pair with alpha row pa_1, dst_2/py_2 with pa_2.
 */
YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
    /* main loop body: 8 pixels on each of the two rows */
    LOADCHROMA(0);
    PUTRGBA(dst_1, py_1, pa_1, 0, 0);
    PUTRGBA(dst_2, py_2, pa_2, 0, 0);

    LOADCHROMA(1);
    PUTRGBA(dst_2, py_2, pa_2, 1, 0);
    PUTRGBA(dst_1, py_1, pa_1, 1, 0);

    LOADCHROMA(2);
    PUTRGBA(dst_1, py_1, pa_1, 2, 0);
    PUTRGBA(dst_2, py_2, pa_2, 2, 0);

    LOADCHROMA(3);
    PUTRGBA(dst_2, py_2, pa_2, 3, 0);
    PUTRGBA(dst_1, py_1, pa_1, 3, 0);
    /* alpha pointers are advanced here; ENDYUV2RGBLINE does not touch them */
    pa_1 += 8; \
    pa_2 += 8; \
ENDYUV2RGBLINE(8, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTRGBA(dst_1, py_1, pa_1, 0, 0);
    PUTRGBA(dst_2, py_2, pa_2, 0, 0);

    LOADCHROMA(1);
    PUTRGBA(dst_2, py_2, pa_2, 1, 0);
    PUTRGBA(dst_1, py_1, pa_1, 1, 0);
    pa_1 += 4; \
    pa_2 += 4; \
ENDYUV2RGBLINE(8, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTRGBA(dst_1, py_1, pa_1, 0, 0);
    PUTRGBA(dst_2, py_2, pa_2, 0, 0);
ENDYUV2RGBFUNC()
/*
 * Slice converter producing 3 bytes per pixel in R, G, B order.
 */
YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
    /* main loop body: 8 pixels (24 bytes) on each of the two rows */
    LOADCHROMA(0);
    PUTRGB24(dst_1, py_1, 0);
    PUTRGB24(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB24(dst_2, py_2, 1);
    PUTRGB24(dst_1, py_1, 1);

    LOADCHROMA(2);
    PUTRGB24(dst_1, py_1, 2);
    PUTRGB24(dst_2, py_2, 2);

    LOADCHROMA(3);
    PUTRGB24(dst_2, py_2, 3);
    PUTRGB24(dst_1, py_1, 3);
ENDYUV2RGBLINE(24, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTRGB24(dst_1, py_1, 0);
    PUTRGB24(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTRGB24(dst_2, py_2, 1);
    PUTRGB24(dst_1, py_1, 1);
ENDYUV2RGBLINE(24, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTRGB24(dst_1, py_1, 0);
    PUTRGB24(dst_2, py_2, 0);
ENDYUV2RGBFUNC()
/*
 * Slice converter producing 3 bytes per pixel in B, G, R order.
 * Only trivial modifications from yuv2rgb_c_24_rgb: PUTBGR24 replaces
 * PUTRGB24.
 */
YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
    /* main loop body: 8 pixels (24 bytes) on each of the two rows */
    LOADCHROMA(0);
    PUTBGR24(dst_1, py_1, 0);
    PUTBGR24(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTBGR24(dst_2, py_2, 1);
    PUTBGR24(dst_1, py_1, 1);

    LOADCHROMA(2);
    PUTBGR24(dst_1, py_1, 2);
    PUTBGR24(dst_2, py_2, 2);

    LOADCHROMA(3);
    PUTBGR24(dst_2, py_2, 3);
    PUTBGR24(dst_1, py_1, 3);
ENDYUV2RGBLINE(24, 0)
    /* tail: 4 more pixels per row when (dstW & 4) is set */
    LOADCHROMA(0);
    PUTBGR24(dst_1, py_1, 0);
    PUTBGR24(dst_2, py_2, 0);

    LOADCHROMA(1);
    PUTBGR24(dst_2, py_2, 1);
    PUTBGR24(dst_1, py_1, 1);
ENDYUV2RGBLINE(24, 1)
    /* tail: 2 more pixels per row when (dstW & 2) is set */
    LOADCHROMA(0);
    PUTBGR24(dst_1, py_1, 0);
    PUTBGR24(dst_2, py_2, 0);
ENDYUV2RGBFUNC()
/*
 * Slice converter writing one uint16_t per pixel with ordered dithering:
 * a per-position dither value is added to the luma index before each table
 * lookup. Red uses d16, green uses e16 and blue uses f16. Only whole groups
 * of 8 pixels are written (CLOSEYUV2RGBFUNC).
 *
 * The last PUTRGB16 argument is the column offset into the dither rows; the
 * second row of each pair passes an extra + 8, which steps past the end of
 * the 8-entry row that was selected.
 * NOTE(review): y is always even here, so f16 starts at row 1 of
 * dither_2x2_8 and f16[8 + ...] reads beyond the [2][8] extent declared in
 * this file -- confirm against the table definition.
 */
YUV2RGBFUNC(yuv2rgb_c_16_ordered_dither, uint16_t, 0)
    const uint8_t *d16 = dither_2x2_8[y & 1];
    const uint8_t *e16 = dither_2x2_4[y & 1];
    const uint8_t *f16 = dither_2x2_8[(y & 1)^1];

#define PUTRGB16(dst, src, i, o)                    \
    Y              = src[2 * i];                    \
    dst[2 * i]     = r[Y + d16[0 + o]] +            \
                     g[Y + e16[0 + o]] +            \
                     b[Y + f16[0 + o]];             \
    Y              = src[2 * i + 1];                \
    dst[2 * i + 1] = r[Y + d16[1 + o]] +            \
                     g[Y + e16[1 + o]] +            \
                     b[Y + f16[1 + o]];
    LOADCHROMA(0);
    PUTRGB16(dst_1, py_1, 0, 0);
    PUTRGB16(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB16(dst_2, py_2, 1, 2 + 8);
    PUTRGB16(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB16(dst_1, py_1, 2, 4);
    PUTRGB16(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB16(dst_2, py_2, 3, 6 + 8);
    PUTRGB16(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(8)
/*
 * Slice converter writing one uint16_t per pixel with ordered dithering.
 * Red and green both read d16, but at swapped neighbouring columns; blue
 * reads e16. Only whole groups of 8 pixels are written (CLOSEYUV2RGBFUNC).
 *
 * The last PUTRGB15 argument is the column offset into the dither rows; the
 * second row of each pair passes an extra + 8.
 * NOTE(review): y is always even here, so e16 starts at row 1 of
 * dither_2x2_8 and e16[8 + ...] reads beyond the [2][8] extent declared in
 * this file -- confirm against the table definition.
 */
YUV2RGBFUNC(yuv2rgb_c_15_ordered_dither, uint16_t, 0)
    const uint8_t *d16 = dither_2x2_8[y & 1];
    const uint8_t *e16 = dither_2x2_8[(y & 1)^1];

#define PUTRGB15(dst, src, i, o)                    \
    Y              = src[2 * i];                    \
    dst[2 * i]     = r[Y + d16[0 + o]] +            \
                     g[Y + d16[1 + o]] +            \
                     b[Y + e16[0 + o]];             \
    Y              = src[2 * i + 1];                \
    dst[2 * i + 1] = r[Y + d16[1 + o]] +            \
                     g[Y + d16[0 + o]] +            \
                     b[Y + e16[1 + o]];
    LOADCHROMA(0);
    PUTRGB15(dst_1, py_1, 0, 0);
    PUTRGB15(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB15(dst_2, py_2, 1, 2 + 8);
    PUTRGB15(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB15(dst_1, py_1, 2, 4);
    PUTRGB15(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB15(dst_2, py_2, 3, 6 + 8);
    PUTRGB15(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(8)
/*
 * Slice converter writing one uint16_t per pixel with ordered dithering;
 * all three components use the same dither value from dither_4x4_16.
 * Only whole groups of 8 pixels are written (CLOSEYUV2RGBFUNC).
 *
 * The last PUTRGB12 argument is the column offset into the dither row; the
 * second row of each pair passes an extra + 8, i.e. it reads the table row
 * that follows d16 in memory.
 */
// r, g, b, dst_1, dst_2
YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
    const uint8_t *d16 = dither_4x4_16[y & 3];

#define PUTRGB12(dst, src, i, o)                    \
    Y              = src[2 * i];                    \
    dst[2 * i]     = r[Y + d16[0 + o]] +            \
                     g[Y + d16[0 + o]] +            \
                     b[Y + d16[0 + o]];             \
    Y              = src[2 * i + 1];                \
    dst[2 * i + 1] = r[Y + d16[1 + o]] +            \
                     g[Y + d16[1 + o]] +            \
                     b[Y + d16[1 + o]];
    LOADCHROMA(0);
    PUTRGB12(dst_1, py_1, 0, 0);
    PUTRGB12(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB12(dst_2, py_2, 1, 2 + 8);
    PUTRGB12(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB12(dst_1, py_1, 2, 4);
    PUTRGB12(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB12(dst_2, py_2, 3, 6 + 8);
    PUTRGB12(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(8)
/*
 * Slice converter writing one byte per pixel with ordered dithering.
 * Red and green use the dither_8x8_32 row, blue uses the dither_8x8_73 row
 * (the local is named d64). Only whole groups of 8 pixels are written
 * (CLOSEYUV2RGBFUNC).
 *
 * The last PUTRGB8 argument is the column offset into the dither rows; the
 * second row of each pair passes an extra + 8, i.e. it reads the table row
 * that follows in memory.
 */
// r, g, b, dst_1, dst_2
YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
    const uint8_t *d32 = dither_8x8_32[y & 7];
    const uint8_t *d64 = dither_8x8_73[y & 7];

#define PUTRGB8(dst, src, i, o)                     \
    Y              = src[2 * i];                    \
    dst[2 * i]     = r[Y + d32[0 + o]] +            \
                     g[Y + d32[0 + o]] +            \
                     b[Y + d64[0 + o]];             \
    Y              = src[2 * i + 1];                \
    dst[2 * i + 1] = r[Y + d32[1 + o]] +            \
                     g[Y + d32[1 + o]] +            \
                     b[Y + d64[1 + o]];
    LOADCHROMA(0);
    PUTRGB8(dst_1, py_1, 0, 0);
    PUTRGB8(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB8(dst_2, py_2, 1, 2 + 8);
    PUTRGB8(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB8(dst_1, py_1, 2, 4);
    PUTRGB8(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB8(dst_2, py_2, 3, 6 + 8);
    PUTRGB8(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(8)
/*
 * Slice converter packing two dithered pixels into each output byte: the
 * first pixel of a pair goes into the low bits and the second is shifted
 * left by 4 (see PUTRGB4D). Red and blue use the dither_8x8_220 row, green
 * uses the dither_8x8_73 row. Eight pixels advance the destination by 4
 * bytes; only whole groups of 8 pixels are written (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
    const uint8_t * d64 = dither_8x8_73[y & 7];
    const uint8_t *d128 = dither_8x8_220[y & 7];
    int acc;

#define PUTRGB4D(dst, src, i, o)                    \
    Y      = src[2 * i];                            \
    acc    = r[Y + d128[0 + o]] +                   \
             g[Y +  d64[0 + o]] +                   \
             b[Y + d128[0 + o]];                    \
    Y      = src[2 * i + 1];                        \
    acc   |= (r[Y + d128[1 + o]] +                  \
              g[Y +  d64[1 + o]] +                  \
              b[Y + d128[1 + o]]) << 4;             \
    dst[i] = acc;

    LOADCHROMA(0);
    PUTRGB4D(dst_1, py_1, 0, 0);
    PUTRGB4D(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB4D(dst_2, py_2, 1, 2 + 8);
    PUTRGB4D(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB4D(dst_1, py_1, 2, 4);
    PUTRGB4D(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB4D(dst_2, py_2, 3, 6 + 8);
    PUTRGB4D(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(4)
/*
 * Slice converter writing one byte per pixel, using the same dither rows as
 * yuv2rgb_c_4_ordered_dither (dither_8x8_220 for red and blue,
 * dither_8x8_73 for green) but without packing two pixels per byte.
 * Only whole groups of 8 pixels are written (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
    const uint8_t *d64  = dither_8x8_73[y & 7];
    const uint8_t *d128 = dither_8x8_220[y & 7];

#define PUTRGB4DB(dst, src, i, o)                   \
    Y              = src[2 * i];                    \
    dst[2 * i]     = r[Y + d128[0 + o]] +           \
                     g[Y +  d64[0 + o]] +           \
                     b[Y + d128[0 + o]];            \
    Y              = src[2 * i + 1];                \
    dst[2 * i + 1] = r[Y + d128[1 + o]] +           \
                     g[Y +  d64[1 + o]] +           \
                     b[Y + d128[1 + o]];

    LOADCHROMA(0);
    PUTRGB4DB(dst_1, py_1, 0, 0);
    PUTRGB4DB(dst_2, py_2, 0, 0 + 8);

    LOADCHROMA(1);
    PUTRGB4DB(dst_2, py_2, 1, 2 + 8);
    PUTRGB4DB(dst_1, py_1, 1, 2);

    LOADCHROMA(2);
    PUTRGB4DB(dst_1, py_1, 2, 4);
    PUTRGB4DB(dst_2, py_2, 2, 4 + 8);

    LOADCHROMA(3);
    PUTRGB4DB(dst_2, py_2, 3, 6 + 8);
    PUTRGB4DB(dst_1, py_1, 3, 6);
CLOSEYUV2RGBFUNC(8)
/*
 * Slice converter producing one output byte per 8 pixels. The chroma planes
 * are not read: g is fixed to the green tables at index 128, and only the
 * dithered luma lookup contributes. Each PUTRGB1 step doubles the
 * accumulator (shifting earlier pixels left) and adds the table value for
 * the next pixel, so the first pixel ends up in the highest position.
 * Only whole groups of 8 pixels are written (CLOSEYUV2RGBFUNC).
 */
YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
    const uint8_t *d128 = dither_8x8_220[y & 7];
    char out_1 = 0, out_2 = 0;
    g = c->table_gU[128 + YUVRGB_TABLE_HEADROOM] + c->table_gV[128 + YUVRGB_TABLE_HEADROOM];

#define PUTRGB1(out, src, i, o)                     \
    Y    = src[2 * i];                              \
    out += out + g[Y + d128[0 + o]];                \
    Y    = src[2 * i + 1];                          \
    out += out + g[Y + d128[1 + o]];

    PUTRGB1(out_1, py_1, 0, 0);
    PUTRGB1(out_2, py_2, 0, 0 + 8);

    PUTRGB1(out_2, py_2, 1, 2 + 8);
    PUTRGB1(out_1, py_1, 1, 2);

    PUTRGB1(out_1, py_1, 2, 4);
    PUTRGB1(out_2, py_2, 2, 4 + 8);

    PUTRGB1(out_2, py_2, 3, 6 + 8);
    PUTRGB1(out_1, py_1, 3, 6);

    /* one finished byte per row for these 8 pixels */
    dst_1[0] = out_1;
    dst_2[0] = out_2;
CLOSEYUV2RGBFUNC(1)
  514. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  515. {
  516. SwsFunc t = NULL;
  517. if (HAVE_MMX)
  518. t = ff_yuv2rgb_init_mmx(c);
  519. else if (HAVE_VIS)
  520. t = ff_yuv2rgb_init_vis(c);
  521. else if (HAVE_ALTIVEC)
  522. t = ff_yuv2rgb_init_altivec(c);
  523. else if (ARCH_BFIN)
  524. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  525. if (t)
  526. return t;
  527. av_log(c, AV_LOG_WARNING,
  528. "No accelerated colorspace conversion found from %s to %s.\n",
  529. av_get_pix_fmt_name(c->srcFormat), av_get_pix_fmt_name(c->dstFormat));
  530. switch (c->dstFormat) {
  531. case PIX_FMT_BGR48BE:
  532. case PIX_FMT_BGR48LE:
  533. return yuv2rgb_c_bgr48;
  534. case PIX_FMT_RGB48BE:
  535. case PIX_FMT_RGB48LE:
  536. return yuv2rgb_c_48;
  537. case PIX_FMT_ARGB:
  538. case PIX_FMT_ABGR:
  539. if (CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat))
  540. return yuva2argb_c;
  541. case PIX_FMT_RGBA:
  542. case PIX_FMT_BGRA:
  543. return (CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat)) ? yuva2rgba_c : yuv2rgb_c_32;
  544. case PIX_FMT_RGB24:
  545. return yuv2rgb_c_24_rgb;
  546. case PIX_FMT_BGR24:
  547. return yuv2rgb_c_24_bgr;
  548. case PIX_FMT_RGB565:
  549. case PIX_FMT_BGR565:
  550. return yuv2rgb_c_16_ordered_dither;
  551. case PIX_FMT_RGB555:
  552. case PIX_FMT_BGR555:
  553. return yuv2rgb_c_15_ordered_dither;
  554. case PIX_FMT_RGB444:
  555. case PIX_FMT_BGR444:
  556. return yuv2rgb_c_12_ordered_dither;
  557. case PIX_FMT_RGB8:
  558. case PIX_FMT_BGR8:
  559. return yuv2rgb_c_8_ordered_dither;
  560. case PIX_FMT_RGB4:
  561. case PIX_FMT_BGR4:
  562. return yuv2rgb_c_4_ordered_dither;
  563. case PIX_FMT_RGB4_BYTE:
  564. case PIX_FMT_BGR4_BYTE:
  565. return yuv2rgb_c_4b_ordered_dither;
  566. case PIX_FMT_MONOBLACK:
  567. return yuv2rgb_c_1_ordered_dither;
  568. }
  569. return NULL;
  570. }
  571. static void fill_table(uint8_t* table[256 + 2*YUVRGB_TABLE_HEADROOM], const int elemsize,
  572. const int inc, void *y_tab)
  573. {
  574. int i;
  575. uint8_t *y_table = y_tab;
  576. y_table -= elemsize * (inc >> 9);
  577. for (i = 0; i < 256 + 2*YUVRGB_TABLE_HEADROOM; i++) {
  578. int64_t cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
  579. table[i] = y_table + elemsize * (cb >> 16);
  580. }
  581. }
  582. static void fill_gv_table(int table[256 + 2*YUVRGB_TABLE_HEADROOM], const int elemsize, const int inc)
  583. {
  584. int i;
  585. int off = -(inc >> 9);
  586. for (i = 0; i < 256 + 2*YUVRGB_TABLE_HEADROOM; i++) {
  587. int64_t cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
  588. table[i] = elemsize * (off + (cb >> 16));
  589. }
  590. }
  591. static uint16_t roundToInt16(int64_t f)
  592. {
  593. int r = (f + (1 << 15)) >> 16;
  594. if (r < -0x7FFF)
  595. return 0x8000;
  596. else if (r > 0x7FFF)
  597. return 0x7FFF;
  598. else
  599. return r;
  600. }
  601. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
  602. int fullRange, int brightness,
  603. int contrast, int saturation)
  604. {
  605. const int isRgb = c->dstFormat == PIX_FMT_RGB32 ||
  606. c->dstFormat == PIX_FMT_RGB32_1 ||
  607. c->dstFormat == PIX_FMT_BGR24 ||
  608. c->dstFormat == PIX_FMT_RGB565BE ||
  609. c->dstFormat == PIX_FMT_RGB565LE ||
  610. c->dstFormat == PIX_FMT_RGB555BE ||
  611. c->dstFormat == PIX_FMT_RGB555LE ||
  612. c->dstFormat == PIX_FMT_RGB444BE ||
  613. c->dstFormat == PIX_FMT_RGB444LE ||
  614. c->dstFormat == PIX_FMT_RGB8 ||
  615. c->dstFormat == PIX_FMT_RGB4 ||
  616. c->dstFormat == PIX_FMT_RGB4_BYTE ||
  617. c->dstFormat == PIX_FMT_MONOBLACK;
  618. const int isNotNe = c->dstFormat == PIX_FMT_NE(RGB565LE, RGB565BE) ||
  619. c->dstFormat == PIX_FMT_NE(RGB555LE, RGB555BE) ||
  620. c->dstFormat == PIX_FMT_NE(RGB444LE, RGB444BE) ||
  621. c->dstFormat == PIX_FMT_NE(BGR565LE, BGR565BE) ||
  622. c->dstFormat == PIX_FMT_NE(BGR555LE, BGR555BE) ||
  623. c->dstFormat == PIX_FMT_NE(BGR444LE, BGR444BE);
  624. const int bpp = c->dstFormatBpp;
  625. uint8_t *y_table;
  626. uint16_t *y_table16;
  627. uint32_t *y_table32;
  628. int i, base, rbase, gbase, bbase, av_uninit(abase), needAlpha;
  629. const int yoffs = fullRange ? 384 : 326;
  630. int64_t crv = inv_table[0];
  631. int64_t cbu = inv_table[1];
  632. int64_t cgu = -inv_table[2];
  633. int64_t cgv = -inv_table[3];
  634. int64_t cy = 1 << 16;
  635. int64_t oy = 0;
  636. int64_t yb = 0;
  637. if (!fullRange) {
  638. cy = (cy * 255) / 219;
  639. oy = 16 << 16;
  640. } else {
  641. crv = (crv * 224) / 255;
  642. cbu = (cbu * 224) / 255;
  643. cgu = (cgu * 224) / 255;
  644. cgv = (cgv * 224) / 255;
  645. }
  646. cy = (cy * contrast) >> 16;
  647. crv = (crv * contrast * saturation) >> 32;
  648. cbu = (cbu * contrast * saturation) >> 32;
  649. cgu = (cgu * contrast * saturation) >> 32;
  650. cgv = (cgv * contrast * saturation) >> 32;
  651. oy -= 256 * brightness;
  652. c->uOffset = 0x0400040004000400LL;
  653. c->vOffset = 0x0400040004000400LL;
  654. c->yCoeff = roundToInt16(cy * 8192) * 0x0001000100010001ULL;
  655. c->vrCoeff = roundToInt16(crv * 8192) * 0x0001000100010001ULL;
  656. c->ubCoeff = roundToInt16(cbu * 8192) * 0x0001000100010001ULL;
  657. c->vgCoeff = roundToInt16(cgv * 8192) * 0x0001000100010001ULL;
  658. c->ugCoeff = roundToInt16(cgu * 8192) * 0x0001000100010001ULL;
  659. c->yOffset = roundToInt16(oy * 8) * 0x0001000100010001ULL;
  660. c->yuv2rgb_y_coeff = (int16_t)roundToInt16(cy << 13);
  661. c->yuv2rgb_y_offset = (int16_t)roundToInt16(oy << 9);
  662. c->yuv2rgb_v2r_coeff = (int16_t)roundToInt16(crv << 13);
  663. c->yuv2rgb_v2g_coeff = (int16_t)roundToInt16(cgv << 13);
  664. c->yuv2rgb_u2g_coeff = (int16_t)roundToInt16(cgu << 13);
  665. c->yuv2rgb_u2b_coeff = (int16_t)roundToInt16(cbu << 13);
  666. //scale coefficients by cy
  667. crv = ((crv << 16) + 0x8000) / cy;
  668. cbu = ((cbu << 16) + 0x8000) / cy;
  669. cgu = ((cgu << 16) + 0x8000) / cy;
  670. cgv = ((cgv << 16) + 0x8000) / cy;
  671. av_free(c->yuvTable);
  672. switch (bpp) {
  673. case 1:
  674. c->yuvTable = av_malloc(1024);
  675. y_table = c->yuvTable;
  676. yb = -(384 << 16) - oy;
  677. for (i = 0; i < 1024 - 110; i++) {
  678. y_table[i + 110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  679. yb += cy;
  680. }
  681. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  682. fill_gv_table(c->table_gV, 1, cgv);
  683. break;
  684. case 4:
  685. case 4 | 128:
  686. rbase = isRgb ? 3 : 0;
  687. gbase = 1;
  688. bbase = isRgb ? 0 : 3;
  689. c->yuvTable = av_malloc(1024 * 3);
  690. y_table = c->yuvTable;
  691. yb = -(384 << 16) - oy;
  692. for (i = 0; i < 1024 - 110; i++) {
  693. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  694. y_table[i + 110] = (yval >> 7) << rbase;
  695. y_table[i + 37 + 1024] = ((yval + 43) / 85) << gbase;
  696. y_table[i + 110 + 2048] = (yval >> 7) << bbase;
  697. yb += cy;
  698. }
  699. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  700. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  701. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  702. fill_gv_table(c->table_gV, 1, cgv);
  703. break;
  704. case 8:
  705. rbase = isRgb ? 5 : 0;
  706. gbase = isRgb ? 2 : 3;
  707. bbase = isRgb ? 0 : 6;
  708. c->yuvTable = av_malloc(1024 * 3);
  709. y_table = c->yuvTable;
  710. yb = -(384 << 16) - oy;
  711. for (i = 0; i < 1024 - 38; i++) {
  712. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  713. y_table[i + 16] = ((yval + 18) / 36) << rbase;
  714. y_table[i + 16 + 1024] = ((yval + 18) / 36) << gbase;
  715. y_table[i + 37 + 2048] = ((yval + 43) / 85) << bbase;
  716. yb += cy;
  717. }
  718. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  719. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  720. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  721. fill_gv_table(c->table_gV, 1, cgv);
  722. break;
  723. case 12:
  724. rbase = isRgb ? 8 : 0;
  725. gbase = 4;
  726. bbase = isRgb ? 0 : 8;
  727. c->yuvTable = av_malloc(1024 * 3 * 2);
  728. y_table16 = c->yuvTable;
  729. yb = -(384 << 16) - oy;
  730. for (i = 0; i < 1024; i++) {
  731. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  732. y_table16[i] = (yval >> 4) << rbase;
  733. y_table16[i + 1024] = (yval >> 4) << gbase;
  734. y_table16[i + 2048] = (yval >> 4) << bbase;
  735. yb += cy;
  736. }
  737. if (isNotNe)
  738. for (i = 0; i < 1024 * 3; i++)
  739. y_table16[i] = av_bswap16(y_table16[i]);
  740. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  741. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  742. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  743. fill_gv_table(c->table_gV, 2, cgv);
  744. break;
  745. case 15:
  746. case 16:
  747. rbase = isRgb ? bpp - 5 : 0;
  748. gbase = 5;
  749. bbase = isRgb ? 0 : (bpp - 5);
  750. c->yuvTable = av_malloc(1024 * 3 * 2);
  751. y_table16 = c->yuvTable;
  752. yb = -(384 << 16) - oy;
  753. for (i = 0; i < 1024; i++) {
  754. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  755. y_table16[i] = (yval >> 3) << rbase;
  756. y_table16[i + 1024] = (yval >> (18 - bpp)) << gbase;
  757. y_table16[i + 2048] = (yval >> 3) << bbase;
  758. yb += cy;
  759. }
  760. if (isNotNe)
  761. for (i = 0; i < 1024 * 3; i++)
  762. y_table16[i] = av_bswap16(y_table16[i]);
  763. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  764. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  765. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  766. fill_gv_table(c->table_gV, 2, cgv);
  767. break;
  768. case 24:
  769. case 48:
  770. c->yuvTable = av_malloc(1024);
  771. y_table = c->yuvTable;
  772. yb = -(384 << 16) - oy;
  773. for (i = 0; i < 1024; i++) {
  774. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  775. yb += cy;
  776. }
  777. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  778. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  779. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  780. fill_gv_table(c->table_gV, 1, cgv);
  781. break;
  782. case 32:
  783. base = (c->dstFormat == PIX_FMT_RGB32_1 ||
  784. c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  785. rbase = base + (isRgb ? 16 : 0);
  786. gbase = base + 8;
  787. bbase = base + (isRgb ? 0 : 16);
  788. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  789. if (!needAlpha)
  790. abase = (base + 24) & 31;
  791. c->yuvTable = av_malloc(1024 * 3 * 4);
  792. y_table32 = c->yuvTable;
  793. yb = -(384 << 16) - oy;
  794. for (i = 0; i < 1024; i++) {
  795. unsigned yval = av_clip_uint8((yb + 0x8000) >> 16);
  796. y_table32[i] = (yval << rbase) +
  797. (needAlpha ? 0 : (255u << abase));
  798. y_table32[i + 1024] = yval << gbase;
  799. y_table32[i + 2048] = yval << bbase;
  800. yb += cy;
  801. }
  802. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  803. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  804. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  805. fill_gv_table(c->table_gV, 4, cgv);
  806. break;
  807. default:
  808. c->yuvTable = NULL;
  809. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  810. return -1;
  811. }
  812. return 0;
  813. }