yuv2rgb.c 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825
  1. /*
  2. * software YUV to RGB converter
  3. *
  4. * Copyright (C) 2009 Konstantin Shishkov
  5. *
  6. * 1,4,8bpp support and context / deglobalize stuff
  7. * by Michael Niedermayer (michaelni@gmx.at)
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include <stdio.h>
  26. #include <stdlib.h>
  27. #include <inttypes.h>
  28. #include <assert.h>
  29. #include "config.h"
  30. #include "rgb2rgb.h"
  31. #include "swscale.h"
  32. #include "swscale_internal.h"
  33. #include "libavutil/x86_cpu.h"
  34. #include "libavutil/bswap.h"
  35. extern const uint8_t dither_4x4_16[4][8];
  36. extern const uint8_t dither_8x8_32[8][8];
  37. extern const uint8_t dither_8x8_73[8][8];
  38. extern const uint8_t dither_8x8_220[8][8];
  /*
   * YUV -> RGB conversion coefficients, one row per colorspace index 0..7.
   * ff_yuv2rgb_c_init_tables() reads a row as { crv, cbu, cgu, cgv } and
   * negates the last two entries before using them.
   */
  const int32_t ff_yuv2rgb_coeffs[8][4] = {
      /* 0: no sequence_display_extension */ { 117504, 138453, 13954, 34903 },
      /* 1: ITU-R Rec. 709 (1990)         */ { 117504, 138453, 13954, 34903 },
      /* 2: unspecified                   */ { 104597, 132201, 25675, 53279 },
      /* 3: reserved                      */ { 104597, 132201, 25675, 53279 },
      /* 4: FCC                           */ { 104448, 132798, 24759, 53109 },
      /* 5: ITU-R Rec. 624-4 System B, G  */ { 104597, 132201, 25675, 53279 },
      /* 6: SMPTE 170M                    */ { 104597, 132201, 25675, 53279 },
      /* 7: SMPTE 240M (1987)             */ { 117579, 136230, 16907, 35559 },
  };
  49. const int *sws_getCoefficients(int colorspace)
  50. {
  51. if (colorspace > 7 || colorspace < 0)
  52. colorspace = SWS_CS_DEFAULT;
  53. return ff_yuv2rgb_coeffs[colorspace];
  54. }
  /*
   * Per-pixel-pair helpers expanded inside the YUV2RGBFUNC() bodies.
   * They rely on locals declared by that skeleton: c, pu, pv, U, V, Y and the
   * table pointers r, g, b.
   *
   * Every argument is parenthesized so that expressions such as "k + 1" index
   * correctly, and each macro is a single do { } while (0) statement.
   */

  /* Load chroma sample i and select the r/g/b lookup tables for it. */
  #define LOADCHROMA(i) \
      do { \
          U = pu[(i)]; \
          V = pv[(i)]; \
          r = (void *)c->table_rV[V]; \
          g = (void *)(c->table_gU[U] + c->table_gV[V]); \
          b = (void *)c->table_bU[U]; \
      } while (0)

  /* Packed formats: the three table entries are summed into one pixel. */
  #define PUTRGB(dst,src,i) \
      do { \
          Y = (src)[2*(i)]; \
          (dst)[2*(i)  ] = r[Y] + g[Y] + b[Y]; \
          Y = (src)[2*(i)+1]; \
          (dst)[2*(i)+1] = r[Y] + g[Y] + b[Y]; \
      } while (0)

  /* 24-bit output, byte order R, G, B. */
  #define PUTRGB24(dst,src,i) \
      do { \
          Y = (src)[2*(i)]; \
          (dst)[6*(i)+0] = r[Y]; (dst)[6*(i)+1] = g[Y]; (dst)[6*(i)+2] = b[Y]; \
          Y = (src)[2*(i)+1]; \
          (dst)[6*(i)+3] = r[Y]; (dst)[6*(i)+4] = g[Y]; (dst)[6*(i)+5] = b[Y]; \
      } while (0)

  /* 24-bit output, byte order B, G, R. */
  #define PUTBGR24(dst,src,i) \
      do { \
          Y = (src)[2*(i)]; \
          (dst)[6*(i)+0] = b[Y]; (dst)[6*(i)+1] = g[Y]; (dst)[6*(i)+2] = r[Y]; \
          Y = (src)[2*(i)+1]; \
          (dst)[6*(i)+3] = b[Y]; (dst)[6*(i)+4] = g[Y]; (dst)[6*(i)+5] = r[Y]; \
      } while (0)

  /*
   * Packed output plus an alpha sample shifted left by s bits.
   * The alpha byte is widened to uint32_t first: shifting the promoted int by
   * 24 would overflow for alpha >= 128.
   */
  #define PUTRGBA(dst,ysrc,asrc,i,s) \
      do { \
          Y = (ysrc)[2*(i)]; \
          (dst)[2*(i)  ] = r[Y] + g[Y] + b[Y] + ((uint32_t)(asrc)[2*(i)  ] << (s)); \
          Y = (ysrc)[2*(i)+1]; \
          (dst)[2*(i)+1] = r[Y] + g[Y] + b[Y] + ((uint32_t)(asrc)[2*(i)+1] << (s)); \
      } while (0)

  /* 48-bit output: each 8-bit component is stored in two consecutive bytes. */
  #define PUTRGB48(dst,src,i) \
      do { \
          Y = (src)[2*(i)]; \
          (dst)[12*(i)+ 0] = (dst)[12*(i)+ 1] = r[Y]; \
          (dst)[12*(i)+ 2] = (dst)[12*(i)+ 3] = g[Y]; \
          (dst)[12*(i)+ 4] = (dst)[12*(i)+ 5] = b[Y]; \
          Y = (src)[2*(i)+1]; \
          (dst)[12*(i)+ 6] = (dst)[12*(i)+ 7] = r[Y]; \
          (dst)[12*(i)+ 8] = (dst)[12*(i)+ 9] = g[Y]; \
          (dst)[12*(i)+10] = (dst)[12*(i)+11] = b[Y]; \
      } while (0)
  /*
   * Function skeleton shared by the C converters below.
   *
   *   YUV2RGBFUNC(name, type, alpha)   opens the function, the row-pair loop
   *                                    (two rows per step) and the inner loop
   *                                    over groups of 8 pixels (dstW >> 3);
   *   ENDYUV2RGBLINE(delta)            advances the plane pointers, closes the
   *                                    inner loop and opens the (dstW & 4) tail;
   *   ENDYUV2RGBFUNC()                 closes the tail, the row loop and the
   *                                    function, returning srcSliceH;
   *   CLOSEYUV2RGBFUNC(delta)          both closers with an empty tail.
   *
   * The first two macros are intentionally left open: the blank line after
   * each of them ends the definition, and the converter body supplies the
   * statements in between. When alpha is 0 and the source is PIX_FMT_YUV422P
   * the chroma strides in srcStride[] are doubled in place. The alpha pointers
   * pa_1/pa_2 are not advanced here; alpha converters do that themselves.
   */
  #define YUV2RGBFUNC(func_name, dst_type, alpha) \
  static int func_name(SwsContext *c, const uint8_t* src[], int srcStride[], int srcSliceY, \
                       int srcSliceH, uint8_t* dst[], int dstStride[]) \
  { \
      int y; \
  \
      if (!alpha && c->srcFormat == PIX_FMT_YUV422P) { \
          srcStride[1] *= 2; \
          srcStride[2] *= 2; \
      } \
      for (y=0; y<srcSliceH; y+=2) { \
          dst_type *dst_1 = (dst_type*)(dst[0] + (y+srcSliceY  )*dstStride[0]); \
          dst_type *dst_2 = (dst_type*)(dst[0] + (y+srcSliceY+1)*dstStride[0]); \
          dst_type av_unused *r, *b; \
          dst_type *g; \
          const uint8_t *py_1 = src[0] + y*srcStride[0]; \
          const uint8_t *py_2 = py_1 + srcStride[0]; \
          const uint8_t *pu = src[1] + (y>>1)*srcStride[1]; \
          const uint8_t *pv = src[2] + (y>>1)*srcStride[2]; \
          const uint8_t av_unused *pa_1, *pa_2; \
          unsigned int groups_left = c->dstW>>3; \
          if (alpha) { \
              pa_1 = src[3] + y*srcStride[3]; \
              pa_2 = pa_1 + srcStride[3]; \
          } \
          while (groups_left--) { \
              int av_unused U, V; \
              int Y; \

  #define ENDYUV2RGBLINE(dst_delta) \
              pu    += 4; \
              pv    += 4; \
              py_1  += 8; \
              py_2  += 8; \
              dst_1 += dst_delta; \
              dst_2 += dst_delta; \
          } \
          if (c->dstW & 4) { \
              int av_unused Y, U, V; \

  #define ENDYUV2RGBFUNC() \
          } \
      } \
      return srcSliceH; \
  }

  #define CLOSEYUV2RGBFUNC(dst_delta) \
      ENDYUV2RGBLINE(dst_delta) \
      ENDYUV2RGBFUNC()
  136. YUV2RGBFUNC(yuv2rgb_c_48, uint8_t, 0)
  137. LOADCHROMA(0);
  138. PUTRGB48(dst_1,py_1,0);
  139. PUTRGB48(dst_2,py_2,0);
  140. LOADCHROMA(1);
  141. PUTRGB48(dst_2,py_2,1);
  142. PUTRGB48(dst_1,py_1,1);
  143. LOADCHROMA(2);
  144. PUTRGB48(dst_1,py_1,2);
  145. PUTRGB48(dst_2,py_2,2);
  146. LOADCHROMA(3);
  147. PUTRGB48(dst_2,py_2,3);
  148. PUTRGB48(dst_1,py_1,3);
  149. ENDYUV2RGBLINE(48)
  150. LOADCHROMA(0);
  151. PUTRGB48(dst_1,py_1,0);
  152. PUTRGB48(dst_2,py_2,0);
  153. LOADCHROMA(1);
  154. PUTRGB48(dst_2,py_2,1);
  155. PUTRGB48(dst_1,py_1,1);
  156. ENDYUV2RGBFUNC()
  157. YUV2RGBFUNC(yuv2rgb_c_32, uint32_t, 0)
  158. LOADCHROMA(0);
  159. PUTRGB(dst_1,py_1,0);
  160. PUTRGB(dst_2,py_2,0);
  161. LOADCHROMA(1);
  162. PUTRGB(dst_2,py_2,1);
  163. PUTRGB(dst_1,py_1,1);
  164. LOADCHROMA(2);
  165. PUTRGB(dst_1,py_1,2);
  166. PUTRGB(dst_2,py_2,2);
  167. LOADCHROMA(3);
  168. PUTRGB(dst_2,py_2,3);
  169. PUTRGB(dst_1,py_1,3);
  170. ENDYUV2RGBLINE(8)
  171. LOADCHROMA(0);
  172. PUTRGB(dst_1,py_1,0);
  173. PUTRGB(dst_2,py_2,0);
  174. LOADCHROMA(1);
  175. PUTRGB(dst_2,py_2,1);
  176. PUTRGB(dst_1,py_1,1);
  177. ENDYUV2RGBFUNC()
  178. YUV2RGBFUNC(yuva2rgba_c, uint32_t, 1)
  179. LOADCHROMA(0);
  180. PUTRGBA(dst_1,py_1,pa_1,0,24);
  181. PUTRGBA(dst_2,py_2,pa_2,0,24);
  182. LOADCHROMA(1);
  183. PUTRGBA(dst_2,py_2,pa_1,1,24);
  184. PUTRGBA(dst_1,py_1,pa_2,1,24);
  185. LOADCHROMA(2);
  186. PUTRGBA(dst_1,py_1,pa_1,2,24);
  187. PUTRGBA(dst_2,py_2,pa_2,2,24);
  188. LOADCHROMA(3);
  189. PUTRGBA(dst_2,py_2,pa_1,3,24);
  190. PUTRGBA(dst_1,py_1,pa_2,3,24);
  191. pa_1 += 8;\
  192. pa_2 += 8;\
  193. ENDYUV2RGBLINE(8)
  194. LOADCHROMA(0);
  195. PUTRGBA(dst_1,py_1,pa_1,0,24);
  196. PUTRGBA(dst_2,py_2,pa_2,0,24);
  197. LOADCHROMA(1);
  198. PUTRGBA(dst_2,py_2,pa_1,1,24);
  199. PUTRGBA(dst_1,py_1,pa_2,1,24);
  200. ENDYUV2RGBFUNC()
  201. YUV2RGBFUNC(yuva2argb_c, uint32_t, 1)
  202. LOADCHROMA(0);
  203. PUTRGBA(dst_1,py_1,pa_1,0,0);
  204. PUTRGBA(dst_2,py_2,pa_2,0,0);
  205. LOADCHROMA(1);
  206. PUTRGBA(dst_2,py_2,pa_2,1,0);
  207. PUTRGBA(dst_1,py_1,pa_1,1,0);
  208. LOADCHROMA(2);
  209. PUTRGBA(dst_1,py_1,pa_1,2,0);
  210. PUTRGBA(dst_2,py_2,pa_2,2,0);
  211. LOADCHROMA(3);
  212. PUTRGBA(dst_2,py_2,pa_2,3,0);
  213. PUTRGBA(dst_1,py_1,pa_1,3,0);
  214. pa_1 += 8;\
  215. pa_2 += 8;\
  216. ENDYUV2RGBLINE(8)
  217. LOADCHROMA(0);
  218. PUTRGBA(dst_1,py_1,pa_1,0,0);
  219. PUTRGBA(dst_2,py_2,pa_2,0,0);
  220. LOADCHROMA(1);
  221. PUTRGBA(dst_2,py_2,pa_2,1,0);
  222. PUTRGBA(dst_1,py_1,pa_1,1,0);
  223. ENDYUV2RGBFUNC()
  224. YUV2RGBFUNC(yuv2rgb_c_24_rgb, uint8_t, 0)
  225. LOADCHROMA(0);
  226. PUTRGB24(dst_1,py_1,0);
  227. PUTRGB24(dst_2,py_2,0);
  228. LOADCHROMA(1);
  229. PUTRGB24(dst_2,py_2,1);
  230. PUTRGB24(dst_1,py_1,1);
  231. LOADCHROMA(2);
  232. PUTRGB24(dst_1,py_1,2);
  233. PUTRGB24(dst_2,py_2,2);
  234. LOADCHROMA(3);
  235. PUTRGB24(dst_2,py_2,3);
  236. PUTRGB24(dst_1,py_1,3);
  237. ENDYUV2RGBLINE(24)
  238. LOADCHROMA(0);
  239. PUTRGB24(dst_1,py_1,0);
  240. PUTRGB24(dst_2,py_2,0);
  241. LOADCHROMA(1);
  242. PUTRGB24(dst_2,py_2,1);
  243. PUTRGB24(dst_1,py_1,1);
  244. ENDYUV2RGBFUNC()
  245. // only trivial mods from yuv2rgb_c_24_rgb
  246. YUV2RGBFUNC(yuv2rgb_c_24_bgr, uint8_t, 0)
  247. LOADCHROMA(0);
  248. PUTBGR24(dst_1,py_1,0);
  249. PUTBGR24(dst_2,py_2,0);
  250. LOADCHROMA(1);
  251. PUTBGR24(dst_2,py_2,1);
  252. PUTBGR24(dst_1,py_1,1);
  253. LOADCHROMA(2);
  254. PUTBGR24(dst_1,py_1,2);
  255. PUTBGR24(dst_2,py_2,2);
  256. LOADCHROMA(3);
  257. PUTBGR24(dst_2,py_2,3);
  258. PUTBGR24(dst_1,py_1,3);
  259. ENDYUV2RGBLINE(24)
  260. LOADCHROMA(0);
  261. PUTBGR24(dst_1,py_1,0);
  262. PUTBGR24(dst_2,py_2,0);
  263. LOADCHROMA(1);
  264. PUTBGR24(dst_2,py_2,1);
  265. PUTBGR24(dst_1,py_1,1);
  266. ENDYUV2RGBFUNC()
  267. // This is exactly the same code as yuv2rgb_c_32 except for the types of
  268. // r, g, b, dst_1, dst_2
  269. YUV2RGBFUNC(yuv2rgb_c_16, uint16_t, 0)
  270. LOADCHROMA(0);
  271. PUTRGB(dst_1,py_1,0);
  272. PUTRGB(dst_2,py_2,0);
  273. LOADCHROMA(1);
  274. PUTRGB(dst_2,py_2,1);
  275. PUTRGB(dst_1,py_1,1);
  276. LOADCHROMA(2);
  277. PUTRGB(dst_1,py_1,2);
  278. PUTRGB(dst_2,py_2,2);
  279. LOADCHROMA(3);
  280. PUTRGB(dst_2,py_2,3);
  281. PUTRGB(dst_1,py_1,3);
  282. CLOSEYUV2RGBFUNC(8)
  #if 0 // Currently unused
  /*
   * YUV -> packed 8-bit pixels without dithering. Same main loop as
   * yuv2rgb_c_32; only the element type of r, g, b, dst_1 and dst_2 differs.
   */
  YUV2RGBFUNC(yuv2rgb_c_8, uint8_t, 0)
      LOADCHROMA(0);
      PUTRGB(dst_1,py_1,0);
      PUTRGB(dst_2,py_2,0);

      LOADCHROMA(1);
      PUTRGB(dst_2,py_2,1);
      PUTRGB(dst_1,py_1,1);

      LOADCHROMA(2);
      PUTRGB(dst_1,py_1,2);
      PUTRGB(dst_2,py_2,2);

      LOADCHROMA(3);
      PUTRGB(dst_2,py_2,3);
      PUTRGB(dst_1,py_1,3);
  CLOSEYUV2RGBFUNC(8)
  #endif
  301. // r, g, b, dst_1, dst_2
  302. YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
  303. const uint8_t *d16 = dither_4x4_16[y&3];
  304. #define PUTRGB12(dst,src,i,o) \
  305. Y = src[2*i]; \
  306. dst[2*i] = r[Y+d16[0+o]] + g[Y+d16[0+o]] + b[Y+d16[0+o]]; \
  307. Y = src[2*i+1]; \
  308. dst[2*i+1] = r[Y+d16[1+o]] + g[Y+d16[1+o]] + b[Y+d16[1+o]];
  309. LOADCHROMA(0);
  310. PUTRGB12(dst_1,py_1,0,0);
  311. PUTRGB12(dst_2,py_2,0,0+8);
  312. LOADCHROMA(1);
  313. PUTRGB12(dst_2,py_2,1,2+8);
  314. PUTRGB12(dst_1,py_1,1,2);
  315. LOADCHROMA(2);
  316. PUTRGB12(dst_1,py_1,2,4);
  317. PUTRGB12(dst_2,py_2,2,4+8);
  318. LOADCHROMA(3);
  319. PUTRGB12(dst_2,py_2,3,6+8);
  320. PUTRGB12(dst_1,py_1,3,6);
  321. CLOSEYUV2RGBFUNC(8)
  322. // r, g, b, dst_1, dst_2
  323. YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
  324. const uint8_t *d32 = dither_8x8_32[y&7];
  325. const uint8_t *d64 = dither_8x8_73[y&7];
  326. #define PUTRGB8(dst,src,i,o) \
  327. Y = src[2*i]; \
  328. dst[2*i] = r[Y+d32[0+o]] + g[Y+d32[0+o]] + b[Y+d64[0+o]]; \
  329. Y = src[2*i+1]; \
  330. dst[2*i+1] = r[Y+d32[1+o]] + g[Y+d32[1+o]] + b[Y+d64[1+o]];
  331. LOADCHROMA(0);
  332. PUTRGB8(dst_1,py_1,0,0);
  333. PUTRGB8(dst_2,py_2,0,0+8);
  334. LOADCHROMA(1);
  335. PUTRGB8(dst_2,py_2,1,2+8);
  336. PUTRGB8(dst_1,py_1,1,2);
  337. LOADCHROMA(2);
  338. PUTRGB8(dst_1,py_1,2,4);
  339. PUTRGB8(dst_2,py_2,2,4+8);
  340. LOADCHROMA(3);
  341. PUTRGB8(dst_2,py_2,3,6+8);
  342. PUTRGB8(dst_1,py_1,3,6);
  343. CLOSEYUV2RGBFUNC(8)
  #if 0 // Currently unused
  /*
   * YUV -> 4-bit pixels without dithering, two pixels packed per output byte:
   * the first pixel goes to the low nibble, the second is shifted left by 4.
   */
  YUV2RGBFUNC(yuv2rgb_c_4, uint8_t, 0)
      int acc;

  #define PUTRGB4(dst,src,i) \
      Y = src[2*i]; \
      acc = r[Y] + g[Y] + b[Y]; \
      Y = src[2*i+1]; \
      acc |= (r[Y] + g[Y] + b[Y])<<4; \
      dst[i] = acc;

      LOADCHROMA(0);
      PUTRGB4(dst_1,py_1,0);
      PUTRGB4(dst_2,py_2,0);

      LOADCHROMA(1);
      PUTRGB4(dst_2,py_2,1);
      PUTRGB4(dst_1,py_1,1);

      LOADCHROMA(2);
      PUTRGB4(dst_1,py_1,2);
      PUTRGB4(dst_2,py_2,2);

      LOADCHROMA(3);
      PUTRGB4(dst_2,py_2,3);
      PUTRGB4(dst_1,py_1,3);
  CLOSEYUV2RGBFUNC(4)
  #endif
  369. YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
  370. const uint8_t *d64 = dither_8x8_73[y&7];
  371. const uint8_t *d128 = dither_8x8_220[y&7];
  372. int acc;
  373. #define PUTRGB4D(dst,src,i,o) \
  374. Y = src[2*i]; \
  375. acc = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
  376. Y = src[2*i+1]; \
  377. acc |= (r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]])<<4; \
  378. dst[i]= acc;
  379. LOADCHROMA(0);
  380. PUTRGB4D(dst_1,py_1,0,0);
  381. PUTRGB4D(dst_2,py_2,0,0+8);
  382. LOADCHROMA(1);
  383. PUTRGB4D(dst_2,py_2,1,2+8);
  384. PUTRGB4D(dst_1,py_1,1,2);
  385. LOADCHROMA(2);
  386. PUTRGB4D(dst_1,py_1,2,4);
  387. PUTRGB4D(dst_2,py_2,2,4+8);
  388. LOADCHROMA(3);
  389. PUTRGB4D(dst_2,py_2,3,6+8);
  390. PUTRGB4D(dst_1,py_1,3,6);
  391. CLOSEYUV2RGBFUNC(4)
  #if 0 // Currently unused
  /*
   * YUV -> 4-bit pixels stored one per byte, without dithering. Same main
   * loop as yuv2rgb_c_32; only the element type of r, g, b, dst_1 and dst_2
   * differs.
   */
  YUV2RGBFUNC(yuv2rgb_c_4b, uint8_t, 0)
      LOADCHROMA(0);
      PUTRGB(dst_1,py_1,0);
      PUTRGB(dst_2,py_2,0);

      LOADCHROMA(1);
      PUTRGB(dst_2,py_2,1);
      PUTRGB(dst_1,py_1,1);

      LOADCHROMA(2);
      PUTRGB(dst_1,py_1,2);
      PUTRGB(dst_2,py_2,2);

      LOADCHROMA(3);
      PUTRGB(dst_2,py_2,3);
      PUTRGB(dst_1,py_1,3);
  CLOSEYUV2RGBFUNC(8)
  #endif
  410. YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
  411. const uint8_t *d64 = dither_8x8_73[y&7];
  412. const uint8_t *d128 = dither_8x8_220[y&7];
  413. #define PUTRGB4DB(dst,src,i,o) \
  414. Y = src[2*i]; \
  415. dst[2*i] = r[Y+d128[0+o]] + g[Y+d64[0+o]] + b[Y+d128[0+o]]; \
  416. Y = src[2*i+1]; \
  417. dst[2*i+1] = r[Y+d128[1+o]] + g[Y+d64[1+o]] + b[Y+d128[1+o]];
  418. LOADCHROMA(0);
  419. PUTRGB4DB(dst_1,py_1,0,0);
  420. PUTRGB4DB(dst_2,py_2,0,0+8);
  421. LOADCHROMA(1);
  422. PUTRGB4DB(dst_2,py_2,1,2+8);
  423. PUTRGB4DB(dst_1,py_1,1,2);
  424. LOADCHROMA(2);
  425. PUTRGB4DB(dst_1,py_1,2,4);
  426. PUTRGB4DB(dst_2,py_2,2,4+8);
  427. LOADCHROMA(3);
  428. PUTRGB4DB(dst_2,py_2,3,6+8);
  429. PUTRGB4DB(dst_1,py_1,3,6);
  430. CLOSEYUV2RGBFUNC(8)
  431. YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
  432. const uint8_t *d128 = dither_8x8_220[y&7];
  433. char out_1 = 0, out_2 = 0;
  434. g= c->table_gU[128] + c->table_gV[128];
  435. #define PUTRGB1(out,src,i,o) \
  436. Y = src[2*i]; \
  437. out+= out + g[Y+d128[0+o]]; \
  438. Y = src[2*i+1]; \
  439. out+= out + g[Y+d128[1+o]];
  440. PUTRGB1(out_1,py_1,0,0);
  441. PUTRGB1(out_2,py_2,0,0+8);
  442. PUTRGB1(out_2,py_2,1,2+8);
  443. PUTRGB1(out_1,py_1,1,2);
  444. PUTRGB1(out_1,py_1,2,4);
  445. PUTRGB1(out_2,py_2,2,4+8);
  446. PUTRGB1(out_2,py_2,3,6+8);
  447. PUTRGB1(out_1,py_1,3,6);
  448. dst_1[0]= out_1;
  449. dst_2[0]= out_2;
  450. CLOSEYUV2RGBFUNC(1)
  451. SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c)
  452. {
  453. SwsFunc t = NULL;
  454. #if HAVE_MMX
  455. t = ff_yuv2rgb_init_mmx(c);
  456. #endif
  457. #if HAVE_VIS
  458. t = ff_yuv2rgb_init_vis(c);
  459. #endif
  460. #if CONFIG_MLIB
  461. t = ff_yuv2rgb_init_mlib(c);
  462. #endif
  463. #if HAVE_ALTIVEC
  464. if (c->flags & SWS_CPU_CAPS_ALTIVEC)
  465. t = ff_yuv2rgb_init_altivec(c);
  466. #endif
  467. #if ARCH_BFIN
  468. if (c->flags & SWS_CPU_CAPS_BFIN)
  469. t = ff_yuv2rgb_get_func_ptr_bfin(c);
  470. #endif
  471. if (t)
  472. return t;
  473. av_log(c, AV_LOG_WARNING, "No accelerated colorspace conversion found from %s to %s.\n", sws_format_name(c->srcFormat), sws_format_name(c->dstFormat));
  474. switch (c->dstFormat) {
  475. case PIX_FMT_RGB48BE:
  476. case PIX_FMT_RGB48LE: return yuv2rgb_c_48;
  477. case PIX_FMT_ARGB:
  478. case PIX_FMT_ABGR: if (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) return yuva2argb_c;
  479. case PIX_FMT_RGBA:
  480. case PIX_FMT_BGRA: return (CONFIG_SWSCALE_ALPHA && c->srcFormat == PIX_FMT_YUVA420P) ? yuva2rgba_c : yuv2rgb_c_32;
  481. case PIX_FMT_RGB24: return yuv2rgb_c_24_rgb;
  482. case PIX_FMT_BGR24: return yuv2rgb_c_24_bgr;
  483. case PIX_FMT_RGB565:
  484. case PIX_FMT_BGR565:
  485. case PIX_FMT_RGB555:
  486. case PIX_FMT_BGR555: return yuv2rgb_c_16;
  487. case PIX_FMT_RGB444:
  488. case PIX_FMT_BGR444: return yuv2rgb_c_12_ordered_dither;
  489. case PIX_FMT_RGB8:
  490. case PIX_FMT_BGR8: return yuv2rgb_c_8_ordered_dither;
  491. case PIX_FMT_RGB4:
  492. case PIX_FMT_BGR4: return yuv2rgb_c_4_ordered_dither;
  493. case PIX_FMT_RGB4_BYTE:
  494. case PIX_FMT_BGR4_BYTE: return yuv2rgb_c_4b_ordered_dither;
  495. case PIX_FMT_MONOBLACK: return yuv2rgb_c_1_ordered_dither;
  496. default:
  497. assert(0);
  498. }
  499. return NULL;
  500. }
  /**
   * Fill a 256-entry table of pointers into a luma lookup table.
   *
   * Entry i points at y_table shifted by elemsize * (((i * inc) >> 16) - (inc >> 9))
   * bytes.
   *
   * @param table    receives the 256 pointers
   * @param elemsize size in bytes of one y_table element
   * @param inc      per-index increment, 16 fractional bits
   * @param y_table  base position inside the luma lookup table
   */
  static void fill_table(uint8_t* table[256], const int elemsize, const int inc, uint8_t *y_table)
  {
      uint8_t *const origin = y_table - elemsize * (inc >> 9);
      int64_t acc = 0;
      int idx = 0;

      while (idx < 256) {
          table[idx++] = origin + elemsize * (acc >> 16);
          acc += inc;
      }
  }
  /**
   * Fill a 256-entry table of byte offsets, the integer counterpart of
   * fill_table().
   *
   * Entry i is elemsize * (((i * inc) >> 16) - (inc >> 9)).
   *
   * @param table    receives the 256 offsets
   * @param elemsize size in bytes of one lookup-table element
   * @param inc      per-index increment, 16 fractional bits
   */
  static void fill_gv_table(int table[256], const int elemsize, const int inc)
  {
      const int bias = -(inc >> 9);
      int *const end = table + 256;
      int64_t acc = 0;
      int *slot;

      for (slot = table; slot != end; ++slot, acc += inc)
          *slot = elemsize * (bias + (acc >> 16));
  }
  521. av_cold int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4], int fullRange,
  522. int brightness, int contrast, int saturation)
  523. {
  524. const int isRgb = c->dstFormat==PIX_FMT_RGB32
  525. || c->dstFormat==PIX_FMT_RGB32_1
  526. || c->dstFormat==PIX_FMT_BGR24
  527. || c->dstFormat==PIX_FMT_RGB565BE
  528. || c->dstFormat==PIX_FMT_RGB565LE
  529. || c->dstFormat==PIX_FMT_RGB555BE
  530. || c->dstFormat==PIX_FMT_RGB555LE
  531. || c->dstFormat==PIX_FMT_RGB444BE
  532. || c->dstFormat==PIX_FMT_RGB444LE
  533. || c->dstFormat==PIX_FMT_RGB8
  534. || c->dstFormat==PIX_FMT_RGB4
  535. || c->dstFormat==PIX_FMT_RGB4_BYTE
  536. || c->dstFormat==PIX_FMT_MONOBLACK;
  537. const int isNotNe = c->dstFormat==PIX_FMT_NE(RGB565LE,RGB565BE)
  538. || c->dstFormat==PIX_FMT_NE(RGB555LE,RGB555BE)
  539. || c->dstFormat==PIX_FMT_NE(RGB444LE,RGB444BE)
  540. || c->dstFormat==PIX_FMT_NE(BGR565LE,BGR565BE)
  541. || c->dstFormat==PIX_FMT_NE(BGR555LE,BGR555BE)
  542. || c->dstFormat==PIX_FMT_NE(BGR444LE,BGR444BE);
  543. const int bpp = c->dstFormatBpp;
  544. uint8_t *y_table;
  545. uint16_t *y_table16;
  546. uint32_t *y_table32;
  547. int i, base, rbase, gbase, bbase, abase, needAlpha;
  548. const int yoffs = fullRange ? 384 : 326;
  549. int64_t crv = inv_table[0];
  550. int64_t cbu = inv_table[1];
  551. int64_t cgu = -inv_table[2];
  552. int64_t cgv = -inv_table[3];
  553. int64_t cy = 1<<16;
  554. int64_t oy = 0;
  555. int64_t yb = 0;
  556. if (!fullRange) {
  557. cy = (cy*255) / 219;
  558. oy = 16<<16;
  559. } else {
  560. crv = (crv*224) / 255;
  561. cbu = (cbu*224) / 255;
  562. cgu = (cgu*224) / 255;
  563. cgv = (cgv*224) / 255;
  564. }
  565. cy = (cy *contrast ) >> 16;
  566. crv = (crv*contrast * saturation) >> 32;
  567. cbu = (cbu*contrast * saturation) >> 32;
  568. cgu = (cgu*contrast * saturation) >> 32;
  569. cgv = (cgv*contrast * saturation) >> 32;
  570. oy -= 256*brightness;
  571. //scale coefficients by cy
  572. crv = ((crv << 16) + 0x8000) / cy;
  573. cbu = ((cbu << 16) + 0x8000) / cy;
  574. cgu = ((cgu << 16) + 0x8000) / cy;
  575. cgv = ((cgv << 16) + 0x8000) / cy;
  576. av_free(c->yuvTable);
  577. switch (bpp) {
  578. case 1:
  579. c->yuvTable = av_malloc(1024);
  580. y_table = c->yuvTable;
  581. yb = -(384<<16) - oy;
  582. for (i = 0; i < 1024-110; i++) {
  583. y_table[i+110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
  584. yb += cy;
  585. }
  586. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  587. fill_gv_table(c->table_gV, 1, cgv);
  588. break;
  589. case 4:
  590. case 4|128:
  591. rbase = isRgb ? 3 : 0;
  592. gbase = 1;
  593. bbase = isRgb ? 0 : 3;
  594. c->yuvTable = av_malloc(1024*3);
  595. y_table = c->yuvTable;
  596. yb = -(384<<16) - oy;
  597. for (i = 0; i < 1024-110; i++) {
  598. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  599. y_table[i+110 ] = (yval >> 7) << rbase;
  600. y_table[i+ 37+1024] = ((yval + 43) / 85) << gbase;
  601. y_table[i+110+2048] = (yval >> 7) << bbase;
  602. yb += cy;
  603. }
  604. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  605. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  606. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  607. fill_gv_table(c->table_gV, 1, cgv);
  608. break;
  609. case 8:
  610. rbase = isRgb ? 5 : 0;
  611. gbase = isRgb ? 2 : 3;
  612. bbase = isRgb ? 0 : 6;
  613. c->yuvTable = av_malloc(1024*3);
  614. y_table = c->yuvTable;
  615. yb = -(384<<16) - oy;
  616. for (i = 0; i < 1024-38; i++) {
  617. int yval = av_clip_uint8((yb + 0x8000) >> 16);
  618. y_table[i+16 ] = ((yval + 18) / 36) << rbase;
  619. y_table[i+16+1024] = ((yval + 18) / 36) << gbase;
  620. y_table[i+37+2048] = ((yval + 43) / 85) << bbase;
  621. yb += cy;
  622. }
  623. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  624. fill_table(c->table_gU, 1, cgu, y_table + yoffs + 1024);
  625. fill_table(c->table_bU, 1, cbu, y_table + yoffs + 2048);
  626. fill_gv_table(c->table_gV, 1, cgv);
  627. break;
  628. case 12:
  629. rbase = isRgb ? 8 : 0;
  630. gbase = 4;
  631. bbase = isRgb ? 0 : 8;
  632. c->yuvTable = av_malloc(1024*3*2);
  633. y_table16 = c->yuvTable;
  634. yb = -(384<<16) - oy;
  635. for (i = 0; i < 1024; i++) {
  636. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  637. y_table16[i ] = (yval >> 4) << rbase;
  638. y_table16[i+1024] = (yval >> 4) << gbase;
  639. y_table16[i+2048] = (yval >> 4) << bbase;
  640. yb += cy;
  641. }
  642. if (isNotNe)
  643. for (i = 0; i < 1024*3; i++)
  644. y_table16[i] = bswap_16(y_table16[i]);
  645. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  646. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  647. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  648. fill_gv_table(c->table_gV, 2, cgv);
  649. break;
  650. case 15:
  651. case 16:
  652. rbase = isRgb ? bpp - 5 : 0;
  653. gbase = 5;
  654. bbase = isRgb ? 0 : (bpp - 5);
  655. c->yuvTable = av_malloc(1024*3*2);
  656. y_table16 = c->yuvTable;
  657. yb = -(384<<16) - oy;
  658. for (i = 0; i < 1024; i++) {
  659. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  660. y_table16[i ] = (yval >> 3) << rbase;
  661. y_table16[i+1024] = (yval >> (18 - bpp)) << gbase;
  662. y_table16[i+2048] = (yval >> 3) << bbase;
  663. yb += cy;
  664. }
  665. if(isNotNe)
  666. for (i = 0; i < 1024*3; i++)
  667. y_table16[i] = bswap_16(y_table16[i]);
  668. fill_table(c->table_rV, 2, crv, y_table16 + yoffs);
  669. fill_table(c->table_gU, 2, cgu, y_table16 + yoffs + 1024);
  670. fill_table(c->table_bU, 2, cbu, y_table16 + yoffs + 2048);
  671. fill_gv_table(c->table_gV, 2, cgv);
  672. break;
  673. case 24:
  674. case 48:
  675. c->yuvTable = av_malloc(1024);
  676. y_table = c->yuvTable;
  677. yb = -(384<<16) - oy;
  678. for (i = 0; i < 1024; i++) {
  679. y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
  680. yb += cy;
  681. }
  682. fill_table(c->table_rV, 1, crv, y_table + yoffs);
  683. fill_table(c->table_gU, 1, cgu, y_table + yoffs);
  684. fill_table(c->table_bU, 1, cbu, y_table + yoffs);
  685. fill_gv_table(c->table_gV, 1, cgv);
  686. break;
  687. case 32:
  688. base = (c->dstFormat == PIX_FMT_RGB32_1 || c->dstFormat == PIX_FMT_BGR32_1) ? 8 : 0;
  689. rbase = base + (isRgb ? 16 : 0);
  690. gbase = base + 8;
  691. bbase = base + (isRgb ? 0 : 16);
  692. needAlpha = CONFIG_SWSCALE_ALPHA && isALPHA(c->srcFormat);
  693. if (!needAlpha)
  694. abase = (base + 24) & 31;
  695. c->yuvTable = av_malloc(1024*3*4);
  696. y_table32 = c->yuvTable;
  697. yb = -(384<<16) - oy;
  698. for (i = 0; i < 1024; i++) {
  699. uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
  700. y_table32[i ] = (yval << rbase) + (needAlpha ? 0 : (255 << abase));
  701. y_table32[i+1024] = yval << gbase;
  702. y_table32[i+2048] = yval << bbase;
  703. yb += cy;
  704. }
  705. fill_table(c->table_rV, 4, crv, y_table32 + yoffs);
  706. fill_table(c->table_gU, 4, cgu, y_table32 + yoffs + 1024);
  707. fill_table(c->table_bU, 4, cbu, y_table32 + yoffs + 2048);
  708. fill_gv_table(c->table_gV, 4, cgv);
  709. break;
  710. default:
  711. c->yuvTable = NULL;
  712. av_log(c, AV_LOG_ERROR, "%ibpp not supported by yuv2rgb\n", bpp);
  713. return -1;
  714. }
  715. return 0;
  716. }