yuv.h 7.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210
  1. // Copyright 2010 Google Inc. All Rights Reserved.
  2. //
  3. // Use of this source code is governed by a BSD-style license
  4. // that can be found in the COPYING file in the root of the source
  5. // tree. An additional intellectual property rights grant can be found
  6. // in the file PATENTS. All contributing project authors may
  7. // be found in the AUTHORS file in the root of the source tree.
  8. // -----------------------------------------------------------------------------
  9. //
  10. // inline YUV<->RGB conversion function
  11. //
  12. // The exact naming is Y'CbCr, following the ITU-R BT.601 standard.
  13. // More information at: https://en.wikipedia.org/wiki/YCbCr
  14. // Y = 0.2569 * R + 0.5044 * G + 0.0979 * B + 16
  15. // U = -0.1483 * R - 0.2911 * G + 0.4394 * B + 128
  16. // V = 0.4394 * R - 0.3679 * G - 0.0715 * B + 128
  17. // We use 16bit fixed point operations for RGB->YUV conversion (YUV_FIX).
  18. //
  19. // For the Y'CbCr to RGB conversion, the BT.601 specification reads:
  20. // R = 1.164 * (Y-16) + 1.596 * (V-128)
  21. // G = 1.164 * (Y-16) - 0.813 * (V-128) - 0.391 * (U-128)
  22. // B = 1.164 * (Y-16) + 2.018 * (U-128)
  23. // where Y is in the [16,235] range, and U/V in the [16,240] range.
  24. //
  25. // The fixed-point implementation used here is:
  26. // R = (19077 . y + 26149 . v - 14234) >> 6
  27. // G = (19077 . y - 6419 . u - 13320 . v + 8708) >> 6
  28. // B = (19077 . y + 33050 . u - 17685) >> 6
  29. // where the '.' operator is the mulhi_epu16 variant:
  30. // a . b = ((a << 8) * b) >> 16
  31. // that preserves 8 bits of fractional precision before final descaling.
  32. // Author: Skal (pascal.massimino@gmail.com)
  33. #ifndef WEBP_DSP_YUV_H_
  34. #define WEBP_DSP_YUV_H_
  35. #include "./dsp.h"
  36. #include "../dec/vp8_dec.h"
  37. //------------------------------------------------------------------------------
  38. // YUV -> RGB conversion
  39. #ifdef __cplusplus
  40. extern "C" {
  41. #endif
  42. enum {
  43. YUV_FIX = 16, // fixed-point precision for RGB->YUV
  44. YUV_HALF = 1 << (YUV_FIX - 1),
  45. YUV_FIX2 = 6, // fixed-point precision for YUV->RGB
  46. YUV_MASK2 = (256 << YUV_FIX2) - 1
  47. };
  48. //------------------------------------------------------------------------------
  49. // slower on x86 by ~7-8%, but bit-exact with the SSE2/NEON version
  50. static WEBP_INLINE int MultHi(int v, int coeff) { // _mm_mulhi_epu16 emulation
  51. return (v * coeff) >> 8;
  52. }
  53. static WEBP_INLINE int VP8Clip8(int v) {
  54. return ((v & ~YUV_MASK2) == 0) ? (v >> YUV_FIX2) : (v < 0) ? 0 : 255;
  55. }
  56. static WEBP_INLINE int VP8YUVToR(int y, int v) {
  57. return VP8Clip8(MultHi(y, 19077) + MultHi(v, 26149) - 14234);
  58. }
  59. static WEBP_INLINE int VP8YUVToG(int y, int u, int v) {
  60. return VP8Clip8(MultHi(y, 19077) - MultHi(u, 6419) - MultHi(v, 13320) + 8708);
  61. }
  62. static WEBP_INLINE int VP8YUVToB(int y, int u) {
  63. return VP8Clip8(MultHi(y, 19077) + MultHi(u, 33050) - 17685);
  64. }
  65. static WEBP_INLINE void VP8YuvToRgb(int y, int u, int v,
  66. uint8_t* const rgb) {
  67. rgb[0] = VP8YUVToR(y, v);
  68. rgb[1] = VP8YUVToG(y, u, v);
  69. rgb[2] = VP8YUVToB(y, u);
  70. }
  71. static WEBP_INLINE void VP8YuvToBgr(int y, int u, int v,
  72. uint8_t* const bgr) {
  73. bgr[0] = VP8YUVToB(y, u);
  74. bgr[1] = VP8YUVToG(y, u, v);
  75. bgr[2] = VP8YUVToR(y, v);
  76. }
  77. static WEBP_INLINE void VP8YuvToRgb565(int y, int u, int v,
  78. uint8_t* const rgb) {
  79. const int r = VP8YUVToR(y, v); // 5 usable bits
  80. const int g = VP8YUVToG(y, u, v); // 6 usable bits
  81. const int b = VP8YUVToB(y, u); // 5 usable bits
  82. const int rg = (r & 0xf8) | (g >> 5);
  83. const int gb = ((g << 3) & 0xe0) | (b >> 3);
  84. #if (WEBP_SWAP_16BIT_CSP == 1)
  85. rgb[0] = gb;
  86. rgb[1] = rg;
  87. #else
  88. rgb[0] = rg;
  89. rgb[1] = gb;
  90. #endif
  91. }
  92. static WEBP_INLINE void VP8YuvToRgba4444(int y, int u, int v,
  93. uint8_t* const argb) {
  94. const int r = VP8YUVToR(y, v); // 4 usable bits
  95. const int g = VP8YUVToG(y, u, v); // 4 usable bits
  96. const int b = VP8YUVToB(y, u); // 4 usable bits
  97. const int rg = (r & 0xf0) | (g >> 4);
  98. const int ba = (b & 0xf0) | 0x0f; // overwrite the lower 4 bits
  99. #if (WEBP_SWAP_16BIT_CSP == 1)
  100. argb[0] = ba;
  101. argb[1] = rg;
  102. #else
  103. argb[0] = rg;
  104. argb[1] = ba;
  105. #endif
  106. }
  107. //-----------------------------------------------------------------------------
  108. // Alpha handling variants
  109. static WEBP_INLINE void VP8YuvToArgb(uint8_t y, uint8_t u, uint8_t v,
  110. uint8_t* const argb) {
  111. argb[0] = 0xff;
  112. VP8YuvToRgb(y, u, v, argb + 1);
  113. }
  114. static WEBP_INLINE void VP8YuvToBgra(uint8_t y, uint8_t u, uint8_t v,
  115. uint8_t* const bgra) {
  116. VP8YuvToBgr(y, u, v, bgra);
  117. bgra[3] = 0xff;
  118. }
  119. static WEBP_INLINE void VP8YuvToRgba(uint8_t y, uint8_t u, uint8_t v,
  120. uint8_t* const rgba) {
  121. VP8YuvToRgb(y, u, v, rgba);
  122. rgba[3] = 0xff;
  123. }
  124. //-----------------------------------------------------------------------------
  125. // SSE2 extra functions (mostly for upsampling_sse2.c)
  126. #if defined(WEBP_USE_SSE2)
  127. // Process 32 pixels and store the result (16b, 24b or 32b per pixel) in *dst.
  128. void VP8YuvToRgba32_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  129. uint8_t* dst);
  130. void VP8YuvToRgb32_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  131. uint8_t* dst);
  132. void VP8YuvToBgra32_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  133. uint8_t* dst);
  134. void VP8YuvToBgr32_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  135. uint8_t* dst);
  136. void VP8YuvToArgb32_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  137. uint8_t* dst);
  138. void VP8YuvToRgba444432_SSE2(const uint8_t* y, const uint8_t* u,
  139. const uint8_t* v, uint8_t* dst);
  140. void VP8YuvToRgb56532_SSE2(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  141. uint8_t* dst);
  142. #endif // WEBP_USE_SSE2
  143. //-----------------------------------------------------------------------------
  144. // SSE41 extra functions (mostly for upsampling_sse41.c)
  145. #if defined(WEBP_USE_SSE41)
  146. // Process 32 pixels and store the result (16b, 24b or 32b per pixel) in *dst.
  147. void VP8YuvToRgb32_SSE41(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  148. uint8_t* dst);
  149. void VP8YuvToBgr32_SSE41(const uint8_t* y, const uint8_t* u, const uint8_t* v,
  150. uint8_t* dst);
  151. #endif // WEBP_USE_SSE41
  152. //------------------------------------------------------------------------------
  153. // RGB -> YUV conversion
  154. // Stub functions that can be called with various rounding values:
  155. static WEBP_INLINE int VP8ClipUV(int uv, int rounding) {
  156. uv = (uv + rounding + (128 << (YUV_FIX + 2))) >> (YUV_FIX + 2);
  157. return ((uv & ~0xff) == 0) ? uv : (uv < 0) ? 0 : 255;
  158. }
  159. static WEBP_INLINE int VP8RGBToY(int r, int g, int b, int rounding) {
  160. const int luma = 16839 * r + 33059 * g + 6420 * b;
  161. return (luma + rounding + (16 << YUV_FIX)) >> YUV_FIX; // no need to clip
  162. }
  163. static WEBP_INLINE int VP8RGBToU(int r, int g, int b, int rounding) {
  164. const int u = -9719 * r - 19081 * g + 28800 * b;
  165. return VP8ClipUV(u, rounding);
  166. }
  167. static WEBP_INLINE int VP8RGBToV(int r, int g, int b, int rounding) {
  168. const int v = +28800 * r - 24116 * g - 4684 * b;
  169. return VP8ClipUV(v, rounding);
  170. }
  171. #ifdef __cplusplus
  172. } // extern "C"
  173. #endif
  174. #endif // WEBP_DSP_YUV_H_