h264pred.c 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260
  /*
   * Copyright (c) 2015 Henrik Gramner
   *
   * This file is part of FFmpeg.
   *
   * FFmpeg is free software; you can redistribute it and/or modify
   * it under the terms of the GNU General Public License as published by
   * the Free Software Foundation; either version 2 of the License, or
   * (at your option) any later version.
   *
   * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
   * GNU General Public License for more details.
   *
   * You should have received a copy of the GNU General Public License along
   * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
   * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
   */
  20. #include <string.h>
  21. #include "checkasm.h"
  22. #include "libavcodec/avcodec.h"
  23. #include "libavcodec/h264pred.h"
  24. #include "libavutil/common.h"
  25. #include "libavutil/internal.h"
  26. #include "libavutil/intreadwrite.h"
  27. static const int codec_ids[4] = { AV_CODEC_ID_H264, AV_CODEC_ID_VP8, AV_CODEC_ID_RV40, AV_CODEC_ID_SVQ3 };
  28. static const char * const pred4x4_modes[4][15] = {
  29. { /* H264 */
  30. [VERT_PRED ] = "vertical",
  31. [HOR_PRED ] = "horizontal",
  32. [DC_PRED ] = "dc",
  33. [DIAG_DOWN_LEFT_PRED ] = "down_left",
  34. [DIAG_DOWN_RIGHT_PRED] = "down_right",
  35. [VERT_RIGHT_PRED ] = "vertical_right",
  36. [HOR_DOWN_PRED ] = "horizontal_right",
  37. [VERT_LEFT_PRED ] = "vertical_left",
  38. [HOR_UP_PRED ] = "horizontal_up",
  39. [LEFT_DC_PRED ] = "left_dc",
  40. [TOP_DC_PRED ] = "top_dc",
  41. [DC_128_PRED ] = "dc_128",
  42. },
  43. { /* VP8 */
  44. [VERT_PRED ] = "vertical_vp8",
  45. [HOR_PRED ] = "horizontal_vp8",
  46. [VERT_LEFT_PRED] = "vertical_left_vp8",
  47. [TM_VP8_PRED ] = "tm_vp8",
  48. [DC_127_PRED ] = "dc_127_vp8",
  49. [DC_129_PRED ] = "dc_129_vp8",
  50. },
  51. { /* RV40 */
  52. [DIAG_DOWN_LEFT_PRED ] = "down_left_rv40",
  53. [VERT_LEFT_PRED ] = "vertical_left_rv40",
  54. [HOR_UP_PRED ] = "horizontal_up_rv40",
  55. [DIAG_DOWN_LEFT_PRED_RV40_NODOWN] = "down_left_nodown_rv40",
  56. [HOR_UP_PRED_RV40_NODOWN ] = "horizontal_up_nodown_rv40",
  57. [VERT_LEFT_PRED_RV40_NODOWN ] = "vertical_left_nodown_rv40",
  58. },
  59. { /* SVQ3 */
  60. [DIAG_DOWN_LEFT_PRED] = "down_left_svq3",
  61. },
  62. };
  63. static const char * const pred8x8_modes[4][11] = {
  64. { /* H264 */
  65. [DC_PRED8x8 ] = "dc",
  66. [HOR_PRED8x8 ] = "horizontal",
  67. [VERT_PRED8x8 ] = "vertical",
  68. [PLANE_PRED8x8 ] = "plane",
  69. [LEFT_DC_PRED8x8 ] = "left_dc",
  70. [TOP_DC_PRED8x8 ] = "top_dc",
  71. [DC_128_PRED8x8 ] = "dc_128",
  72. [ALZHEIMER_DC_L0T_PRED8x8] = "mad_cow_dc_l0t",
  73. [ALZHEIMER_DC_0LT_PRED8x8] = "mad_cow_dc_0lt",
  74. [ALZHEIMER_DC_L00_PRED8x8] = "mad_cow_dc_l00",
  75. [ALZHEIMER_DC_0L0_PRED8x8] = "mad_cow_dc_0l0",
  76. },
  77. { /* VP8 */
  78. [PLANE_PRED8x8 ] = "tm_vp8",
  79. [DC_127_PRED8x8] = "dc_127_vp8",
  80. [DC_129_PRED8x8] = "dc_129_vp8",
  81. },
  82. { /* RV40 */
  83. [DC_PRED8x8 ] = "dc_rv40",
  84. [LEFT_DC_PRED8x8] = "left_dc_rv40",
  85. [TOP_DC_PRED8x8 ] = "top_dc_rv40",
  86. },
  87. /* nothing for SVQ3 */
  88. };
  89. static const char * const pred16x16_modes[4][9] = {
  90. { /* H264 */
  91. [DC_PRED8x8 ] = "dc",
  92. [HOR_PRED8x8 ] = "horizontal",
  93. [VERT_PRED8x8 ] = "vertical",
  94. [PLANE_PRED8x8 ] = "plane",
  95. [LEFT_DC_PRED8x8] = "left_dc",
  96. [TOP_DC_PRED8x8 ] = "top_dc",
  97. [DC_128_PRED8x8 ] = "dc_128",
  98. },
  99. { /* VP8 */
  100. [PLANE_PRED8x8 ] = "tm_vp8",
  101. [DC_127_PRED8x8] = "dc_127_vp8",
  102. [DC_129_PRED8x8] = "dc_129_vp8",
  103. },
  104. { /* RV40 */
  105. [PLANE_PRED8x8] = "plane_rv40",
  106. },
  107. { /* SVQ3 */
  108. [PLANE_PRED8x8] = "plane_svq3",
  109. },
  110. };
  /*
   * Mask applied to each random 32-bit word written by randomize_buffers(),
   * selected by (bit_depth - 8): all bits for 8-bit samples, and the low 9 or
   * 10 bits of each 16-bit half for the 9- and 10-bit cases.
   */
  static const uint32_t pixel_mask[3] = {
      0xffffffff,
      0x01ff01ff,
      0x03ff03ff,
  };

  /* Bytes per sample; expects an `int bit_depth` to be in scope at the point of use. */
  #define SIZEOF_PIXEL ((bit_depth + 7) / 8)

  /* Size in bytes of each of the two comparison buffers. */
  #define BUF_SIZE (3 * 16 * 17)
  /*
   * Wraps check_func() for one predictor.  Evaluates to 0 without calling
   * check_func() when mode_name is NULL (the mode has no entry in the name
   * table); otherwise it evaluates to whether check_func() returned non-zero.
   *
   * For H.264 the bit depth is appended to the test name
   * ("pred<name>_<mode_name>_<bit_depth>"); the other codecs use
   * "pred<name>_<mode_name>".
   *
   * Relies on `codec` (index into codec_ids[]) and `bit_depth` being in scope
   * at the point of use.  mode_name is parenthesized where it is an operand of
   * `&&` so that an argument containing a lower-precedence operator (such as a
   * conditional expression) is still treated as a single operand.
   */
  #define check_pred_func(func, name, mode_name)                                   \
      ((mode_name) && ((codec_ids[codec] == AV_CODEC_ID_H264) ?                    \
                       check_func(func, "pred%s_%s_%d", name, mode_name, bit_depth) : \
                       check_func(func, "pred%s_%s", name, mode_name)))
  /*
   * Fills buf0 and buf1 with the same masked random data, four bytes at a
   * time, so that both start out identical before the reference and the tested
   * function are run on them.  The mask is chosen from pixel_mask[] by bit depth.
   *
   * Expects `buf0`, `buf1` and `bit_depth` to be in scope at the point of use.
   */
  #define randomize_buffers()                                       \
      do {                                                          \
          const uint32_t sample_mask = pixel_mask[bit_depth - 8];   \
          int pos = 0;                                              \
          while (pos < BUF_SIZE) {                                  \
              const uint32_t word = rnd() & sample_mask;            \
              AV_WN32A(buf0 + pos, word);                           \
              AV_WN32A(buf1 + pos, word);                           \
              pos += 4;                                             \
          }                                                         \
      } while (0)
  /*
   * Start of the block handed to the predictors inside each buffer.  It is
   * offset by 4 * 16 bytes to allow room for the top and left neighbours.
   * Expects `buf0` / `buf1` to be in scope at the point of use.
   */
  #define src0 (buf0 + 4 * 16)
  #define src1 (buf1 + 4 * 16)
  130. static void check_pred4x4(H264PredContext *h, uint8_t *buf0, uint8_t *buf1,
  131. int codec, int chroma_format, int bit_depth)
  132. {
  133. if (chroma_format == 1) {
  134. uint8_t *topright = buf0 + 2*16;
  135. int pred_mode;
  136. declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT, void, uint8_t *src, const uint8_t *topright, ptrdiff_t stride);
  137. for (pred_mode = 0; pred_mode < 15; pred_mode++) {
  138. if (check_pred_func(h->pred4x4[pred_mode], "4x4", pred4x4_modes[codec][pred_mode])) {
  139. randomize_buffers();
  140. call_ref(src0, topright, 12*SIZEOF_PIXEL);
  141. call_new(src1, topright, 12*SIZEOF_PIXEL);
  142. if (memcmp(buf0, buf1, BUF_SIZE))
  143. fail();
  144. bench_new(src1, topright, 12*SIZEOF_PIXEL);
  145. }
  146. }
  147. }
  148. }
  149. static void check_pred8x8(H264PredContext *h, uint8_t *buf0, uint8_t *buf1,
  150. int codec, int chroma_format, int bit_depth)
  151. {
  152. int pred_mode;
  153. declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT, void, uint8_t *src, ptrdiff_t stride);
  154. for (pred_mode = 0; pred_mode < 11; pred_mode++) {
  155. if (check_pred_func(h->pred8x8[pred_mode], (chroma_format == 2) ? "8x16" : "8x8",
  156. pred8x8_modes[codec][pred_mode])) {
  157. randomize_buffers();
  158. call_ref(src0, 24*SIZEOF_PIXEL);
  159. call_new(src1, 24*SIZEOF_PIXEL);
  160. if (memcmp(buf0, buf1, BUF_SIZE))
  161. fail();
  162. bench_new(src1, 24*SIZEOF_PIXEL);
  163. }
  164. }
  165. }
  166. static void check_pred16x16(H264PredContext *h, uint8_t *buf0, uint8_t *buf1,
  167. int codec, int chroma_format, int bit_depth)
  168. {
  169. if (chroma_format == 1) {
  170. int pred_mode;
  171. declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT, void, uint8_t *src, ptrdiff_t stride);
  172. for (pred_mode = 0; pred_mode < 9; pred_mode++) {
  173. if (check_pred_func(h->pred16x16[pred_mode], "16x16", pred16x16_modes[codec][pred_mode])) {
  174. randomize_buffers();
  175. call_ref(src0, 48);
  176. call_new(src1, 48);
  177. if (memcmp(buf0, buf1, BUF_SIZE))
  178. fail();
  179. bench_new(src1, 48);
  180. }
  181. }
  182. }
  183. }
  184. static void check_pred8x8l(H264PredContext *h, uint8_t *buf0, uint8_t *buf1,
  185. int codec, int chroma_format, int bit_depth)
  186. {
  187. if (chroma_format == 1 && codec_ids[codec] == AV_CODEC_ID_H264) {
  188. int pred_mode;
  189. declare_func_emms(AV_CPU_FLAG_MMXEXT, void, uint8_t *src, int topleft, int topright, ptrdiff_t stride);
  190. for (pred_mode = 0; pred_mode < 12; pred_mode++) {
  191. if (check_pred_func(h->pred8x8l[pred_mode], "8x8l", pred4x4_modes[codec][pred_mode])) {
  192. int neighbors;
  193. for (neighbors = 0; neighbors <= 0xc000; neighbors += 0x4000) {
  194. int has_topleft = neighbors & 0x8000;
  195. int has_topright = neighbors & 0x4000;
  196. if ((pred_mode == DIAG_DOWN_RIGHT_PRED || pred_mode == VERT_RIGHT_PRED) && !has_topleft)
  197. continue; /* Those aren't allowed according to the spec */
  198. randomize_buffers();
  199. call_ref(src0, has_topleft, has_topright, 24*SIZEOF_PIXEL);
  200. call_new(src1, has_topleft, has_topright, 24*SIZEOF_PIXEL);
  201. if (memcmp(buf0, buf1, BUF_SIZE))
  202. fail();
  203. bench_new(src1, has_topleft, has_topright, 24*SIZEOF_PIXEL);
  204. }
  205. }
  206. }
  207. }
  208. }
  /* TODO: Add tests for H.264 lossless H/V prediction */
  210. void checkasm_check_h264pred(void)
  211. {
  212. static const struct {
  213. void (*func)(H264PredContext*, uint8_t*, uint8_t*, int, int, int);
  214. const char *name;
  215. } tests[] = {
  216. { check_pred4x4, "pred4x4" },
  217. { check_pred8x8, "pred8x8" },
  218. { check_pred16x16, "pred16x16" },
  219. { check_pred8x8l, "pred8x8l" },
  220. };
  221. LOCAL_ALIGNED_16(uint8_t, buf0, [BUF_SIZE]);
  222. LOCAL_ALIGNED_16(uint8_t, buf1, [BUF_SIZE]);
  223. H264PredContext h;
  224. int test, codec, chroma_format, bit_depth;
  225. for (test = 0; test < FF_ARRAY_ELEMS(tests); test++) {
  226. for (codec = 0; codec < 4; codec++) {
  227. int codec_id = codec_ids[codec];
  228. for (bit_depth = 8; bit_depth <= (codec_id == AV_CODEC_ID_H264 ? 10 : 8); bit_depth++)
  229. for (chroma_format = 1; chroma_format <= (codec_id == AV_CODEC_ID_H264 ? 2 : 1); chroma_format++) {
  230. ff_h264_pred_init(&h, codec_id, bit_depth, chroma_format);
  231. tests[test].func(&h, buf0, buf1, codec, chroma_format, bit_depth);
  232. }
  233. }
  234. report("%s", tests[test].name);
  235. }
  236. }