swscale.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436
  1. /*
  2. * Copyright (C) 2003-2011 Michael Niedermayer <michaelni@gmx.at>
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #include <stdio.h>
  21. #include <stdlib.h>
  22. #include <string.h>
  23. #include <inttypes.h>
  24. #include <stdarg.h>
  25. #undef HAVE_AV_CONFIG_H
  26. #include "libavutil/cpu.h"
  27. #include "libavutil/imgutils.h"
  28. #include "libavutil/mem.h"
  29. #include "libavutil/avutil.h"
  30. #include "libavutil/crc.h"
  31. #include "libavutil/pixdesc.h"
  32. #include "libavutil/lfg.h"
  33. #include "libswscale/swscale.h"
  34. /* HACK Duplicated from swscale_internal.h.
  35. * Should be removed when a cleaner pixel format system exists. */
  36. #define isGray(x) \
  37. ((x) == AV_PIX_FMT_GRAY8 || \
  38. (x) == AV_PIX_FMT_YA8 || \
  39. (x) == AV_PIX_FMT_GRAY16BE || \
  40. (x) == AV_PIX_FMT_GRAY16LE || \
  41. (x) == AV_PIX_FMT_YA16BE || \
  42. (x) == AV_PIX_FMT_YA16LE)
  43. #define hasChroma(x) \
  44. (!(isGray(x) || \
  45. (x) == AV_PIX_FMT_MONOBLACK || \
  46. (x) == AV_PIX_FMT_MONOWHITE))
  47. #define isALPHA(x) \
  48. ((x) == AV_PIX_FMT_BGR32 || \
  49. (x) == AV_PIX_FMT_BGR32_1 || \
  50. (x) == AV_PIX_FMT_RGB32 || \
  51. (x) == AV_PIX_FMT_RGB32_1 || \
  52. (x) == AV_PIX_FMT_YUVA420P)
  53. static uint64_t getSSD(const uint8_t *src1, const uint8_t *src2, int stride1,
  54. int stride2, int w, int h)
  55. {
  56. int x, y;
  57. uint64_t ssd = 0;
  58. for (y = 0; y < h; y++) {
  59. for (x = 0; x < w; x++) {
  60. int d = src1[x + y * stride1] - src2[x + y * stride2];
  61. ssd += d * d;
  62. }
  63. }
  64. return ssd;
  65. }
  66. struct Results {
  67. uint64_t ssdY;
  68. uint64_t ssdU;
  69. uint64_t ssdV;
  70. uint64_t ssdA;
  71. uint32_t crc;
  72. };
  73. // test by ref -> src -> dst -> out & compare out against ref
  74. // ref & out are YV12
  75. static int doTest(uint8_t *ref[4], int refStride[4], int w, int h,
  76. enum AVPixelFormat srcFormat, enum AVPixelFormat dstFormat,
  77. int srcW, int srcH, int dstW, int dstH, int flags,
  78. struct Results *r)
  79. {
  80. const AVPixFmtDescriptor *desc_yuva420p = av_pix_fmt_desc_get(AV_PIX_FMT_YUVA420P);
  81. const AVPixFmtDescriptor *desc_src = av_pix_fmt_desc_get(srcFormat);
  82. const AVPixFmtDescriptor *desc_dst = av_pix_fmt_desc_get(dstFormat);
  83. static enum AVPixelFormat cur_srcFormat;
  84. static int cur_srcW, cur_srcH;
  85. static uint8_t *src[4];
  86. static int srcStride[4];
  87. uint8_t *dst[4] = { 0 };
  88. uint8_t *out[4] = { 0 };
  89. int dstStride[4] = {0};
  90. int i;
  91. uint64_t ssdY, ssdU = 0, ssdV = 0, ssdA = 0;
  92. struct SwsContext *dstContext = NULL, *outContext = NULL;
  93. uint32_t crc = 0;
  94. int res = 0;
  95. if (cur_srcFormat != srcFormat || cur_srcW != srcW || cur_srcH != srcH) {
  96. struct SwsContext *srcContext = NULL;
  97. int p;
  98. for (p = 0; p < 4; p++)
  99. av_freep(&src[p]);
  100. res = av_image_fill_linesizes(srcStride, srcFormat, srcW);
  101. if (res < 0) {
  102. fprintf(stderr, "av_image_fill_linesizes failed\n");
  103. goto end;
  104. }
  105. for (p = 0; p < 4; p++) {
  106. srcStride[p] = FFALIGN(srcStride[p], 16);
  107. if (srcStride[p])
  108. src[p] = av_mallocz(srcStride[p] * srcH + 16);
  109. if (srcStride[p] && !src[p]) {
  110. perror("Malloc");
  111. res = -1;
  112. goto end;
  113. }
  114. }
  115. srcContext = sws_getContext(w, h, AV_PIX_FMT_YUVA420P, srcW, srcH,
  116. srcFormat, SWS_BILINEAR, NULL, NULL, NULL);
  117. if (!srcContext) {
  118. fprintf(stderr, "Failed to get %s ---> %s\n",
  119. desc_yuva420p->name,
  120. desc_src->name);
  121. res = -1;
  122. goto end;
  123. }
  124. sws_scale(srcContext, (const uint8_t * const*)ref, refStride, 0, h, src, srcStride);
  125. sws_freeContext(srcContext);
  126. cur_srcFormat = srcFormat;
  127. cur_srcW = srcW;
  128. cur_srcH = srcH;
  129. }
  130. res = av_image_fill_linesizes(dstStride, dstFormat, dstW);
  131. if (res < 0) {
  132. fprintf(stderr, "av_image_fill_linesizes failed\n");
  133. goto end;
  134. }
  135. for (i = 0; i < 4; i++) {
  136. /* Image buffers passed into libswscale can be allocated any way you
  137. * prefer, as long as they're aligned enough for the architecture, and
  138. * they're freed appropriately (such as using av_free for buffers
  139. * allocated with av_malloc). */
  140. /* An extra 16 bytes is being allocated because some scalers may write
  141. * out of bounds. */
  142. dstStride[i] = FFALIGN(dstStride[i], 16);
  143. if (dstStride[i])
  144. dst[i] = av_mallocz(dstStride[i] * dstH + 16);
  145. if (dstStride[i] && !dst[i]) {
  146. perror("Malloc");
  147. res = -1;
  148. goto end;
  149. }
  150. }
  151. dstContext = sws_getContext(srcW, srcH, srcFormat, dstW, dstH, dstFormat,
  152. flags, NULL, NULL, NULL);
  153. if (!dstContext) {
  154. fprintf(stderr, "Failed to get %s ---> %s\n",
  155. desc_src->name, desc_dst->name);
  156. res = -1;
  157. goto end;
  158. }
  159. printf(" %s %dx%d -> %s %3dx%3d flags=%2d",
  160. desc_src->name, srcW, srcH,
  161. desc_dst->name, dstW, dstH,
  162. flags);
  163. fflush(stdout);
  164. sws_scale(dstContext, (const uint8_t * const*)src, srcStride, 0, srcH, dst, dstStride);
  165. for (i = 0; i < 4 && dstStride[i]; i++)
  166. crc = av_crc(av_crc_get_table(AV_CRC_32_IEEE), crc, dst[i],
  167. dstStride[i] * dstH);
  168. if (r && crc == r->crc) {
  169. ssdY = r->ssdY;
  170. ssdU = r->ssdU;
  171. ssdV = r->ssdV;
  172. ssdA = r->ssdA;
  173. } else {
  174. for (i = 0; i < 4; i++) {
  175. refStride[i] = FFALIGN(refStride[i], 16);
  176. if (refStride[i])
  177. out[i] = av_mallocz(refStride[i] * h);
  178. if (refStride[i] && !out[i]) {
  179. perror("Malloc");
  180. res = -1;
  181. goto end;
  182. }
  183. }
  184. outContext = sws_getContext(dstW, dstH, dstFormat, w, h,
  185. AV_PIX_FMT_YUVA420P, SWS_BILINEAR,
  186. NULL, NULL, NULL);
  187. if (!outContext) {
  188. fprintf(stderr, "Failed to get %s ---> %s\n",
  189. desc_dst->name,
  190. desc_yuva420p->name);
  191. res = -1;
  192. goto end;
  193. }
  194. sws_scale(outContext, (const uint8_t * const*)dst, dstStride, 0, dstH, out, refStride);
  195. ssdY = getSSD(ref[0], out[0], refStride[0], refStride[0], w, h);
  196. if (hasChroma(srcFormat) && hasChroma(dstFormat)) {
  197. //FIXME check that output is really gray
  198. ssdU = getSSD(ref[1], out[1], refStride[1], refStride[1],
  199. (w + 1) >> 1, (h + 1) >> 1);
  200. ssdV = getSSD(ref[2], out[2], refStride[2], refStride[2],
  201. (w + 1) >> 1, (h + 1) >> 1);
  202. }
  203. if (isALPHA(srcFormat) && isALPHA(dstFormat))
  204. ssdA = getSSD(ref[3], out[3], refStride[3], refStride[3], w, h);
  205. ssdY /= w * h;
  206. ssdU /= w * h / 4;
  207. ssdV /= w * h / 4;
  208. ssdA /= w * h;
  209. sws_freeContext(outContext);
  210. for (i = 0; i < 4; i++)
  211. if (refStride[i])
  212. av_free(out[i]);
  213. }
  214. printf(" CRC=%08x SSD=%5"PRId64 ",%5"PRId64 ",%5"PRId64 ",%5"PRId64 "\n",
  215. crc, ssdY, ssdU, ssdV, ssdA);
  216. end:
  217. sws_freeContext(dstContext);
  218. for (i = 0; i < 4; i++)
  219. if (dstStride[i])
  220. av_free(dst[i]);
  221. return res;
  222. }
  223. static void selfTest(uint8_t *ref[4], int refStride[4], int w, int h,
  224. enum AVPixelFormat srcFormat_in,
  225. enum AVPixelFormat dstFormat_in)
  226. {
  227. const int flags[] = { SWS_FAST_BILINEAR, SWS_BILINEAR, SWS_BICUBIC,
  228. SWS_X, SWS_POINT, SWS_AREA, 0 };
  229. const int srcW = w;
  230. const int srcH = h;
  231. const int dstW[] = { srcW - srcW / 3, srcW, srcW + srcW / 3, 0 };
  232. const int dstH[] = { srcH - srcH / 3, srcH, srcH + srcH / 3, 0 };
  233. enum AVPixelFormat srcFormat, dstFormat;
  234. const AVPixFmtDescriptor *desc_src, *desc_dst;
  235. for (srcFormat = srcFormat_in != AV_PIX_FMT_NONE ? srcFormat_in : 0;
  236. srcFormat < AV_PIX_FMT_NB; srcFormat++) {
  237. if (!sws_isSupportedInput(srcFormat) ||
  238. !sws_isSupportedOutput(srcFormat))
  239. continue;
  240. desc_src = av_pix_fmt_desc_get(srcFormat);
  241. for (dstFormat = dstFormat_in != AV_PIX_FMT_NONE ? dstFormat_in : 0;
  242. dstFormat < AV_PIX_FMT_NB; dstFormat++) {
  243. int i, j, k;
  244. int res = 0;
  245. if (!sws_isSupportedInput(dstFormat) ||
  246. !sws_isSupportedOutput(dstFormat))
  247. continue;
  248. desc_dst = av_pix_fmt_desc_get(dstFormat);
  249. printf("%s -> %s\n", desc_src->name, desc_dst->name);
  250. fflush(stdout);
  251. for (k = 0; flags[k] && !res; k++)
  252. for (i = 0; dstW[i] && !res; i++)
  253. for (j = 0; dstH[j] && !res; j++)
  254. res = doTest(ref, refStride, w, h,
  255. srcFormat, dstFormat,
  256. srcW, srcH, dstW[i], dstH[j], flags[k],
  257. NULL);
  258. if (dstFormat_in != AV_PIX_FMT_NONE)
  259. break;
  260. }
  261. if (srcFormat_in != AV_PIX_FMT_NONE)
  262. break;
  263. }
  264. }
  265. static int fileTest(uint8_t *ref[4], int refStride[4], int w, int h, FILE *fp,
  266. enum AVPixelFormat srcFormat_in,
  267. enum AVPixelFormat dstFormat_in)
  268. {
  269. char buf[256];
  270. while (fgets(buf, sizeof(buf), fp)) {
  271. struct Results r;
  272. enum AVPixelFormat srcFormat;
  273. char srcStr[13];
  274. int srcW = 0, srcH = 0;
  275. enum AVPixelFormat dstFormat;
  276. char dstStr[13];
  277. int dstW = 0, dstH = 0;
  278. int flags;
  279. int ret;
  280. ret = sscanf(buf,
  281. " %12s %dx%d -> %12s %dx%d flags=%d CRC=%x"
  282. " SSD=%"SCNd64 ", %"SCNd64 ", %"SCNd64 ", %"SCNd64 "\n",
  283. srcStr, &srcW, &srcH, dstStr, &dstW, &dstH,
  284. &flags, &r.crc, &r.ssdY, &r.ssdU, &r.ssdV, &r.ssdA);
  285. if (ret != 12) {
  286. srcStr[0] = dstStr[0] = 0;
  287. ret = sscanf(buf, "%12s -> %12s\n", srcStr, dstStr);
  288. }
  289. srcFormat = av_get_pix_fmt(srcStr);
  290. dstFormat = av_get_pix_fmt(dstStr);
  291. if (srcFormat == AV_PIX_FMT_NONE || dstFormat == AV_PIX_FMT_NONE ||
  292. srcW > 8192U || srcH > 8192U || dstW > 8192U || dstH > 8192U) {
  293. fprintf(stderr, "malformed input file\n");
  294. return -1;
  295. }
  296. if ((srcFormat_in != AV_PIX_FMT_NONE && srcFormat_in != srcFormat) ||
  297. (dstFormat_in != AV_PIX_FMT_NONE && dstFormat_in != dstFormat))
  298. continue;
  299. if (ret != 12) {
  300. printf("%s", buf);
  301. continue;
  302. }
  303. doTest(ref, refStride, w, h,
  304. srcFormat, dstFormat,
  305. srcW, srcH, dstW, dstH, flags,
  306. &r);
  307. }
  308. return 0;
  309. }
  310. #define W 96
  311. #define H 96
  312. int main(int argc, char **argv)
  313. {
  314. enum AVPixelFormat srcFormat = AV_PIX_FMT_NONE;
  315. enum AVPixelFormat dstFormat = AV_PIX_FMT_NONE;
  316. uint8_t *rgb_data = av_malloc(W * H * 4);
  317. const uint8_t * const rgb_src[4] = { rgb_data, NULL, NULL, NULL };
  318. int rgb_stride[4] = { 4 * W, 0, 0, 0 };
  319. uint8_t *data = av_malloc(4 * W * H);
  320. uint8_t *src[4] = { data, data + W * H, data + W * H * 2, data + W * H * 3 };
  321. int stride[4] = { W, W, W, W };
  322. int x, y;
  323. struct SwsContext *sws;
  324. AVLFG rand;
  325. int res = -1;
  326. int i;
  327. FILE *fp = NULL;
  328. if (!rgb_data || !data)
  329. return -1;
  330. for (i = 1; i < argc; i += 2) {
  331. if (argv[i][0] != '-' || i + 1 == argc)
  332. goto bad_option;
  333. if (!strcmp(argv[i], "-ref")) {
  334. fp = fopen(argv[i + 1], "r");
  335. if (!fp) {
  336. fprintf(stderr, "could not open '%s'\n", argv[i + 1]);
  337. goto error;
  338. }
  339. } else if (!strcmp(argv[i], "-cpuflags")) {
  340. unsigned flags = av_get_cpu_flags();
  341. int ret = av_parse_cpu_caps(&flags, argv[i + 1]);
  342. if (ret < 0) {
  343. fprintf(stderr, "invalid cpu flags %s\n", argv[i + 1]);
  344. return ret;
  345. }
  346. av_force_cpu_flags(flags);
  347. } else if (!strcmp(argv[i], "-src")) {
  348. srcFormat = av_get_pix_fmt(argv[i + 1]);
  349. if (srcFormat == AV_PIX_FMT_NONE) {
  350. fprintf(stderr, "invalid pixel format %s\n", argv[i + 1]);
  351. return -1;
  352. }
  353. } else if (!strcmp(argv[i], "-dst")) {
  354. dstFormat = av_get_pix_fmt(argv[i + 1]);
  355. if (dstFormat == AV_PIX_FMT_NONE) {
  356. fprintf(stderr, "invalid pixel format %s\n", argv[i + 1]);
  357. return -1;
  358. }
  359. } else {
  360. bad_option:
  361. fprintf(stderr, "bad option or argument missing (%s)\n", argv[i]);
  362. goto error;
  363. }
  364. }
  365. sws = sws_getContext(W / 12, H / 12, AV_PIX_FMT_RGB32, W, H,
  366. AV_PIX_FMT_YUVA420P, SWS_BILINEAR, NULL, NULL, NULL);
  367. av_lfg_init(&rand, 1);
  368. for (y = 0; y < H; y++)
  369. for (x = 0; x < W * 4; x++)
  370. rgb_data[ x + y * 4 * W] = av_lfg_get(&rand);
  371. sws_scale(sws, rgb_src, rgb_stride, 0, H / 12, src, stride);
  372. sws_freeContext(sws);
  373. av_free(rgb_data);
  374. if(fp) {
  375. res = fileTest(src, stride, W, H, fp, srcFormat, dstFormat);
  376. fclose(fp);
  377. } else {
  378. selfTest(src, stride, W, H, srcFormat, dstFormat);
  379. res = 0;
  380. }
  381. error:
  382. av_free(data);
  383. return res;
  384. }