/* * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with FFmpeg; if not, write to the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */ #include <string.h> #include "checkasm.h" #include "libavfilter/bwdifdsp.h" #include "libavutil/mem_internal.h" #define WIDTH 256 #define randomize_buffers(buf0, buf1, mask, count) \ for (size_t i = 0; i < count; i++) \ buf0[i] = buf1[i] = rnd() & mask #define randomize_overflow_check(buf0, buf1, mask, count) \ for (size_t i = 0; i < count; i++) \ buf0[i] = buf1[i] = (rnd() & 1) != 0 ? mask : 0; #define BODY(type, depth) \ do { \ type prev0[9*WIDTH], prev1[9*WIDTH]; \ type next0[9*WIDTH], next1[9*WIDTH]; \ type cur0[9*WIDTH], cur1[9*WIDTH]; \ type dst0[WIDTH], dst1[WIDTH]; \ const int stride = WIDTH; \ const int mask = (1<<depth)-1; \ \ declare_func(void, void *dst, const void *prev, const void *cur, const void *next, \ int w, int prefs, int mrefs, int prefs2, int mrefs2, \ int prefs3, int mrefs3, int prefs4, int mrefs4, \ int parity, int clip_max); \ \ randomize_buffers(prev0, prev1, mask, 9*WIDTH); \ randomize_buffers(next0, next1, mask, 9*WIDTH); \ randomize_buffers( cur0, cur1, mask, 9*WIDTH); \ \ call_ref(dst0, prev0 + 4*WIDTH, cur0 + 4*WIDTH, next0 + 4*WIDTH, \ WIDTH, stride, -stride, 2*stride, -2*stride, \ 3*stride, -3*stride, 4*stride, -4*stride, \ 0, mask); \ call_new(dst1, prev1 + 4*WIDTH, cur1 + 4*WIDTH, next1 + 4*WIDTH, \ WIDTH, stride, -stride, 2*stride, -2*stride, \ 3*stride, -3*stride, 4*stride, -4*stride, \ 0, mask); \ \ if (memcmp(dst0, dst1, sizeof dst0) \ || memcmp(prev0, prev1, sizeof prev0) \ || memcmp(next0, next1, sizeof next0) \ || memcmp( cur0, cur1, sizeof cur0)) \ fail(); \ bench_new(dst1, prev1 + 4*WIDTH, cur1 + 4*WIDTH, next1 + 4*WIDTH, \ WIDTH, stride, -stride, 2*stride, -2*stride, \ 3*stride, -3*stride, 4*stride, -4*stride, \ 0, mask); \ } while (0) void checkasm_check_vf_bwdif(void) { BWDIFDSPContext ctx_8, ctx_10; ff_bwdif_init_filter_line(&ctx_8, 8); ff_bwdif_init_filter_line(&ctx_10, 10); if (check_func(ctx_8.filter_line, "bwdif8")) { BODY(uint8_t, 8); report("bwdif8"); } if (check_func(ctx_10.filter_line, "bwdif10")) { BODY(uint16_t, 10); report("bwdif10"); } if (!ctx_8.filter_line3) ctx_8.filter_line3 = ff_bwdif_filter_line3_c; { LOCAL_ALIGNED_16(uint8_t, prev0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, prev1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, next0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, next1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, cur0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, cur1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, dst0, [WIDTH*3]); LOCAL_ALIGNED_16(uint8_t, dst1, [WIDTH*3]); const int stride = WIDTH; const int mask = (1<<8)-1; int parity; for (parity = 0; parity != 2; ++parity) { if (check_func(ctx_8.filter_line3, "bwdif8.line3.rnd.p%d", parity)) { declare_func(void, void * dst1, int d_stride, const void * prev1, const void * cur1, const void * next1, int prefs, int w, int parity, int clip_max); randomize_buffers(prev0, prev1, mask, 11*WIDTH); randomize_buffers(next0, next1, mask, 11*WIDTH); randomize_buffers( cur0, cur1, mask, 11*WIDTH); call_ref(dst0, stride, prev0 + stride * 4, cur0 + stride * 4, next0 + stride * 4, stride, WIDTH, parity, mask); call_new(dst1, stride, prev1 + stride * 4, cur1 + stride * 4, next1 + stride * 4, stride, WIDTH, parity, mask); if (memcmp(dst0, dst1, WIDTH*3) || memcmp(prev0, prev1, WIDTH*11) || memcmp(next0, next1, WIDTH*11) || memcmp( cur0, cur1, WIDTH*11)) fail(); bench_new(dst1, stride, prev1 + stride * 4, cur1 + stride * 4, next1 + stride * 4, stride, WIDTH, parity, mask); } } // Use just 0s and ~0s to try to provoke bad cropping or overflow // Parity makes no difference to this test so just test 0 if (check_func(ctx_8.filter_line3, "bwdif8.line3.overflow")) { declare_func(void, void * dst1, int d_stride, const void * prev1, const void * cur1, const void * next1, int prefs, int w, int parity, int clip_max); randomize_overflow_check(prev0, prev1, mask, 11*WIDTH); randomize_overflow_check(next0, next1, mask, 11*WIDTH); randomize_overflow_check( cur0, cur1, mask, 11*WIDTH); call_ref(dst0, stride, prev0 + stride * 4, cur0 + stride * 4, next0 + stride * 4, stride, WIDTH, 0, mask); call_new(dst1, stride, prev1 + stride * 4, cur1 + stride * 4, next1 + stride * 4, stride, WIDTH, 0, mask); if (memcmp(dst0, dst1, WIDTH*3) || memcmp(prev0, prev1, WIDTH*11) || memcmp(next0, next1, WIDTH*11) || memcmp( cur0, cur1, WIDTH*11)) fail(); // No point to benching } report("bwdif8.line3"); } { LOCAL_ALIGNED_16(uint8_t, prev0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, prev1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, next0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, next1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, cur0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, cur1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, dst0, [WIDTH*3]); LOCAL_ALIGNED_16(uint8_t, dst1, [WIDTH*3]); const int stride = WIDTH; const int mask = (1<<8)-1; int spat; int parity; for (spat = 0; spat != 2; ++spat) { for (parity = 0; parity != 2; ++parity) { if (check_func(ctx_8.filter_edge, "bwdif8.edge.s%d.p%d", spat, parity)) { declare_func(void, void *dst1, const void *prev1, const void *cur1, const void *next1, int w, int prefs, int mrefs, int prefs2, int mrefs2, int parity, int clip_max, int spat); randomize_buffers(prev0, prev1, mask, 11*WIDTH); randomize_buffers(next0, next1, mask, 11*WIDTH); randomize_buffers( cur0, cur1, mask, 11*WIDTH); memset(dst0, 0xba, WIDTH * 3); memset(dst1, 0xba, WIDTH * 3); call_ref(dst0 + stride, prev0 + stride * 4, cur0 + stride * 4, next0 + stride * 4, WIDTH, stride, -stride, stride * 2, -stride * 2, parity, mask, spat); call_new(dst1 + stride, prev1 + stride * 4, cur1 + stride * 4, next1 + stride * 4, WIDTH, stride, -stride, stride * 2, -stride * 2, parity, mask, spat); if (memcmp(dst0, dst1, WIDTH*3) || memcmp(prev0, prev1, WIDTH*11) || memcmp(next0, next1, WIDTH*11) || memcmp( cur0, cur1, WIDTH*11)) fail(); bench_new(dst1 + stride, prev1 + stride * 4, cur1 + stride * 4, next1 + stride * 4, WIDTH, stride, -stride, stride * 2, -stride * 2, parity, mask, spat); } } } report("bwdif8.edge"); } if (check_func(ctx_8.filter_intra, "bwdif8.intra")) { LOCAL_ALIGNED_16(uint8_t, cur0, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, cur1, [11*WIDTH]); LOCAL_ALIGNED_16(uint8_t, dst0, [WIDTH*3]); LOCAL_ALIGNED_16(uint8_t, dst1, [WIDTH*3]); const int stride = WIDTH; const int mask = (1<<8)-1; declare_func(void, void *dst1, const void *cur1, int w, int prefs, int mrefs, int prefs3, int mrefs3, int parity, int clip_max); randomize_buffers( cur0, cur1, mask, 11*WIDTH); memset(dst0, 0xba, WIDTH * 3); memset(dst1, 0xba, WIDTH * 3); call_ref(dst0 + stride, cur0 + stride * 4, WIDTH, stride, -stride, stride * 3, -stride * 3, 0, mask); call_new(dst1 + stride, cur0 + stride * 4, WIDTH, stride, -stride, stride * 3, -stride * 3, 0, mask); if (memcmp(dst0, dst1, WIDTH*3) || memcmp( cur0, cur1, WIDTH*11)) fail(); bench_new(dst1 + stride, cur0 + stride * 4, WIDTH, stride, -stride, stride * 3, -stride * 3, 0, mask); report("bwdif8.intra"); } }