/* * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with FFmpeg; if not, write to the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */ #include #include #include #include "checkasm.h" #include "libavutil/intreadwrite.h" #include "libavutil/macros.h" #include "libavutil/mem_internal.h" #include "libavcodec/vp6data.h" #include "libavcodec/vp56dsp.h" #define randomize_buffer(buf) \ do { \ for (size_t k = 0; k < (sizeof(buf) & ~3); k += 4) \ AV_WN32A(buf + k, rnd()); \ for (size_t k = sizeof(buf) & ~3; k < sizeof(buf); ++k) \ buf[k] = rnd(); \ } while (0) void checkasm_check_vp6dsp(void) { enum { BLOCK_SIZE_1D = 8, SRC_ROWS_ABOVE = 1, SRC_ROWS_BELOW = 2, SRC_COLS_LEFT = 1, SRC_COLS_RIGHT = 2, SRC_ROWS = SRC_ROWS_ABOVE + BLOCK_SIZE_1D + SRC_ROWS_BELOW, SRC_ROW_SIZE = SRC_COLS_LEFT + BLOCK_SIZE_1D + SRC_COLS_RIGHT, MAX_STRIDE = 64, ///< arbitrary SRC_BUF_SIZE = (SRC_ROWS - 1) * MAX_STRIDE + SRC_ROW_SIZE + 7 /* to vary misalignment */, DST_BUF_SIZE = (BLOCK_SIZE_1D - 1) * MAX_STRIDE + BLOCK_SIZE_1D, }; VP6DSPContext vp6dsp; ff_vp6dsp_init(&vp6dsp); declare_func(void, uint8_t *dst, const uint8_t *src, ptrdiff_t stride, const int16_t *h_weights, const int16_t *v_weights); if (check_func(vp6dsp.vp6_filter_diag4, "filter_diag4")) { DECLARE_ALIGNED(8, uint8_t, dstbuf_ref)[DST_BUF_SIZE]; DECLARE_ALIGNED(8, uint8_t, dstbuf_new)[DST_BUF_SIZE]; DECLARE_ALIGNED(8, uint8_t, srcbuf)[SRC_BUF_SIZE]; randomize_buffer(dstbuf_ref); randomize_buffer(srcbuf); memcpy(dstbuf_new, dstbuf_ref, sizeof(dstbuf_new)); ptrdiff_t stride = (rnd() % (MAX_STRIDE / 16) + 1) * 16; const uint8_t *src = srcbuf + SRC_COLS_LEFT + rnd() % 8U; uint8_t *dst_new = dstbuf_new, *dst_ref = dstbuf_ref; if (rnd() & 1) { dst_new += (BLOCK_SIZE_1D - 1) * stride; dst_ref += (BLOCK_SIZE_1D - 1) * stride; src += (SRC_ROWS - 1) * stride; stride *= -1; } src += SRC_ROWS_ABOVE * stride; unsigned select = rnd() % FF_ARRAY_ELEMS(vp6_block_copy_filter); unsigned x8 = 1 + rnd() % (FF_ARRAY_ELEMS(vp6_block_copy_filter[0]) - 1); unsigned y8 = 1 + rnd() % (FF_ARRAY_ELEMS(vp6_block_copy_filter[0]) - 1); const int16_t *h_weights = vp6_block_copy_filter[select][x8]; const int16_t *v_weights = vp6_block_copy_filter[select][y8]; call_ref(dst_ref, src, stride, h_weights, v_weights); call_new(dst_new, src, stride, h_weights, v_weights); if (memcmp(dstbuf_new, dstbuf_ref, sizeof(dstbuf_new))) fail(); bench_new(dst_new, src, stride, h_weights, v_weights); } report("filter_diag4"); }