/* * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #include #include #include "config.h" #include "checkasm.h" #include "libavcodec/idctdsp.h" #include "libavcodec/mathops.h" #include "libavcodec/mpegvideo.h" #include "libavcodec/mpegvideodata.h" #include "libavcodec/mpegvideo_unquantize.h" #include "libavutil/intreadwrite.h" #include "libavutil/mem_internal.h" #define randomize_struct(TYPE, s) do { \ static_assert(!(_Alignof(TYPE) % 4), \ "can't use aligned stores"); \ unsigned char *ptr = (unsigned char*)s; \ for (size_t i = 0; i < sizeof(*s) & ~3; i += 4) \ AV_WN32A(ptr + i, rnd()); \ for (size_t i = sizeof(*s) & ~3; i < sizeof(*s); ++i) \ ptr[i] = rnd(); \ } while (0) enum TestType { H263, MPEG1, MPEG2, }; static void init_idct_scantable(MPVContext *const s, int intra_scantable) { static const enum idct_permutation_type permutation_types[] = { FF_IDCT_PERM_NONE, FF_IDCT_PERM_LIBMPEG2, #if ARCH_X86_32 && HAVE_X86ASM FF_IDCT_PERM_SIMPLE, #endif #if ARCH_PPC || ARCH_X86 FF_IDCT_PERM_TRANSPOSE, #endif #if ARCH_ARM || ARCH_AARCH64 FF_IDCT_PERM_PARTTRANS, #endif #if ARCH_X86 && HAVE_X86ASM FF_IDCT_PERM_SSE2, #endif }; // Copied here to avoid #ifs. static const uint8_t ff_wmv1_scantable[][64] = { { 0x00, 0x08, 0x01, 0x02, 0x09, 0x10, 0x18, 0x11, 0x0A, 0x03, 0x04, 0x0B, 0x12, 0x19, 0x20, 0x28, 0x30, 0x38, 0x29, 0x21, 0x1A, 0x13, 0x0C, 0x05, 0x06, 0x0D, 0x14, 0x1B, 0x22, 0x31, 0x39, 0x3A, 0x32, 0x2A, 0x23, 0x1C, 0x15, 0x0E, 0x07, 0x0F, 0x16, 0x1D, 0x24, 0x2B, 0x33, 0x3B, 0x3C, 0x34, 0x2C, 0x25, 0x1E, 0x17, 0x1F, 0x26, 0x2D, 0x35, 0x3D, 0x3E, 0x36, 0x2E, 0x27, 0x2F, 0x37, 0x3F, }, { 0x00, 0x08, 0x01, 0x02, 0x09, 0x10, 0x18, 0x11, 0x0A, 0x03, 0x04, 0x0B, 0x12, 0x19, 0x20, 0x28, 0x21, 0x30, 0x1A, 0x13, 0x0C, 0x05, 0x06, 0x0D, 0x14, 0x1B, 0x22, 0x29, 0x38, 0x31, 0x39, 0x2A, 0x23, 0x1C, 0x15, 0x0E, 0x07, 0x0F, 0x16, 0x1D, 0x24, 0x2B, 0x32, 0x3A, 0x33, 0x3B, 0x2C, 0x25, 0x1E, 0x17, 0x1F, 0x26, 0x2D, 0x34, 0x3C, 0x35, 0x3D, 0x2E, 0x27, 0x2F, 0x36, 0x3E, 0x37, 0x3F, }, { 0x00, 0x01, 0x08, 0x02, 0x03, 0x09, 0x10, 0x18, 0x11, 0x0A, 0x04, 0x05, 0x0B, 0x12, 0x19, 0x20, 0x28, 0x30, 0x21, 0x1A, 0x13, 0x0C, 0x06, 0x07, 0x0D, 0x14, 0x1B, 0x22, 0x29, 0x38, 0x31, 0x39, 0x2A, 0x23, 0x1C, 0x15, 0x0E, 0x0F, 0x16, 0x1D, 0x24, 0x2B, 0x32, 0x3A, 0x33, 0x2C, 0x25, 0x1E, 0x17, 0x1F, 0x26, 0x2D, 0x34, 0x3B, 0x3C, 0x35, 0x2E, 0x27, 0x2F, 0x36, 0x3D, 0x3E, 0x37, 0x3F, }, { 0x00, 0x08, 0x10, 0x01, 0x18, 0x20, 0x28, 0x09, 0x02, 0x03, 0x0A, 0x11, 0x19, 0x30, 0x38, 0x29, 0x21, 0x1A, 0x12, 0x0B, 0x04, 0x05, 0x0C, 0x13, 0x1B, 0x22, 0x31, 0x39, 0x32, 0x2A, 0x23, 0x1C, 0x14, 0x0D, 0x06, 0x07, 0x0E, 0x15, 0x1D, 0x24, 0x2B, 0x33, 0x3A, 0x3B, 0x34, 0x2C, 0x25, 0x1E, 0x16, 0x0F, 0x17, 0x1F, 0x26, 0x2D, 0x3C, 0x35, 0x2E, 0x27, 0x2F, 0x36, 0x3D, 0x3E, 0x37, 0x3F, } }; static const uint8_t *const scantables[] = { ff_alternate_vertical_scan, ff_alternate_horizontal_scan, ff_zigzag_direct, ff_wmv1_scantable[0], ff_wmv1_scantable[1], ff_wmv1_scantable[2], ff_wmv1_scantable[3], }; static const uint8_t *scantable = NULL; static enum idct_permutation_type idct_permutation; if (!scantable) { scantable = scantables[rnd() % FF_ARRAY_ELEMS(scantables)]; idct_permutation = permutation_types[rnd() % FF_ARRAY_ELEMS(permutation_types)]; } ff_init_scantable_permutation(s->idsp.idct_permutation, idct_permutation); ff_init_scantable(s->idsp.idct_permutation, intra_scantable ? &s->intra_scantable : &s->inter_scantable, scantable); } static void init_h263_test(MPVContext *const s, int16_t block[64], int last_nonzero_coeff, int qscale, int intra) { const uint8_t *permutation = s->inter_scantable.permutated; if (intra) { permutation = s->intra_scantable.permutated; block[0] = rnd() & 511; static int h263_aic = -1, ac_pred; if (h263_aic < 0) { h263_aic = rnd() & 1; ac_pred = rnd() & 1; } s->h263_aic = h263_aic; s->ac_pred = ac_pred; if (s->ac_pred) last_nonzero_coeff = 63; } for (int i = intra; i <= last_nonzero_coeff; ++i) { int random = rnd(); if (random & 1) continue; random >>= 1; // Select level so that the multiplication fits into 16 bits. // FIXME: The FLV and MPEG-4 decoders can have escape values exceeding this. block[permutation[i]] = sign_extend(random, 10); } } static void init_mpeg12_test(MPVContext *const s, int16_t block[64], int last_nonzero_coeff, int qscale, int intra, enum TestType type) { uint16_t *matrix = intra ? s->intra_matrix : s->inter_matrix; if (type == MPEG2) qscale = s->q_scale_type ? ff_mpeg2_non_linear_qscale[qscale] : qscale << 1; for (int i = 0; i < 64; ++i) matrix[i] = 1 + rnd() % 254; const uint8_t *permutation = s->intra_scantable.permutated; if (intra) { block[0] = (int8_t)rnd(); for (int i = 1; i <= last_nonzero_coeff; ++i) { int j = permutation[i]; unsigned random = rnd(); if (random & 1) continue; random >>= 1; // Select level so that the multiplication does not overflow // an int16_t and so that it is within the possible range // (-2048..2047). FIXME: It seems that this need not be fulfilled // in practice for the MPEG-4 decoder at least. int limit = FFMIN(INT16_MAX / (qscale * matrix[j]), 2047); block[j] = random % (2 * limit + 1) - limit; } } else { for (int i = 0; i <= last_nonzero_coeff; ++i) { int j = permutation[i]; unsigned random = rnd(); if (random & 1) continue; random >>= 1; int limit = FFMIN((INT16_MAX / (qscale * matrix[j]) - 1) / 2, 2047); block[j] = random % (2 * limit + 1) - limit; } } } void checkasm_check_mpegvideo_unquantize(void) { static const struct { const char *name; size_t offset; int intra, intra_scantable; enum TestType type; } tests[] = { #define TEST(NAME, INTRA, INTRA_SCANTABLE, TYPE) \ { .name = #NAME, .offset = offsetof(MPVUnquantDSPContext, NAME), \ .intra = INTRA, .intra_scantable = INTRA_SCANTABLE, .type = TYPE } TEST(dct_unquantize_mpeg1_intra, 1, 1, MPEG1), TEST(dct_unquantize_mpeg1_inter, 0, 1, MPEG1), TEST(dct_unquantize_mpeg2_intra, 1, 1, MPEG2), TEST(dct_unquantize_mpeg2_inter, 0, 1, MPEG2), TEST(dct_unquantize_h263_intra, 1, 1, H263), TEST(dct_unquantize_h263_inter, 0, 0, H263), }; MPVUnquantDSPContext unquant_dsp_ctx; int q_scale_type = rnd() & 1; ff_mpv_unquantize_init(&unquant_dsp_ctx, 1 /* bitexact */, q_scale_type); declare_func(void, const MPVContext *s, int16_t *block, int n, int qscale); for (size_t i = 0; i < FF_ARRAY_ELEMS(tests); ++i) { void (*func)(const MPVContext *s, int16_t *block, int n, int qscale) = *(void (**)(const MPVContext *, int16_t *, int, int))((char*)&unquant_dsp_ctx + tests[i].offset); if (check_func(func, "%s", tests[i].name)) { MPVContext new, ref; DECLARE_ALIGNED(16, int16_t, block_new)[64]; DECLARE_ALIGNED(16, int16_t, block_ref)[64]; static int block_last_index = -1; randomize_struct(MPVContext, &ref); ref.q_scale_type = q_scale_type; init_idct_scantable(&ref, tests[i].intra_scantable); if (block_last_index < 0) block_last_index = rnd() % 64; memset(block_ref, 0, sizeof(block_ref)); if (tests[i].intra) { // Less restricted than real dc_scale values ref.y_dc_scale = 1 + rnd() % 64; ref.c_dc_scale = 1 + rnd() % 64; } static int qscale = 0; if (qscale == 0) qscale = 1 + rnd() % 31; if (tests[i].type == H263) init_h263_test(&ref, block_ref, block_last_index, qscale, tests[i].intra); else init_mpeg12_test(&ref, block_ref, block_last_index, qscale, tests[i].intra, tests[i].type); int n = rnd() % 6; ref.block_last_index[n] = block_last_index; memcpy(&new, &ref, sizeof(new)); memcpy(block_new, block_ref, sizeof(block_new)); call_ref(&ref, block_ref, n, qscale); call_new(&new, block_new, n, qscale); if (memcmp(&ref, &new, sizeof(new)) || memcmp(block_new, block_ref, sizeof(block_new))) fail(); bench_new(&new, block_new, n, qscale); } report("%s", tests[i].name); } }