mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2026-01-12 00:06:51 +08:00
Reviewed-by: Kacper Michajłow <kasper93@gmail.com> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
275 lines
10 KiB
C
275 lines
10 KiB
C
/*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <stddef.h>
|
|
|
|
#include "config.h"
|
|
|
|
#include "checkasm.h"
|
|
|
|
#include "libavcodec/idctdsp.h"
|
|
#include "libavcodec/mathops.h"
|
|
#include "libavcodec/mpegvideo.h"
|
|
#include "libavcodec/mpegvideodata.h"
|
|
#include "libavcodec/mpegvideo_unquantize.h"
|
|
|
|
#include "libavutil/intreadwrite.h"
|
|
#include "libavutil/mem_internal.h"
|
|
|
|
#define randomize_struct(TYPE, s) do { \
|
|
static_assert(!(_Alignof(TYPE) % 4), \
|
|
"can't use aligned stores"); \
|
|
unsigned char *ptr = (unsigned char*)s; \
|
|
for (size_t i = 0; i < sizeof(*s) & ~3; i += 4) \
|
|
AV_WN32A(ptr + i, rnd()); \
|
|
for (size_t i = sizeof(*s) & ~3; i < sizeof(*s); ++i) \
|
|
ptr[i] = rnd(); \
|
|
} while (0)
|
|
|
|
enum TestType {
|
|
H263,
|
|
MPEG1,
|
|
MPEG2,
|
|
};
|
|
|
|
static void init_idct_scantable(MPVContext *const s, int intra_scantable)
|
|
{
|
|
static const enum idct_permutation_type permutation_types[] = {
|
|
FF_IDCT_PERM_NONE,
|
|
FF_IDCT_PERM_LIBMPEG2,
|
|
#if ARCH_X86_32 && HAVE_X86ASM
|
|
FF_IDCT_PERM_SIMPLE,
|
|
#endif
|
|
#if ARCH_PPC || ARCH_X86
|
|
FF_IDCT_PERM_TRANSPOSE,
|
|
#endif
|
|
#if ARCH_ARM || ARCH_AARCH64
|
|
FF_IDCT_PERM_PARTTRANS,
|
|
#endif
|
|
#if ARCH_X86 && HAVE_X86ASM
|
|
FF_IDCT_PERM_SSE2,
|
|
#endif
|
|
};
|
|
// Copied here to avoid #ifs.
|
|
static const uint8_t ff_wmv1_scantable[][64] = {
|
|
{ 0x00, 0x08, 0x01, 0x02, 0x09, 0x10, 0x18, 0x11,
|
|
0x0A, 0x03, 0x04, 0x0B, 0x12, 0x19, 0x20, 0x28,
|
|
0x30, 0x38, 0x29, 0x21, 0x1A, 0x13, 0x0C, 0x05,
|
|
0x06, 0x0D, 0x14, 0x1B, 0x22, 0x31, 0x39, 0x3A,
|
|
0x32, 0x2A, 0x23, 0x1C, 0x15, 0x0E, 0x07, 0x0F,
|
|
0x16, 0x1D, 0x24, 0x2B, 0x33, 0x3B, 0x3C, 0x34,
|
|
0x2C, 0x25, 0x1E, 0x17, 0x1F, 0x26, 0x2D, 0x35,
|
|
0x3D, 0x3E, 0x36, 0x2E, 0x27, 0x2F, 0x37, 0x3F, },
|
|
{ 0x00, 0x08, 0x01, 0x02, 0x09, 0x10, 0x18, 0x11,
|
|
0x0A, 0x03, 0x04, 0x0B, 0x12, 0x19, 0x20, 0x28,
|
|
0x21, 0x30, 0x1A, 0x13, 0x0C, 0x05, 0x06, 0x0D,
|
|
0x14, 0x1B, 0x22, 0x29, 0x38, 0x31, 0x39, 0x2A,
|
|
0x23, 0x1C, 0x15, 0x0E, 0x07, 0x0F, 0x16, 0x1D,
|
|
0x24, 0x2B, 0x32, 0x3A, 0x33, 0x3B, 0x2C, 0x25,
|
|
0x1E, 0x17, 0x1F, 0x26, 0x2D, 0x34, 0x3C, 0x35,
|
|
0x3D, 0x2E, 0x27, 0x2F, 0x36, 0x3E, 0x37, 0x3F, },
|
|
{ 0x00, 0x01, 0x08, 0x02, 0x03, 0x09, 0x10, 0x18,
|
|
0x11, 0x0A, 0x04, 0x05, 0x0B, 0x12, 0x19, 0x20,
|
|
0x28, 0x30, 0x21, 0x1A, 0x13, 0x0C, 0x06, 0x07,
|
|
0x0D, 0x14, 0x1B, 0x22, 0x29, 0x38, 0x31, 0x39,
|
|
0x2A, 0x23, 0x1C, 0x15, 0x0E, 0x0F, 0x16, 0x1D,
|
|
0x24, 0x2B, 0x32, 0x3A, 0x33, 0x2C, 0x25, 0x1E,
|
|
0x17, 0x1F, 0x26, 0x2D, 0x34, 0x3B, 0x3C, 0x35,
|
|
0x2E, 0x27, 0x2F, 0x36, 0x3D, 0x3E, 0x37, 0x3F, },
|
|
{ 0x00, 0x08, 0x10, 0x01, 0x18, 0x20, 0x28, 0x09,
|
|
0x02, 0x03, 0x0A, 0x11, 0x19, 0x30, 0x38, 0x29,
|
|
0x21, 0x1A, 0x12, 0x0B, 0x04, 0x05, 0x0C, 0x13,
|
|
0x1B, 0x22, 0x31, 0x39, 0x32, 0x2A, 0x23, 0x1C,
|
|
0x14, 0x0D, 0x06, 0x07, 0x0E, 0x15, 0x1D, 0x24,
|
|
0x2B, 0x33, 0x3A, 0x3B, 0x34, 0x2C, 0x25, 0x1E,
|
|
0x16, 0x0F, 0x17, 0x1F, 0x26, 0x2D, 0x3C, 0x35,
|
|
0x2E, 0x27, 0x2F, 0x36, 0x3D, 0x3E, 0x37, 0x3F, }
|
|
};
|
|
|
|
static const uint8_t *const scantables[] = {
|
|
ff_alternate_vertical_scan,
|
|
ff_alternate_horizontal_scan,
|
|
ff_zigzag_direct,
|
|
ff_wmv1_scantable[0],
|
|
ff_wmv1_scantable[1],
|
|
ff_wmv1_scantable[2],
|
|
ff_wmv1_scantable[3],
|
|
};
|
|
static const uint8_t *scantable = NULL;
|
|
static enum idct_permutation_type idct_permutation;
|
|
|
|
if (!scantable) {
|
|
scantable = scantables[rnd() % FF_ARRAY_ELEMS(scantables)];
|
|
idct_permutation = permutation_types[rnd() % FF_ARRAY_ELEMS(permutation_types)];
|
|
}
|
|
ff_init_scantable_permutation(s->idsp.idct_permutation, idct_permutation);
|
|
ff_init_scantable(s->idsp.idct_permutation,
|
|
intra_scantable ? &s->intra_scantable : &s->inter_scantable,
|
|
scantable);
|
|
}
|
|
|
|
static void init_h263_test(MPVContext *const s, int16_t block[64],
|
|
int last_nonzero_coeff, int qscale, int intra)
|
|
{
|
|
const uint8_t *permutation = s->inter_scantable.permutated;
|
|
if (intra) {
|
|
permutation = s->intra_scantable.permutated;
|
|
block[0] = rnd() & 511;
|
|
static int h263_aic = -1, ac_pred;
|
|
if (h263_aic < 0) {
|
|
h263_aic = rnd() & 1;
|
|
ac_pred = rnd() & 1;
|
|
}
|
|
s->h263_aic = h263_aic;
|
|
s->ac_pred = ac_pred;
|
|
if (s->ac_pred)
|
|
last_nonzero_coeff = 63;
|
|
}
|
|
for (int i = intra; i <= last_nonzero_coeff; ++i) {
|
|
int random = rnd();
|
|
if (random & 1)
|
|
continue;
|
|
random >>= 1;
|
|
// Select level so that the multiplication fits into 16 bits.
|
|
// FIXME: The FLV and MPEG-4 decoders can have escape values exceeding this.
|
|
block[permutation[i]] = sign_extend(random, 10);
|
|
}
|
|
}
|
|
|
|
static void init_mpeg12_test(MPVContext *const s, int16_t block[64],
|
|
int last_nonzero_coeff, int qscale, int intra,
|
|
enum TestType type)
|
|
{
|
|
uint16_t *matrix = intra ? s->intra_matrix : s->inter_matrix;
|
|
|
|
if (type == MPEG2)
|
|
qscale = s->q_scale_type ? ff_mpeg2_non_linear_qscale[qscale] : qscale << 1;
|
|
|
|
for (int i = 0; i < 64; ++i)
|
|
matrix[i] = 1 + rnd() % 254;
|
|
|
|
const uint8_t *permutation = s->intra_scantable.permutated;
|
|
if (intra) {
|
|
block[0] = (int8_t)rnd();
|
|
for (int i = 1; i <= last_nonzero_coeff; ++i) {
|
|
int j = permutation[i];
|
|
unsigned random = rnd();
|
|
if (random & 1)
|
|
continue;
|
|
random >>= 1;
|
|
// Select level so that the multiplication does not overflow
|
|
// an int16_t and so that it is within the possible range
|
|
// (-2048..2047). FIXME: It seems that this need not be fulfilled
|
|
// in practice for the MPEG-4 decoder at least.
|
|
int limit = FFMIN(INT16_MAX / (qscale * matrix[j]), 2047);
|
|
block[j] = random % (2 * limit + 1) - limit;
|
|
}
|
|
} else {
|
|
for (int i = 0; i <= last_nonzero_coeff; ++i) {
|
|
int j = permutation[i];
|
|
unsigned random = rnd();
|
|
if (random & 1)
|
|
continue;
|
|
random >>= 1;
|
|
int limit = FFMIN((INT16_MAX / (qscale * matrix[j]) - 1) / 2, 2047);
|
|
block[j] = random % (2 * limit + 1) - limit;
|
|
}
|
|
}
|
|
}
|
|
|
|
void checkasm_check_mpegvideo_unquantize(void)
|
|
{
|
|
static const struct {
|
|
const char *name;
|
|
size_t offset;
|
|
int intra, intra_scantable;
|
|
enum TestType type;
|
|
} tests[] = {
|
|
#define TEST(NAME, INTRA, INTRA_SCANTABLE, TYPE) \
|
|
{ .name = #NAME, .offset = offsetof(MPVUnquantDSPContext, NAME), \
|
|
.intra = INTRA, .intra_scantable = INTRA_SCANTABLE, .type = TYPE }
|
|
TEST(dct_unquantize_mpeg1_intra, 1, 1, MPEG1),
|
|
TEST(dct_unquantize_mpeg1_inter, 0, 1, MPEG1),
|
|
TEST(dct_unquantize_mpeg2_intra, 1, 1, MPEG2),
|
|
TEST(dct_unquantize_mpeg2_inter, 0, 1, MPEG2),
|
|
TEST(dct_unquantize_h263_intra, 1, 1, H263),
|
|
TEST(dct_unquantize_h263_inter, 0, 0, H263),
|
|
};
|
|
MPVUnquantDSPContext unquant_dsp_ctx;
|
|
int q_scale_type = rnd() & 1;
|
|
|
|
ff_mpv_unquantize_init(&unquant_dsp_ctx, 1 /* bitexact */, q_scale_type);
|
|
declare_func(void, const MPVContext *s, int16_t *block, int n, int qscale);
|
|
|
|
for (size_t i = 0; i < FF_ARRAY_ELEMS(tests); ++i) {
|
|
void (*func)(const MPVContext *s, int16_t *block, int n, int qscale) =
|
|
*(void (**)(const MPVContext *, int16_t *, int, int))((char*)&unquant_dsp_ctx + tests[i].offset);
|
|
if (check_func(func, "%s", tests[i].name)) {
|
|
MPVContext new, ref;
|
|
DECLARE_ALIGNED(16, int16_t, block_new)[64];
|
|
DECLARE_ALIGNED(16, int16_t, block_ref)[64];
|
|
static int block_last_index = -1;
|
|
|
|
randomize_struct(MPVContext, &ref);
|
|
|
|
ref.q_scale_type = q_scale_type;
|
|
|
|
init_idct_scantable(&ref, tests[i].intra_scantable);
|
|
|
|
if (block_last_index < 0)
|
|
block_last_index = rnd() % 64;
|
|
|
|
memset(block_ref, 0, sizeof(block_ref));
|
|
|
|
if (tests[i].intra) {
|
|
// Less restricted than real dc_scale values
|
|
ref.y_dc_scale = 1 + rnd() % 64;
|
|
ref.c_dc_scale = 1 + rnd() % 64;
|
|
}
|
|
|
|
static int qscale = 0;
|
|
|
|
if (qscale == 0)
|
|
qscale = 1 + rnd() % 31;
|
|
|
|
if (tests[i].type == H263)
|
|
init_h263_test(&ref, block_ref, block_last_index, qscale,
|
|
tests[i].intra);
|
|
else
|
|
init_mpeg12_test(&ref, block_ref, block_last_index, qscale,
|
|
tests[i].intra, tests[i].type);
|
|
|
|
int n = rnd() % 6;
|
|
ref.block_last_index[n] = block_last_index;
|
|
|
|
memcpy(&new, &ref, sizeof(new));
|
|
memcpy(block_new, block_ref, sizeof(block_new));
|
|
|
|
call_ref(&ref, block_ref, n, qscale);
|
|
call_new(&new, block_new, n, qscale);
|
|
|
|
if (memcmp(&ref, &new, sizeof(new)) || memcmp(block_new, block_ref, sizeof(block_new)))
|
|
fail();
|
|
|
|
bench_new(&new, block_new, n, qscale);
|
|
}
|
|
report("%s", tests[i].name);
|
|
}
|
|
}
|