You've already forked FFmpeg
mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2025-11-23 21:54:53 +02:00
Reviewed-by: Lynne <dev@lynne.ee> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
211 lines
7.3 KiB
C
211 lines
7.3 KiB
C
/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
|
#include "libavutil/common.h"
|
|
#include "libavutil/intreadwrite.h"
|
|
#include "libavutil/mem_internal.h"
|
|
|
|
#include "libavcodec/mathops.h"
|
|
#include "libavcodec/mpegvideoencdsp.h"
|
|
|
|
#include "checkasm.h"
|
|
|
|
/*
 * Fill the first `size` bytes of `buf` with values from rnd().
 *
 * Each iteration stores one 32-bit value with AV_WN32() and advances by four
 * bytes, so `size` is expected to be a multiple of 4; otherwise the last
 * store would run past `size`.
 *
 * Both parameters are parenthesized so that expression arguments (for
 * example `ptr + 1` with a non-char pointer) address the intended bytes.
 */
#define randomize_buffers(buf, size)                \
    do {                                            \
        for (int j = 0; j < (size); j += 4)         \
            AV_WN32((char *)(buf) + j, rnd());      \
    } while (0)
|
|
|
|
/*
 * Assign every element of `buf` a value from rnd() reduced to the inclusive
 * range [min, max].
 *
 * The loop bound comes from FF_ARRAY_ELEMS(buf), so `buf` presumably has to
 * be a real array rather than a pointer.
 *
 * `min` and `max` are parenthesized so that expression arguments such as
 * `1 << 2` or a negative constant keep their intended value inside the
 * range computation.
 */
#define randomize_buffer_clipped(buf, min, max)                 \
    do {                                                        \
        for (size_t j = 0; j < FF_ARRAY_ELEMS(buf); ++j)        \
            (buf)[j] = rnd() % ((max) - (min) + 1) + (min);     \
    } while (0)
|
|
|
|
/*
 * Compare the reference and the candidate denoise_dct implementation.
 *
 * Both are called on identical copies of a random coefficient block and a
 * random error-sum table, sharing one random offset table. The check fails
 * if either the block or the error sums differ afterwards.
 */
static void check_denoise_dct(MpegvideoEncDSPContext *c)
{
    declare_func(void, int16_t block[64], int dct_error_sum[64],
                 const uint16_t dct_offset[64]);

    if (check_func(c->denoise_dct, "denoise_dct")) {
        DECLARE_ALIGNED(16, int16_t, block_ref)[64];
        DECLARE_ALIGNED(16, int16_t, block_new)[64];
        DECLARE_ALIGNED(16, int, dct_error_sum_ref)[64];
        DECLARE_ALIGNED(16, int, dct_error_sum_new)[64];
        DECLARE_ALIGNED(16, uint16_t, dct_offset)[64];

        for (size_t i = 0; i < FF_ARRAY_ELEMS(block_ref); ++i) {
            unsigned random = rnd();
            /* Bit 16 (outside the 16 bits that get stored) selects between
             * a random coefficient and an exact zero. */
            block_ref[i] = (random & (1 << 16)) ? random : 0;
        }
        randomize_buffers(dct_offset, sizeof(dct_offset));
        /* Error sums start out in [0, 2^24 - 1]. */
        randomize_buffer_clipped(dct_error_sum_ref, 0, (1 << 24) - 1);

        /* Give the candidate exactly the same starting state. */
        memcpy(block_new, block_ref, sizeof(block_new));
        memcpy(dct_error_sum_new, dct_error_sum_ref, sizeof(dct_error_sum_ref));

        call_ref(block_ref, dct_error_sum_ref, dct_offset);
        call_new(block_new, dct_error_sum_new, dct_offset);
        if (memcmp(block_ref, block_new, sizeof(block_ref)) ||
            memcmp(dct_error_sum_new, dct_error_sum_ref, sizeof(dct_error_sum_new)))
            fail();

        bench_new(block_new, dct_error_sum_new, dct_offset);
    }
}
|
|
|
|
/*
 * Compare the reference and the candidate add_8x8basis implementation.
 *
 * Inputs are a random 64-entry remainder block (duplicated for the two
 * calls), a basis with entries in [-15760, 15760] and a single random scale
 * obtained through sign_extend(rnd(), 12). The check fails if the two
 * remainder blocks differ after the calls.
 */
static void check_add_8x8basis(MpegvideoEncDSPContext *c)
{
    declare_func(void, int16_t rem[64], const int16_t basis[64], int scale);

    if (check_func(c->add_8x8basis, "add_8x8basis")) {
        // FIXME: What are the actual ranges for these values?
        int scale = sign_extend(rnd(), 12);
        DECLARE_ALIGNED(16, int16_t, rem1)[64];
        DECLARE_ALIGNED(16, int16_t, rem2)[64];
        DECLARE_ALIGNED(16, int16_t, basis)[64];

        randomize_buffer_clipped(basis, -15760, 15760);
        randomize_buffers(rem1, sizeof(rem1));
        /* rem2 starts as an exact copy so both calls see the same input. */
        memcpy(rem2, rem1, sizeof(rem2));

        call_ref(rem1, basis, scale);
        call_new(rem2, basis, scale);
        if (memcmp(rem1, rem2, sizeof(rem1)))
            fail();

        bench_new(rem1, basis, scale);
    }
}
|
|
|
|
/*
 * Compare the return value of the reference and the candidate pix_sum
 * implementation on a random 16 * 16 byte buffer.
 *
 * Two variants are checked: a stride of +16 starting at the first byte, and
 * ("_negstride") a stride of -16 starting at row 15 of the same buffer.
 */
static void check_pix_sum(MpegvideoEncDSPContext *c)
{
    LOCAL_ALIGNED_16(uint8_t, src, [16 * 16]);

    declare_func(int, const uint8_t *pix, ptrdiff_t line_size);

    randomize_buffers(src, 16 * 16);

    for (int n = 0; n < 2; n++) {
        const char *negstride_str = n ? "_negstride" : "";
        if (check_func(c->pix_sum, "pix_sum%s", negstride_str)) {
            int sum0, sum1;
            /* n == 1: begin at the last 16-byte row and step backwards. */
            const uint8_t *pix = src + (n ? (15 * 16) : 0);
            ptrdiff_t line_size = 16 * (n ? -1 : 1);

            sum0 = call_ref(pix, line_size);
            sum1 = call_new(pix, line_size);
            if (sum0 != sum1)
                fail();

            bench_new(pix, line_size);
        }
    }
}
|
|
|
|
/*
 * Compare the return value of the reference and the candidate pix_norm1
 * implementation on a random 16 * 16 byte buffer.
 *
 * Two variants are checked: a stride of +16 starting at the first byte, and
 * ("_negstride") a stride of -16 starting at row 15 of the same buffer.
 */
static void check_pix_norm1(MpegvideoEncDSPContext *c)
{
    LOCAL_ALIGNED_16(uint8_t, src, [16 * 16]);

    declare_func(int, const uint8_t *pix, ptrdiff_t line_size);

    randomize_buffers(src, 16 * 16);

    for (int n = 0; n < 2; n++) {
        const char *negstride_str = n ? "_negstride" : "";
        if (check_func(c->pix_norm1, "pix_norm1%s", negstride_str)) {
            int sum0, sum1;
            /* n == 1: begin at the last 16-byte row and step backwards. */
            const uint8_t *pix = src + (n ? (15 * 16) : 0);
            ptrdiff_t line_size = 16 * (n ? -1 : 1);

            sum0 = call_ref(pix, line_size);
            sum1 = call_new(pix, line_size);
            if (sum0 != sum1)
                fail();

            bench_new(pix, line_size);
        }
    }
}
|
|
|
|
/*
 * Geometry of the scratch buffers used by check_draw_edges().
 *
 * A buffer holds NUM_LINES payload rows at the widest tested line size,
 * surrounded by EDGE_WIDTH extra rows above and below and EDGE_WIDTH extra
 * bytes on each side of every row.
 */
#define NUM_LINES 4
#define MAX_LINE_SIZE 1920
#define EDGE_WIDTH 16
/* Bytes per row at the widest line size, both side edges included. */
#define LINESIZE (EDGE_WIDTH + MAX_LINE_SIZE + EDGE_WIDTH)
/* Total buffer size in bytes, top and bottom edge rows included. */
#define BUFSIZE ((EDGE_WIDTH + NUM_LINES + EDGE_WIDTH) * LINESIZE)
|
|
|
|
/*
 * Compare the reference and the candidate draw_edges implementation.
 *
 * For each entry of input_sizes the absolute value is the tested width and a
 * negative entry selects a negative line stride. The height is derived from
 * the width so that the rows plus their edges fill the BUFSIZE-byte buffer.
 * Each width is checked with edge sizes EDGE_WIDTH, EDGE_WIDTH / 2 and
 * EDGE_WIDTH / 4, always with EDGE_BOTTOM | EDGE_TOP. The two complete
 * buffers are compared, so a stray write anywhere in them is detected.
 */
static void check_draw_edges(MpegvideoEncDSPContext *c)
{
    static const int input_sizes[] = {8, 128, 1080, MAX_LINE_SIZE, -MAX_LINE_SIZE};
    LOCAL_ALIGNED_16(uint8_t, buf0, [BUFSIZE]);
    LOCAL_ALIGNED_16(uint8_t, buf1, [BUFSIZE]);

    declare_func_emms(AV_CPU_FLAG_MMX, void, uint8_t *buf, ptrdiff_t wrap, int width, int height,
                      int w, int h, int sides);

    for (size_t isi = 0; isi < FF_ARRAY_ELEMS(input_sizes); isi++) {
        int input_size = input_sizes[isi];
        int negstride = input_size < 0;
        const char *negstride_str = negstride ? "_negstride" : "";
        int width = FFABS(input_size);
        ptrdiff_t linesize = EDGE_WIDTH + width + EDGE_WIDTH;
        /* calculate height based on specified width to use the entire buffer. */
        int height = (BUFSIZE / linesize) - (2 * EDGE_WIDTH);
        /* Skip the top edge rows and the left edge bytes. */
        uint8_t *dst0 = buf0 + EDGE_WIDTH * linesize + EDGE_WIDTH;
        uint8_t *dst1 = buf1 + EDGE_WIDTH * linesize + EDGE_WIDTH;

        if (negstride) {
            /* Start at the last payload row and walk the rows backwards. */
            dst0 += (height - 1) * linesize;
            dst1 += (height - 1) * linesize;
            linesize *= -1;
        }

        for (int shift = 0; shift < 3; shift++) {
            int edge = EDGE_WIDTH >> shift;
            if (check_func(c->draw_edges, "draw_edges_%d_%d_%d%s", width, height, edge, negstride_str)) {
                randomize_buffers(buf0, BUFSIZE);
                memcpy(buf1, buf0, BUFSIZE);
                call_ref(dst0, linesize, width, height, edge, edge, EDGE_BOTTOM | EDGE_TOP);
                call_new(dst1, linesize, width, height, edge, edge, EDGE_BOTTOM | EDGE_TOP);
                if (memcmp(buf0, buf1, BUFSIZE))
                    fail();
                bench_new(dst1, linesize, width, height, edge, edge, EDGE_BOTTOM | EDGE_TOP);
            }
        }
    }
}
|
|
|
|
/* The buffer geometry macros are only meant for check_draw_edges(). */
#undef NUM_LINES
#undef MAX_LINE_SIZE
#undef EDGE_WIDTH
#undef LINESIZE
#undef BUFSIZE
|
|
|
|
void checkasm_check_mpegvideoencdsp(void)
|
|
{
|
|
AVCodecContext avctx = {
|
|
.bits_per_raw_sample = 8,
|
|
};
|
|
MpegvideoEncDSPContext c = { 0 };
|
|
|
|
ff_mpegvideoencdsp_init(&c, &avctx);
|
|
|
|
check_denoise_dct(&c);
|
|
report("denoise_dct");
|
|
check_pix_sum(&c);
|
|
report("pix_sum");
|
|
check_pix_norm1(&c);
|
|
report("pix_norm1");
|
|
check_draw_edges(&c);
|
|
report("draw_edges");
|
|
check_add_8x8basis(&c);
|
|
report("add_8x8basis");
|
|
}
|