1/*
2 * Copyright (c) 2016 Ronald S. Bultje <rsbultje@gmail.com>
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License along
17 * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
18 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
19 */
20
21#include <string.h>
22#include "checkasm.h"
23#include "libavcodec/videodsp.h"
24#include "libavutil/internal.h"
25#include "libavutil/intreadwrite.h"
26#include "libavutil/mem_internal.h"
27
/*
 * Fill the first (w) * (h) elements of the buffer named src0 with values
 * obtained from rnd().
 *
 * The macro deliberately captures src0 from the expansion site instead of
 * taking it as a parameter. The buffer is written in 4-byte steps through
 * AV_WN32A, so (w) * (h) * sizeof(*src0) is expected to be a multiple of 4;
 * otherwise the last store would run past the requested size.
 *
 * Both size arguments are parenthesized and evaluated once, so expressions
 * such as "a + b" may be passed safely.
 */
#define randomize_buffers(w, h)                                         \
    do {                                                                \
        const size_t rnd_size = (size_t) (w) * (h) * sizeof(*src0);     \
        size_t rnd_pos;                                                 \
        for (rnd_pos = 0; rnd_pos < rnd_size; rnd_pos += 4)             \
            AV_WN32A(((uint8_t *) src0) + rnd_pos, rnd());              \
    } while (0)
34
/*
 * Sweep one block coordinate while the other one stays fixed, checking the
 * function under test at every position.
 *
 *   type       element type of the source and destination buffers
 *   fix        coordinate lvalue that is set once to fix_val
 *   var        coordinate lvalue stepped from var_start to var_end,
 *              both bounds inclusive
 *
 * fix and var must be the variables x and y (in either order), because the
 * calls below read x and y directly. The macro also captures dst0, dst1,
 * src0, src1, bw, bh, pw and ph from the expansion site.
 *
 * At each position call_ref() and call_new() receive identical arguments,
 * with the source pointer offset by y * pw + x elements; the first
 * bw * bh elements of dst0 and dst1 are then compared and fail() is invoked
 * on a mismatch. bench_new() is run afterwards with the same arguments.
 *
 * All parameters are parenthesized and the loop is wrapped in
 * do { } while (0), so the macro accepts arbitrary expressions as bounds and
 * behaves as a single statement (e.g. as the body of an if/else).
 */
#define iter_1d(type, fix, fix_val, var, var_start, var_end)                \
    do {                                                                    \
        for ((fix) = (fix_val), (var) = (var_start);                        \
             (var) <= (var_end); (var)++) {                                 \
            call_ref((type *) dst0, (const type *) (src0 + y * pw + x),     \
                     bw * sizeof(type), pw * sizeof(type),                  \
                     bw, bh, x, y, pw, ph);                                 \
            call_new((type *) dst1, (const type *) (src1 + y * pw + x),     \
                     bw * sizeof(type), pw * sizeof(type),                  \
                     bw, bh, x, y, pw, ph);                                 \
            if (memcmp(dst0, dst1, bw * bh * sizeof(type)))                 \
                fail();                                                     \
            bench_new((type *) dst1, (const type *) (src1 + y * pw + x),    \
                      bw * sizeof(type), pw * sizeof(type),                 \
                      bw, bh, x, y, pw, ph);                                \
        }                                                                   \
    } while (0)
49
/*
 * Check the function under test for one source plane size and one output
 * block size.
 *
 *   type            element type of the buffers
 *   src_w, src_h    source plane dimensions in elements; used as array
 *                   dimensions for the local source buffers
 *   dst_w, dst_h    output block dimensions in elements
 *
 * Two source buffers are set up: src0 is filled by randomize_buffers() and
 * src1 is a copy of it. The variables bw, bh, pw, ph, x and y declared here
 * are consumed by iter_1d(), which is run four times so that the block
 * position walks the four sides of the rectangle
 * [-src_w, src_w] x [-src_h, src_h]:
 *   1. y = -src_h, x from -src_w to src_w
 *   2. x =  src_w, y from -src_h to src_h
 *   3. y =  src_h, x from -src_w to src_w
 *   4. x = -src_w, y from -src_h to src_h
 *
 * dst0 and dst1 must already be in scope at the expansion site (iter_1d()
 * writes to them). Size arguments are parenthesized, so expressions may be
 * passed for them.
 */
#define check_emu_edge_size(type, src_w, src_h, dst_w, dst_h)       \
    do {                                                            \
        LOCAL_ALIGNED_16(type, src0, [(src_w) * (src_h)]);          \
        LOCAL_ALIGNED_16(type, src1, [(src_w) * (src_h)]);          \
        int bw = (dst_w), bh = (dst_h);                             \
        int pw = (src_w), ph = (src_h);                             \
        int y, x;                                                   \
        randomize_buffers(pw, ph);                                  \
        memcpy(src1, src0, pw * ph * sizeof(type));                 \
        iter_1d(type, y, -ph, x, -pw, pw);                          \
        iter_1d(type, x,  pw, y, -ph, ph);                          \
        iter_1d(type, y,  ph, x, -pw, pw);                          \
        iter_1d(type, x, -pw, y, -ph, ph);                          \
    } while (0)
64
/*
 * Run the emulated-edge checks for one element type.
 *
 * Sets up the two 64 * 64 element destination buffers dst0 and dst1 that
 * the nested check macros write to, declares the signature of the function
 * under test through declare_func_emms(), and then invokes
 * check_emu_edge_size() for source planes of 16x1, 16x16 and 64x64
 * elements, always with a 64x64 output block.
 *
 * The statement order is significant: the buffers and the function
 * declaration must precede the check_emu_edge_size() expansions that use
 * them.
 */
#define check_emu_edge(type)                                                \
    do {                                                                    \
        LOCAL_ALIGNED_16(type, dst0, [64 * 64]);                            \
        LOCAL_ALIGNED_16(type, dst1, [64 * 64]);                            \
        declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT, void,       \
                          type *dst, const type *src,                       \
                          ptrdiff_t dst_linesize, ptrdiff_t src_linesize,   \
                          int block_w, int block_h, int src_x, int src_y,   \
                          int src_w, int src_h);                            \
        check_emu_edge_size(type, 16,  1, 64, 64);                          \
        check_emu_edge_size(type, 16, 16, 64, 64);                          \
        check_emu_edge_size(type, 64, 64, 64, 64);                          \
    } while (0)
80
81void checkasm_check_videodsp(void)
82{
83    VideoDSPContext vdsp;
84
85    ff_videodsp_init(&vdsp, 8);
86    if (check_func(vdsp.emulated_edge_mc, "emulated_edge_mc_8"))
87        check_emu_edge(uint8_t);
88
89    report("emulated_edge_mc");
90}
91