FFmpeg
cavsdsp.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12  * GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License along
15  * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
16  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
17  */
18 
19 #include <assert.h>
20 #include <stddef.h>
21 
22 #include "checkasm.h"
23 #include "libavutil/intreadwrite.h"
24 #include "libavutil/macros.h"
25 #include "libavutil/mem_internal.h"
26 #include "libavcodec/cavsdsp.h"
27 
28 
/**
 * Buffer geometry shared by the tests in this file.
 *
 * The two buffer sizes are derived from the accesses performed in
 * check_cavs_qpeldsp(); both are multiples of four, which
 * randomize_buffers() requires.
 */
enum {
// DECLARE_ALIGNED can't handle enum constants.
#define MAX_BLOCK_SIZE 16
    MAX_STRIDE = 64,
    /// BUF_SIZE is bigger than necessary in order to test strides > block width.
    /// It covers MAX_BLOCK_SIZE rows at MAX_STRIDE, the last row being only
    /// MAX_BLOCK_SIZE wide.
    BUF_SIZE = (MAX_BLOCK_SIZE - 1) * MAX_STRIDE + MAX_BLOCK_SIZE,
    /**
     * The qpel interpolation code accesses two lines above and three lines
     * below the actual src block; it also accesses two pixels to the left
     * and three to the right.
     * The input is not subject to alignment requirements; making the input buffer
     * bigger (by MAX_BLOCK_SIZE - 1) allows us to use a random misalignment.
     *
     * Layout: 2 leading pixels, (2 + MAX_BLOCK_SIZE - 1 + 3) strides,
     * a final row of MAX_BLOCK_SIZE + 3 pixels, plus the misalignment slack.
     */
    INPUT_BUF_SIZE = 2 + (2 + MAX_BLOCK_SIZE - 1 + 3) * MAX_STRIDE
                       + MAX_BLOCK_SIZE + 3 + (MAX_BLOCK_SIZE - 1),
};
44 
/**
 * Fill two byte arrays with identical random contents.
 *
 * Both arguments must be actual arrays (not pointers) of one-byte elements,
 * of equal size, and with a size that is a multiple of four; this is
 * enforced at compile time. Each group of four bytes is written with
 * AV_WN32A() from a single rnd() value, so both arrays receive the same
 * data.
 *
 * The arguments are parenthesized and the internal identifiers carry an
 * rb_ prefix and trailing underscore so that argument expressions cannot be
 * re-associated or captured by the expansion.
 */
#define randomize_buffers(buf0, buf1)                                        \
    do {                                                                     \
        static_assert(sizeof(buf0) == sizeof(buf1), "Incompatible buffers"); \
        static_assert(!(sizeof(buf0) % 4), "Tail handling needed");          \
        static_assert(sizeof((buf0)[0]) == 1 && sizeof((buf1)[0]) == 1,      \
                      "Pointer arithmetic needs to be adapted");             \
        for (size_t rb_pos_ = 0; rb_pos_ < sizeof(buf0); rb_pos_ += 4) {     \
            uint32_t rb_val_ = rnd();                                        \
            AV_WN32A((buf0) + rb_pos_, rb_val_);                             \
            AV_WN32A((buf1) + rb_pos_, rb_val_);                             \
        }                                                                    \
    } while (0)
57 
58 
59 static void check_cavs_qpeldsp(void)
60 {
61  DECLARE_ALIGNED(MAX_BLOCK_SIZE, uint8_t, srcbuf0)[INPUT_BUF_SIZE];
62  DECLARE_ALIGNED(MAX_BLOCK_SIZE, uint8_t, srcbuf1)[INPUT_BUF_SIZE];
63  DECLARE_ALIGNED(MAX_BLOCK_SIZE, uint8_t, dstbuf0)[BUF_SIZE];
64  DECLARE_ALIGNED(MAX_BLOCK_SIZE, uint8_t, dstbuf1)[BUF_SIZE];
65  CAVSDSPContext cavsdsp;
66  static const struct {
67  const char *name;
68  size_t offset;
69  } tests[] = {
70 #define TEST(NAME) { .name = #NAME, .offset = offsetof(CAVSDSPContext, NAME) }
71  TEST(put_cavs_qpel_pixels_tab),
72  TEST(avg_cavs_qpel_pixels_tab),
73  };
74  declare_func_emms(AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT, void, uint8_t *dst, const uint8_t *src, ptrdiff_t stride);
75 
76  ff_cavsdsp_init(&cavsdsp);
77 
78  for (size_t i = 0; i < FF_ARRAY_ELEMS(tests); ++i) {
79  qpel_mc_func (*func_tab)[16] = (qpel_mc_func (*)[16])((char*)&cavsdsp + tests[i].offset);
80  for (unsigned j = 0; j < 2; ++j) {
81  const unsigned blocksize = MAX_BLOCK_SIZE >> j;
82 
83  for (unsigned dxy = 0; dxy < 16; ++dxy) {
84  if (check_func(func_tab[j][dxy], "%s[%u][%u]", tests[i].name, j, dxy)) {
85  // Don't always use output that is 16-aligned.
86  size_t dst_offset = (rnd() % (MAX_BLOCK_SIZE / blocksize)) * blocksize;
87  ptrdiff_t stride = (rnd() % (MAX_STRIDE / blocksize) + 1) * blocksize;
88  size_t src_offset = 2 + 2 * stride + rnd() % MAX_BLOCK_SIZE;
89  const uint8_t *src0 = srcbuf0 + src_offset, *src1 = srcbuf1 + src_offset;
90  uint8_t *dst0 = dstbuf0 + dst_offset, *dst1 = dstbuf1 + dst_offset;
91 
92  if (rnd() & 1) {
93  // Flip stride.
94  dst1 += (blocksize - 1) * stride;
95  dst0 += (blocksize - 1) * stride;
96  // We need two lines above src and three lines below the block,
97  // hence blocksize * stride.
98  src0 += blocksize * stride;
99  src1 += blocksize * stride;
100  stride = -stride;
101  }
102 
103  randomize_buffers(srcbuf0, srcbuf1);
104  randomize_buffers(dstbuf0, dstbuf1);
105  call_ref(dst0, src0, stride);
106  call_new(dst1, src1, stride);
107  if (memcmp(srcbuf0, srcbuf1, sizeof(srcbuf0)) || memcmp(dstbuf0, dstbuf1, sizeof(dstbuf0)))
108  fail();
109  bench_new(dst0, src0, stride);
110  }
111  }
112  }
113  }
114 }
115 
117 {
119 }
declare_func_emms
#define declare_func_emms(cpu_flags, ret,...)
Definition: checkasm.h:203
name
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default minimum maximum flags name is the option name
Definition: writing_filters.txt:88
mem_internal.h
src1
const pixel * src1
Definition: h264pred_template.c:420
check_func
#define check_func(func,...)
Definition: checkasm.h:197
MAX_STRIDE
@ MAX_STRIDE
Definition: cavsdsp.c:32
INPUT_BUF_SIZE
@ INPUT_BUF_SIZE
The qpel interpolation code accesses two lines above and three lines below the actual src block; it a...
Definition: cavsdsp.c:42
call_ref
#define call_ref(...)
Definition: checkasm.h:212
func_tab
static const struct @67 func_tab[]
CAVSDSPContext
Definition: cavsdsp.h:30
macros.h
fail
#define fail()
Definition: checkasm.h:206
TEST
#define TEST(NAME)
checkasm.h
rnd
#define rnd()
Definition: checkasm.h:190
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
intreadwrite.h
MAX_BLOCK_SIZE
#define MAX_BLOCK_SIZE
Definition: cavsdsp.c:31
call_new
#define call_new(...)
Definition: checkasm.h:315
checkasm_check_cavsdsp
void checkasm_check_cavsdsp(void)
Definition: cavsdsp.c:116
qpel_mc_func
void(* qpel_mc_func)(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
Definition: qpeldsp.h:65
ff_cavsdsp_init
av_cold void ff_cavsdsp_init(CAVSDSPContext *c)
Definition: cavsdsp.c:550
DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Definition: mem_internal.h:104
dst
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
Definition: dsp.h:87
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
BUF_SIZE
@ BUF_SIZE
BUF_SIZE is bigger than necessary in order to test strides > block width.
Definition: cavsdsp.c:34
tests
const TestCase tests[]
Definition: fifo_muxer.c:363
bench_new
#define bench_new(...)
Definition: checkasm.h:400
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
randomize_buffers
#define randomize_buffers(buf0, buf1)
Definition: cavsdsp.c:45
check_cavs_qpeldsp
static void check_cavs_qpeldsp(void)
Definition: cavsdsp.c:59
stride
#define stride
Definition: h264pred_template.c:536
AV_CPU_FLAG_MMX
#define AV_CPU_FLAG_MMX
standard MMX
Definition: cpu.h:30
AV_CPU_FLAG_MMXEXT
#define AV_CPU_FLAG_MMXEXT
SSE integer functions or AMD MMX ext.
Definition: cpu.h:31
src0
const pixel *const src0
Definition: h264pred_template.c:419
src
#define src
Definition: vp8dsp.c:248
cavsdsp.h