FFmpeg
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Modules Pages
pixblockdsp.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include <stdint.h>
20 
21 #include "config.h"
22 #include "libavutil/attributes.h"
23 #include "libavutil/intreadwrite.h"
24 #include "pixblockdsp.h"
25 
/**
 * Fetch an 8-row block of high-bit-depth samples into a packed block.
 *
 * One AV_COPY128 is issued per row. Destination rows are 8 int16_t
 * (16 bytes) apart; source rows are `stride` bytes apart.
 * NOTE(review): AV_COPY128 is presumably a 128-bit copy with alignment
 * requirements on both pointers -- confirm in libavutil/intreadwrite.h.
 *
 * @param block  destination, 8 rows of 8 int16_t stored back to back
 * @param pixels address of the first source row
 * @param stride distance in bytes between consecutive source rows
 */
static void get_pixels_16_c(int16_t *restrict block, const uint8_t *pixels,
                            ptrdiff_t stride)
{
    for (int row = 0; row < 8; row++) {
        int16_t       *dst_row = block  + row * 8;
        const uint8_t *src_row = pixels + row * stride;

        AV_COPY128(dst_row, src_row);
    }
}
32 
/**
 * Variant of the high-bit-depth block fetch that uses AV_COPY128U.
 *
 * Eight rows are transferred, one AV_COPY128U per row. Destination rows
 * are 8 int16_t apart; source rows are `stride` bytes apart.
 * NOTE(review): the "U" suffix presumably means the copy tolerates
 * unaligned pointers -- confirm in libavutil/intreadwrite.h.
 *
 * @param block  destination, 8 rows of 8 int16_t stored back to back
 * @param pixels address of the first source row
 * @param stride distance in bytes between consecutive source rows
 */
static void get_pixels_unaligned_16_c(int16_t *restrict block,
                                      const uint8_t *pixels, ptrdiff_t stride)
{
    for (int row = 0; row < 8; row++) {
        AV_COPY128U(block + row * 8, pixels + row * stride);
    }
}
45 
/**
 * Widen an 8x8 block of 8-bit samples to int16_t.
 *
 * Row r of the source starts at pixels + r * stride; its first eight
 * bytes are stored, zero-extended, in block[r * 8 .. r * 8 + 7].
 *
 * @param block  destination, 64 int16_t in row-major order
 * @param pixels address of the first source row
 * @param stride distance in bytes between consecutive source rows
 */
static void get_pixels_8_c(int16_t *restrict block, const uint8_t *pixels,
                           ptrdiff_t stride)
{
    for (int row = 0; row < 8; row++) {
        const uint8_t *src_row = pixels + row * stride;
        int16_t       *dst_row = block  + row * 8;

        for (int col = 0; col < 8; col++)
            dst_row[col] = src_row[col];
    }
}
65 
/**
 * Compute the per-sample difference of two 8x8 blocks of 8-bit samples.
 *
 * For every row r and column k in 0..7:
 *     block[r * 8 + k] = s1[r * stride + k] - s2[r * stride + k]
 * Both sources are walked with the same stride.
 *
 * @param block  destination, 64 int16_t in row-major order
 * @param s1     address of the first row of the minuend block
 * @param s2     address of the first row of the subtrahend block
 * @param stride distance in bytes between consecutive rows of s1 and of s2
 */
static void diff_pixels_c(int16_t *restrict block, const uint8_t *s1,
                          const uint8_t *s2, ptrdiff_t stride)
{
    for (int row = 0; row < 8; row++) {
        const uint8_t *a   = s1 + row * stride;
        const uint8_t *b   = s2 + row * stride;
        int16_t       *out = block + row * 8;

        for (int col = 0; col < 8; col++)
            out[col] = a[col] - b[col];
    }
}
86 
87 av_cold void ff_pixblockdsp_init(PixblockDSPContext *c, int bits_per_raw_sample)
88 {
89  const unsigned high_bit_depth = bits_per_raw_sample > 8 &&
90  bits_per_raw_sample <= 16;
91 
92  c->diff_pixels_unaligned =
93  c->diff_pixels = diff_pixels_c;
94 
95  if (high_bit_depth) {
96  c->get_pixels_unaligned = get_pixels_unaligned_16_c;
97  c->get_pixels = get_pixels_16_c;
98  } else {
99  c->get_pixels_unaligned =
100  c->get_pixels = get_pixels_8_c;
101  }
102 
103 #if ARCH_AARCH64
104  ff_pixblockdsp_init_aarch64(c, high_bit_depth);
105 #elif ARCH_ARM
106  ff_pixblockdsp_init_arm(c, high_bit_depth);
107 #elif ARCH_PPC
108  ff_pixblockdsp_init_ppc(c, high_bit_depth);
109 #elif ARCH_RISCV
110  ff_pixblockdsp_init_riscv(c, high_bit_depth);
111 #elif ARCH_X86
112  ff_pixblockdsp_init_x86(c, high_bit_depth);
113 #elif ARCH_MIPS
114  ff_pixblockdsp_init_mips(c, high_bit_depth);
115 #endif
116 }
get_pixels_unaligned_16_c
static void get_pixels_unaligned_16_c(int16_t *restrict block, const uint8_t *pixels, ptrdiff_t stride)
Definition: pixblockdsp.c:33
av_cold
#define av_cold
Definition: attributes.h:90
ff_pixblockdsp_init_riscv
void ff_pixblockdsp_init_riscv(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp_init.c:43
intreadwrite.h
ff_pixblockdsp_init_aarch64
av_cold void ff_pixblockdsp_init_aarch64(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp_init_aarch64.c:31
get_pixels_8_c
static void get_pixels_8_c(int16_t *restrict block, const uint8_t *pixels, ptrdiff_t stride)
Definition: pixblockdsp.c:46
get_pixels_16_c
static void get_pixels_16_c(int16_t *restrict block, const uint8_t *pixels, ptrdiff_t stride)
Definition: pixblockdsp.c:26
PixblockDSPContext
Definition: pixblockdsp.h:28
AV_COPY128
#define AV_COPY128(d, s)
Definition: intreadwrite.h:642
AV_COPY128U
#define AV_COPY128U(d, s)
Definition: intreadwrite.h:615
c
Undefined Behavior: In the C language, some operations are undefined, like signed integer overflow, dereferencing freed pointers, accessing outside allocated space, ... Undefined Behavior must not occur in a C program; it is not safe even if the output of undefined operations is unused. The unsafety may seem nit picking, but optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs. Optimizing code based on wrong assumptions can and has in some cases led to effects beyond the output of computations. The signed integer overflow problem in speed critical code: Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
Definition: undefined.txt:32
ff_pixblockdsp_init_x86
void ff_pixblockdsp_init_x86(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp_init.c:30
ff_pixblockdsp_init_arm
av_cold void ff_pixblockdsp_init_arm(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp_init_arm.c:40
attributes.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
stride
#define stride
Definition: h264pred_template.c:536
ff_pixblockdsp_init
av_cold void ff_pixblockdsp_init(PixblockDSPContext *c, int bits_per_raw_sample)
Definition: pixblockdsp.c:87
ff_pixblockdsp_init_mips
void ff_pixblockdsp_init_mips(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp_init_mips.c:26
diff_pixels_c
static void diff_pixels_c(int16_t *restrict block, const uint8_t *s1, const uint8_t *s2, ptrdiff_t stride)
Definition: pixblockdsp.c:66
ff_pixblockdsp_init_ppc
av_cold void ff_pixblockdsp_init_ppc(PixblockDSPContext *c, unsigned high_bit_depth)
Definition: pixblockdsp.c:264
block
The exact code depends on how similar the blocks are and how related they are to the block
Definition: filter_design.txt:207
pixblockdsp.h