Go to the documentation of this file.
   31 extern const int16_t ff_filters_16bpp[3][15][4][16];
 
   40 #if HAVE_AVX2_EXTERNAL 
   47 #if HAVE_AVX2_EXTERNAL 
   58 #if HAVE_AVX2_EXTERNAL 
   67 #define decl_lpf_func(dir, wd, bpp, opt) \ 
   68 void ff_vp9_loop_filter_##dir##_##wd##_##bpp##_##opt(uint8_t *dst, ptrdiff_t stride, \ 
   71 #define decl_lpf_funcs(dir, wd, bpp) \ 
   72 decl_lpf_func(dir, wd, bpp, sse2); \ 
   73 decl_lpf_func(dir, wd, bpp, ssse3); \ 
   74 decl_lpf_func(dir, wd, bpp, avx) 
   76 #define decl_lpf_funcs_wd(dir) \ 
   77 decl_lpf_funcs(dir,  4, BPC); \ 
   78 decl_lpf_funcs(dir,  8, BPC); \ 
   79 decl_lpf_funcs(dir, 16, BPC) 
   84 #define lpf_16_wrapper(dir, off, bpp, opt) \ 
   85 static void loop_filter_##dir##_16_##bpp##_##opt(uint8_t *dst, ptrdiff_t stride, \ 
   86                                                  int E, int I, int H) \ 
   88     ff_vp9_loop_filter_##dir##_16_##bpp##_##opt(dst,       stride, E, I, H); \ 
   89     ff_vp9_loop_filter_##dir##_16_##bpp##_##opt(dst + off, stride, E, I, H); \ 
   92 #define lpf_16_wrappers(bpp, opt) \ 
   93 lpf_16_wrapper(h, 8 * stride, bpp, opt) \ 
   94 lpf_16_wrapper(v, 16,         bpp, opt) 
   96 lpf_16_wrappers(
BPC, sse2)
 
   97 lpf_16_wrappers(
BPC, ssse3)
 
   98 lpf_16_wrappers(
BPC, avx)
 
  100 #define lpf_mix2_wrapper(dir, off, wd1, wd2, bpp, opt) \ 
  101 static void loop_filter_##dir##_##wd1##wd2##_##bpp##_##opt(uint8_t *dst, ptrdiff_t stride, \ 
  102                                                            int E, int I, int H) \ 
  104     ff_vp9_loop_filter_##dir##_##wd1##_##bpp##_##opt(dst,       stride, \ 
  105                                                      E & 0xff, I & 0xff, H & 0xff); \ 
  106     ff_vp9_loop_filter_##dir##_##wd2##_##bpp##_##opt(dst + off, stride, \ 
  107                                                      E >> 8,   I >> 8,   H >> 8); \ 
  110 #define lpf_mix2_wrappers(wd1, wd2, bpp, opt) \ 
  111 lpf_mix2_wrapper(h, 8 * stride, wd1, wd2, bpp, opt) \ 
  112 lpf_mix2_wrapper(v, 16,         wd1, wd2, bpp, opt) 
  114 #define lpf_mix2_wrappers_set(bpp, opt) \ 
  115 lpf_mix2_wrappers(4, 4, bpp, opt) \ 
  116 lpf_mix2_wrappers(4, 8, bpp, opt) \ 
  117 lpf_mix2_wrappers(8, 4, bpp, opt) \ 
  118 lpf_mix2_wrappers(8, 8, bpp, opt) \ 
  120 lpf_mix2_wrappers_set(
BPC, sse2)
 
  121 lpf_mix2_wrappers_set(
BPC, ssse3)
 
  122 lpf_mix2_wrappers_set(
BPC, avx)
 
  146 #define init_lpf_8_func(idx1, idx2, dir, wd, bpp, opt) \ 
  147     dsp->loop_filter_8[idx1][idx2] = ff_vp9_loop_filter_##dir##_##wd##_##bpp##_##opt 
  148 #define init_lpf_16_func(idx, dir, bpp, opt) \ 
  149     dsp->loop_filter_16[idx] = loop_filter_##dir##_16_##bpp##_##opt 
  150 #define init_lpf_mix2_func(idx1, idx2, idx3, dir, wd1, wd2, bpp, opt) \ 
  151     dsp->loop_filter_mix2[idx1][idx2][idx3] = loop_filter_##dir##_##wd1##wd2##_##bpp##_##opt 
  153 #define init_lpf_funcs(bpp, opt) \ 
  154     init_lpf_8_func(0, 0, h,  4, bpp, opt); \ 
  155     init_lpf_8_func(0, 1, v,  4, bpp, opt); \ 
  156     init_lpf_8_func(1, 0, h,  8, bpp, opt); \ 
  157     init_lpf_8_func(1, 1, v,  8, bpp, opt); \ 
  158     init_lpf_8_func(2, 0, h, 16, bpp, opt); \ 
  159     init_lpf_8_func(2, 1, v, 16, bpp, opt); \ 
  160     init_lpf_16_func(0, h, bpp, opt); \ 
  161     init_lpf_16_func(1, v, bpp, opt); \ 
  162     init_lpf_mix2_func(0, 0, 0, h, 4, 4, bpp, opt); \ 
  163     init_lpf_mix2_func(0, 1, 0, h, 4, 8, bpp, opt); \ 
  164     init_lpf_mix2_func(1, 0, 0, h, 8, 4, bpp, opt); \ 
  165     init_lpf_mix2_func(1, 1, 0, h, 8, 8, bpp, opt); \ 
  166     init_lpf_mix2_func(0, 0, 1, v, 4, 4, bpp, opt); \ 
  167     init_lpf_mix2_func(0, 1, 1, v, 4, 8, bpp, opt); \ 
  168     init_lpf_mix2_func(1, 0, 1, v, 8, 4, bpp, opt); \ 
  169     init_lpf_mix2_func(1, 1, 1, v, 8, 8, bpp, opt) 
  171 #define init_itx_func(idxa, idxb, typea, typeb, size, bpp, opt) \ 
  172     dsp->itxfm_add[idxa][idxb] = \ 
  173         cat(ff_vp9_##typea##_##typeb##_##size##x##size##_add_, bpp, _##opt); 
  174 #define init_itx_func_one(idx, typea, typeb, size, bpp, opt) \ 
  175     init_itx_func(idx, DCT_DCT,   typea, typeb, size, bpp, opt); \ 
  176     init_itx_func(idx, ADST_DCT,  typea, typeb, size, bpp, opt); \ 
  177     init_itx_func(idx, DCT_ADST,  typea, typeb, size, bpp, opt); \ 
  178     init_itx_func(idx, ADST_ADST, typea, typeb, size, bpp, opt) 
  179 #define init_itx_funcs(idx, size, bpp, opt) \ 
  180     init_itx_func(idx, DCT_DCT,   idct,  idct,  size, bpp, opt); \ 
  181     init_itx_func(idx, ADST_DCT,  idct,  iadst, size, bpp, opt); \ 
  182     init_itx_func(idx, DCT_ADST,  iadst, idct,  size, bpp, opt); \ 
  183     init_itx_func(idx, ADST_ADST, iadst, iadst, size, bpp, opt); \ 
  188             init_itx_func_one(4 , iwht, iwht, 4, 
BPC, mmxext);
 
  198         init_lpf_funcs(
BPC, sse2);
 
  207         init_itx_funcs(
TX_4X4, 4, 12, sse2);
 
  215         init_lpf_funcs(
BPC, ssse3);
 
  224         init_lpf_funcs(
BPC, avx);
 
  228 #if HAVE_AVX2_EXTERNAL 
  
av_cold void INIT_FUNC(VP9DSPContext *dsp, int bitexact)
 
#define EXTERNAL_AVX2_FAST(flags)
 
#define init_8_16_32_ipred_funcs(type, enum, bpp, opt)
 
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
 
static atomic_int cpu_flags
 
#define filters_8tap_1d_fn3(op, bpp, opt4, opt8, f_opt)
 
static void idct(int16_t block[64])
 
#define decl_mc_funcs(sz, bpp)
 
#define decl_itxfm_func(typea, typeb, size, bpp, opt)
 
#define decl_itxfm_funcs(size, bpp, opt)
 
#define init_subpel3_32_64(idx, type, bpp, opt)
 
#define decl_ipred_fns(type, bpp, opt4, opt8_16_32)
 
#define filters_8tap_2d_fn2(op, align, bpp, bytes, opt4, opt8, f_opt)
 
void ff_vp9dsp_init_16bpp_x86(VP9DSPContext *dsp)
 
#define init_subpel3(idx, type)
 
#define EXTERNAL_SSE2(flags)
 
#define filters_8tap_2d_fn(op, sz, align, bpp, bytes, opt, f_opt)
 
#define filters_8tap_1d_fn2(op, sz, bpp, opt, f_opt)
 
#define init_ipred_func(type, enum, sz, bpp, opt)
 
#define mc_rep_funcs(name, bitd, step, W, opt)
 
#define EXTERNAL_AVX(flags)
 
#define EXTERNAL_SSSE3(flags)
 
#define EXTERNAL_MMXEXT(flags)
 
#define init_subpel2(idx, idxh, idxv, dir, type)