33 #define MAX_ABS (512 >> (SCALE_OFFSET>0 ? SCALE_OFFSET : 0))
35 static int DEF(try_8x8basis)(int16_t rem[64], int16_t
weight[64], int16_t
basis[64],
int scale)
44 "pxor %%mm7, %%mm7 \n\t"
46 "punpcklwd %%mm5, %%mm5 \n\t"
47 "punpcklwd %%mm5, %%mm5 \n\t"
50 "movq (%1, %0), %%mm0 \n\t"
51 "movq 8(%1, %0), %%mm1 \n\t"
52 PMULHRW(%%mm0, %%mm1, %%mm5, %%mm6)
53 "paddw (%2, %0), %%mm0 \n\t"
54 "paddw 8(%2, %0), %%mm1 \n\t"
55 "psraw $6, %%mm0 \n\t"
56 "psraw $6, %%mm1 \n\t"
57 "pmullw (%3, %0), %%mm0 \n\t"
58 "pmullw 8(%3, %0), %%mm1 \n\t"
59 "pmaddwd %%mm0, %%mm0 \n\t"
60 "pmaddwd %%mm1, %%mm1 \n\t"
61 "paddd %%mm1, %%mm0 \n\t"
62 "psrld $4, %%mm0 \n\t"
63 "paddd %%mm0, %%mm7 \n\t"
68 "psrld $2, %%mm7 \n\t"
77 static void DEF(add_8x8basis)(int16_t rem[64], int16_t
basis[64],
int scale)
86 "punpcklwd %%mm5, %%mm5 \n\t"
87 "punpcklwd %%mm5, %%mm5 \n\t"
90 "movq (%1, %0), %%mm0 \n\t"
91 "movq 8(%1, %0), %%mm1 \n\t"
92 PMULHRW(%%mm0, %%mm1, %%mm5, %%mm6)
93 "paddw (%2, %0), %%mm0 \n\t"
94 "paddw 8(%2, %0), %%mm1 \n\t"
95 "movq %%mm0, (%2, %0) \n\t"
96 "movq %%mm1, 8(%2, %0) \n\t"
102 :
"r"(
basis),
"r"(rem),
"g"(scale)
105 for(
i=0;
i<8*8;
i++){