38 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1,
39 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4,
40 5, 5, 6, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 20, 22, 24
44 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, 7, 8,
45 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36,
46 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, 58, 60, 62, 64
51 static const int qp_c[] = {
52 29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37
54 int qp, qp_i,
offset, idxt;
58 offset =
s->ps.pps->cb_qp_offset;
60 offset =
s->ps.pps->cr_qp_offset;
62 qp_i = av_clip(qp_y +
offset, 0, 57);
63 if (
s->ps.sps->chroma_format_idc == 1) {
71 qp = av_clip(qp_i, 0, 51);
81 int ctb_size_mask = (1 <<
s->ps.sps->log2_ctb_size) - 1;
82 int MinCuQpDeltaSizeMask = (1 << (
s->ps.sps->log2_ctb_size -
83 s->ps.pps->diff_cu_qp_delta_depth)) - 1;
84 int xQgBase = xBase - (xBase & MinCuQpDeltaSizeMask);
85 int yQgBase = yBase - (yBase & MinCuQpDeltaSizeMask);
86 int min_cb_width =
s->ps.sps->min_cb_width;
87 int x_cb = xQgBase >>
s->ps.sps->log2_min_cb_size;
88 int y_cb = yQgBase >>
s->ps.sps->log2_min_cb_size;
89 int availableA = (xBase & ctb_size_mask) &&
90 (xQgBase & ctb_size_mask);
91 int availableB = (yBase & ctb_size_mask) &&
92 (yQgBase & ctb_size_mask);
93 int qPy_pred, qPy_a, qPy_b;
98 qPy_pred =
s->sh.slice_qp;
107 qPy_a =
s->qp_y_tab[(x_cb - 1) + y_cb * min_cb_width];
113 qPy_b =
s->qp_y_tab[x_cb + (y_cb - 1) * min_cb_width];
115 av_assert2(qPy_a >= -
s->ps.sps->qp_bd_offset && qPy_a < 52);
116 av_assert2(qPy_b >= -
s->ps.sps->qp_bd_offset && qPy_b < 52);
118 return (qPy_a + qPy_b + 1) >> 1;
125 if (
s->HEVClc->tu.cu_qp_delta != 0) {
126 int off =
s->ps.sps->qp_bd_offset;
127 s->HEVClc->qp_y =
FFUMOD(qp_y +
s->HEVClc->tu.cu_qp_delta + 52 + 2 * off,
130 s->HEVClc->qp_y = qp_y;
135 int log2_min_cb_size =
s->ps.sps->log2_min_cb_size;
136 int x = xC >> log2_min_cb_size;
137 int y = yC >> log2_min_cb_size;
138 return s->qp_y_tab[x + y *
s->ps.sps->min_cb_width];
142 ptrdiff_t stride_dst, ptrdiff_t stride_src)
146 if (((intptr_t)dst | (intptr_t)
src | stride_dst | stride_src) & 15) {
148 for (j = 0; j <
width; j+=8)
155 for (j = 0; j <
width; j+=16)
166 *(uint16_t *)dst = *(uint16_t *)
src;
172 int pixel_shift,
int height,
173 ptrdiff_t stride_dst, ptrdiff_t stride_src)
176 if (pixel_shift == 0) {
184 *(uint16_t *)dst = *(uint16_t *)
src;
192 ptrdiff_t stride_src,
int x,
int y,
int width,
int height,
193 int c_idx,
int x_ctb,
int y_ctb)
195 int sh =
s->ps.sps->pixel_shift;
196 int w =
s->ps.sps->width >>
s->ps.sps->hshift[c_idx];
197 int h =
s->ps.sps->height >>
s->ps.sps->vshift[c_idx];
200 memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb) *
w + x) << sh),
202 memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 1) *
w + x) << sh),
206 copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb) *
h + y) << sh),
src, sh,
height, 1 << sh, stride_src);
208 copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 1) *
h + y) << sh),
src + ((
width - 1) << sh), sh,
height, 1 << sh, stride_src);
213 ptrdiff_t stride_src, ptrdiff_t stride_dst,
216 if (
s->ps.pps->transquant_bypass_enable_flag ||
217 (
s->ps.sps->pcm.loop_filter_disable_flag &&
s->ps.sps->pcm_enabled_flag)) {
219 int min_pu_size = 1 <<
s->ps.sps->log2_min_pu_size;
220 int hshift =
s->ps.sps->hshift[c_idx];
221 int vshift =
s->ps.sps->vshift[c_idx];
222 int x_min = ((x0 ) >>
s->ps.sps->log2_min_pu_size);
223 int y_min = ((y0 ) >>
s->ps.sps->log2_min_pu_size);
224 int x_max = ((x0 +
width ) >>
s->ps.sps->log2_min_pu_size);
225 int y_max = ((y0 +
height) >>
s->ps.sps->log2_min_pu_size);
226 int len = (min_pu_size >> hshift) <<
s->ps.sps->pixel_shift;
227 for (y = y_min; y < y_max; y++) {
228 for (x = x_min; x < x_max; x++) {
229 if (
s->is_pcm[y *
s->ps.sps->min_pu_width + x]) {
231 uint8_t *
src =
src1 + (((y <<
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_src + ((((x <<
s->ps.sps->log2_min_pu_size) - x0) >> hshift) <<
s->ps.sps->pixel_shift);
232 const uint8_t *dst = dst1 + (((y <<
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_dst + ((((x <<
s->ps.sps->log2_min_pu_size) - x0) >> hshift) <<
s->ps.sps->pixel_shift);
233 for (n = 0; n < (min_pu_size >> vshift); n++) {
244 #define CTB(tab, x, y) ((tab)[(y) * s->ps.sps->ctb_width + (x)])
248 static const uint8_t sao_tab[8] = { 0, 1, 2, 2, 3, 3, 4, 4 };
252 int x_ctb = x >>
s->ps.sps->log2_ctb_size;
253 int y_ctb = y >>
s->ps.sps->log2_ctb_size;
254 int ctb_addr_rs = y_ctb *
s->ps.sps->ctb_width + x_ctb;
255 int ctb_addr_ts =
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs];
258 uint8_t vert_edge[] = { 0, 0 };
259 uint8_t horiz_edge[] = { 0, 0 };
260 uint8_t diag_edge[] = { 0, 0, 0, 0 };
261 uint8_t lfase =
CTB(
s->filter_slice_edges, x_ctb, y_ctb);
262 uint8_t no_tile_filter =
s->ps.pps->tiles_enabled_flag &&
263 !
s->ps.pps->loop_filter_across_tiles_enabled_flag;
264 uint8_t restore = no_tile_filter || !lfase;
270 edges[0] = x_ctb == 0;
271 edges[1] = y_ctb == 0;
272 edges[2] = x_ctb ==
s->ps.sps->ctb_width - 1;
273 edges[3] = y_ctb ==
s->ps.sps->ctb_height - 1;
277 left_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs-1]];
278 vert_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb)) || left_tile_edge;
281 right_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs+1]];
282 vert_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb)) || right_tile_edge;
285 up_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs -
s->ps.sps->ctb_width]];
286 horiz_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb, y_ctb - 1)) || up_tile_edge;
289 bottom_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs +
s->ps.sps->ctb_width]];
290 horiz_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb, y_ctb + 1)) || bottom_tile_edge;
292 if (!edges[0] && !edges[1]) {
293 diag_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb - 1)) || left_tile_edge || up_tile_edge;
295 if (!edges[1] && !edges[2]) {
296 diag_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb - 1)) || right_tile_edge || up_tile_edge;
298 if (!edges[2] && !edges[3]) {
299 diag_edge[2] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb + 1)) || right_tile_edge || bottom_tile_edge;
301 if (!edges[0] && !edges[3]) {
302 diag_edge[3] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb + 1)) || left_tile_edge || bottom_tile_edge;
306 for (c_idx = 0; c_idx < (
s->ps.sps->chroma_format_idc ? 3 : 1); c_idx++) {
307 int x0 = x >>
s->ps.sps->hshift[c_idx];
308 int y0 = y >>
s->ps.sps->vshift[c_idx];
309 ptrdiff_t stride_src =
s->frame->linesize[c_idx];
310 int ctb_size_h = (1 << (
s->ps.sps->log2_ctb_size)) >>
s->ps.sps->hshift[c_idx];
311 int ctb_size_v = (1 << (
s->ps.sps->log2_ctb_size)) >>
s->ps.sps->vshift[c_idx];
312 int width =
FFMIN(ctb_size_h, (
s->ps.sps->width >>
s->ps.sps->hshift[c_idx]) - x0);
313 int height =
FFMIN(ctb_size_v, (
s->ps.sps->height >>
s->ps.sps->vshift[c_idx]) - y0);
315 uint8_t *
src = &
s->frame->data[c_idx][y0 * stride_src + (x0 <<
s->ps.sps->pixel_shift)];
316 ptrdiff_t stride_dst;
323 if (
s->ps.pps->transquant_bypass_enable_flag ||
324 (
s->ps.sps->pcm.loop_filter_disable_flag &&
s->ps.sps->pcm_enabled_flag)) {
328 s->hevcdsp.sao_band_filter[
tab](
src, dst, stride_src, stride_dst,
334 s->hevcdsp.sao_band_filter[
tab](
src,
src, stride_src, stride_src,
342 int w =
s->ps.sps->width >>
s->ps.sps->hshift[c_idx];
343 int h =
s->ps.sps->height >>
s->ps.sps->vshift[c_idx];
344 int left_edge = edges[0];
345 int top_edge = edges[1];
346 int right_edge = edges[2];
347 int bottom_edge = edges[3];
348 int sh =
s->ps.sps->pixel_shift;
349 int left_pixels, right_pixels;
355 int left = 1 - left_edge;
356 int right = 1 - right_edge;
361 dst1 = dst - stride_dst - (
left << sh);
363 src1[1] =
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb - 1) *
w + x0 -
left) << sh);
366 src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb-1).type_idx[c_idx] ==
371 src_idx = (
CTB(
s->sao, x_ctb, y_ctb-1).type_idx[c_idx] ==
376 src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb-1).type_idx[c_idx] ==
382 int left = 1 - left_edge;
383 int right = 1 - right_edge;
388 dst1 = dst +
height * stride_dst - (
left << sh);
390 src1[1] =
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 2) *
w + x0 -
left) << sh);
393 src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb+1).type_idx[c_idx] ==
398 src_idx = (
CTB(
s->sao, x_ctb, y_ctb+1).type_idx[c_idx] ==
403 src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb+1).type_idx[c_idx] ==
412 s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb - 1) *
h + y0) << sh),
413 sh,
height, stride_dst, 1 << sh);
422 s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 2) *
h + y0) << sh),
423 sh,
height, stride_dst, 1 << sh);
430 src - (left_pixels << sh),
431 (
width + left_pixels + right_pixels) << sh,
432 height, stride_dst, stride_src);
438 s->hevcdsp.sao_edge_restore[restore](
src, dst,
439 stride_src, stride_dst,
457 int log2_min_pu_size =
s->ps.sps->log2_min_pu_size;
463 x_pu = x >> log2_min_pu_size;
464 y_pu = y >> log2_min_pu_size;
466 if (x_pu >=
s->ps.sps->min_pu_width || y_pu >=
s->ps.sps->min_pu_height)
468 return s->is_pcm[y_pu *
s->ps.sps->min_pu_width + x_pu];
471 #define TC_CALC(qp, bs) \
472 tctable[av_clip((qp) + DEFAULT_INTRA_TC_OFFSET * ((bs) - 1) + \
474 0, MAX_QP + DEFAULT_INTRA_TC_OFFSET)]
485 int log2_ctb_size =
s->ps.sps->log2_ctb_size;
486 int x_end, x_end2, y_end;
487 int ctb_size = 1 << log2_ctb_size;
488 int ctb = (x0 >> log2_ctb_size) +
489 (y0 >> log2_ctb_size) *
s->ps.sps->ctb_width;
490 int cur_tc_offset =
s->deblock[ctb].tc_offset;
491 int cur_beta_offset =
s->deblock[ctb].beta_offset;
492 int left_tc_offset, left_beta_offset;
493 int tc_offset, beta_offset;
494 int pcmf = (
s->ps.sps->pcm_enabled_flag &&
495 s->ps.sps->pcm.loop_filter_disable_flag) ||
496 s->ps.pps->transquant_bypass_enable_flag;
499 left_tc_offset =
s->deblock[ctb - 1].tc_offset;
500 left_beta_offset =
s->deblock[ctb - 1].beta_offset;
503 left_beta_offset = 0;
506 x_end = x0 + ctb_size;
507 if (x_end >
s->ps.sps->width)
508 x_end =
s->ps.sps->width;
509 y_end = y0 + ctb_size;
510 if (y_end >
s->ps.sps->height)
511 y_end =
s->ps.sps->height;
513 tc_offset = cur_tc_offset;
514 beta_offset = cur_beta_offset;
517 if (x_end2 !=
s->ps.sps->width)
519 for (y = y0; y < y_end; y += 8) {
521 for (x = x0 ? x0 : 8; x < x_end; x += 8) {
522 const int bs0 =
s->vertical_bs[(x + y *
s->bs_width) >> 2];
523 const int bs1 =
s->vertical_bs[(x + (y + 4) *
s->bs_width) >> 2];
531 src = &
s->frame->data[
LUMA][y *
s->frame->linesize[
LUMA] + (x <<
s->ps.sps->pixel_shift)];
537 s->hevcdsp.hevc_v_loop_filter_luma_c(
src,
538 s->frame->linesize[
LUMA],
539 beta,
tc, no_p, no_q);
541 s->hevcdsp.hevc_v_loop_filter_luma(
src,
542 s->frame->linesize[
LUMA],
543 beta,
tc, no_p, no_q);
551 for (x = x0 ? x0 - 8 : 0; x < x_end2; x += 8) {
552 const int bs0 =
s->horizontal_bs[( x + y *
s->bs_width) >> 2];
553 const int bs1 =
s->horizontal_bs[((x + 4) + y *
s->bs_width) >> 2];
557 tc_offset = x >= x0 ? cur_tc_offset : left_tc_offset;
558 beta_offset = x >= x0 ? cur_beta_offset : left_beta_offset;
563 src = &
s->frame->data[
LUMA][y *
s->frame->linesize[
LUMA] + (x <<
s->ps.sps->pixel_shift)];
569 s->hevcdsp.hevc_h_loop_filter_luma_c(
src,
570 s->frame->linesize[
LUMA],
571 beta,
tc, no_p, no_q);
573 s->hevcdsp.hevc_h_loop_filter_luma(
src,
574 s->frame->linesize[
LUMA],
575 beta,
tc, no_p, no_q);
580 if (
s->ps.sps->chroma_format_idc) {
582 int h = 1 <<
s->ps.sps->hshift[
chroma];
583 int v = 1 <<
s->ps.sps->vshift[
chroma];
586 for (y = y0; y < y_end; y += (8 * v)) {
587 for (x = x0 ? x0 : 8 *
h; x < x_end; x += (8 *
h)) {
588 const int bs0 =
s->vertical_bs[(x + y *
s->bs_width) >> 2];
589 const int bs1 =
s->vertical_bs[(x + (y + (4 * v)) *
s->bs_width) >> 2];
591 if ((bs0 == 2) || (bs1 == 2)) {
593 const int qp1 = (
get_qPy(
s, x - 1, y + (4 * v)) +
get_qPy(
s, x, y + (4 * v)) + 1) >> 1;
597 src = &
s->frame->data[
chroma][(y >>
s->ps.sps->vshift[
chroma]) *
s->frame->linesize[
chroma] + ((x >>
s->ps.sps->hshift[
chroma]) <<
s->ps.sps->pixel_shift)];
600 no_p[1] =
get_pcm(
s, x - 1, y + (4 * v));
602 no_q[1] =
get_pcm(
s, x, y + (4 * v));
603 s->hevcdsp.hevc_v_loop_filter_chroma_c(
src,
607 s->hevcdsp.hevc_v_loop_filter_chroma(
src,
617 tc_offset = x0 ? left_tc_offset : cur_tc_offset;
619 if (x_end !=
s->ps.sps->width)
620 x_end2 = x_end - 8 *
h;
621 for (x = x0 ? x0 - 8 *
h : 0; x < x_end2; x += (8 *
h)) {
622 const int bs0 =
s->horizontal_bs[( x + y *
s->bs_width) >> 2];
623 const int bs1 =
s->horizontal_bs[((x + 4 *
h) + y *
s->bs_width) >> 2];
624 if ((bs0 == 2) || (bs1 == 2)) {
625 const int qp0 = bs0 == 2 ? (
get_qPy(
s, x, y - 1) +
get_qPy(
s, x, y) + 1) >> 1 : 0;
626 const int qp1 = bs1 == 2 ? (
get_qPy(
s, x + (4 *
h), y - 1) +
get_qPy(
s, x + (4 *
h), y) + 1) >> 1 : 0;
630 src = &
s->frame->data[
chroma][(y >>
s->ps.sps->vshift[1]) *
s->frame->linesize[
chroma] + ((x >>
s->ps.sps->hshift[1]) <<
s->ps.sps->pixel_shift)];
633 no_p[1] =
get_pcm(
s, x + (4 *
h), y - 1);
636 s->hevcdsp.hevc_h_loop_filter_chroma_c(
src,
640 s->hevcdsp.hevc_h_loop_filter_chroma(
src,
655 if (
s->ref->refPicList[0].list[curr->
ref_idx[0]] == neigh_refPicList[0].
list[neigh->
ref_idx[0]] &&
656 s->ref->refPicList[0].list[curr->
ref_idx[0]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]] &&
665 }
else if (neigh_refPicList[0].
list[neigh->
ref_idx[0]] ==
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
666 neigh_refPicList[1].
list[neigh->
ref_idx[1]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
672 }
else if (neigh_refPicList[1].
list[neigh->
ref_idx[1]] ==
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
673 neigh_refPicList[0].
list[neigh->
ref_idx[0]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
688 ref_A =
s->ref->refPicList[0].list[curr->
ref_idx[0]];
691 ref_A =
s->ref->refPicList[1].list[curr->
ref_idx[1]];
696 ref_B = neigh_refPicList[0].
list[neigh->
ref_idx[0]];
699 ref_B = neigh_refPicList[1].
list[neigh->
ref_idx[1]];
702 if (ref_A == ref_B) {
719 int log2_min_pu_size =
s->ps.sps->log2_min_pu_size;
720 int log2_min_tu_size =
s->ps.sps->log2_min_tb_size;
721 int min_pu_width =
s->ps.sps->min_pu_width;
722 int min_tu_width =
s->ps.sps->min_tb_width;
723 int is_intra = tab_mvf[(y0 >> log2_min_pu_size) * min_pu_width +
725 int boundary_upper, boundary_left;
728 boundary_upper = y0 > 0 && !(y0 & 7);
729 if (boundary_upper &&
730 ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
732 (y0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0) ||
733 (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
735 (y0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0)))
738 if (boundary_upper) {
742 int yp_pu = (y0 - 1) >> log2_min_pu_size;
743 int yq_pu = y0 >> log2_min_pu_size;
744 int yp_tu = (y0 - 1) >> log2_min_tu_size;
745 int yq_tu = y0 >> log2_min_tu_size;
747 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
748 int x_pu = (x0 +
i) >> log2_min_pu_size;
749 int x_tu = (x0 +
i) >> log2_min_tu_size;
750 MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu];
751 MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
752 uint8_t top_cbf_luma =
s->cbf_luma[yp_tu * min_tu_width + x_tu];
753 uint8_t curr_cbf_luma =
s->cbf_luma[yq_tu * min_tu_width + x_tu];
757 else if (curr_cbf_luma || top_cbf_luma)
761 s->horizontal_bs[((x0 +
i) + y0 *
s->bs_width) >> 2] = bs;
766 boundary_left = x0 > 0 && !(x0 & 7);
768 ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
770 (x0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0) ||
771 (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
773 (x0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0)))
780 int xp_pu = (x0 - 1) >> log2_min_pu_size;
781 int xq_pu = x0 >> log2_min_pu_size;
782 int xp_tu = (x0 - 1) >> log2_min_tu_size;
783 int xq_tu = x0 >> log2_min_tu_size;
785 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
786 int y_pu = (y0 +
i) >> log2_min_pu_size;
787 int y_tu = (y0 +
i) >> log2_min_tu_size;
788 MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
789 MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
790 uint8_t left_cbf_luma =
s->cbf_luma[y_tu * min_tu_width + xp_tu];
791 uint8_t curr_cbf_luma =
s->cbf_luma[y_tu * min_tu_width + xq_tu];
795 else if (curr_cbf_luma || left_cbf_luma)
799 s->vertical_bs[(x0 + (y0 +
i) *
s->bs_width) >> 2] = bs;
803 if (log2_trafo_size > log2_min_pu_size && !is_intra) {
807 for (j = 8; j < (1 << log2_trafo_size); j += 8) {
808 int yp_pu = (y0 + j - 1) >> log2_min_pu_size;
809 int yq_pu = (y0 + j) >> log2_min_pu_size;
811 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
812 int x_pu = (x0 +
i) >> log2_min_pu_size;
813 MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu];
814 MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
817 s->horizontal_bs[((x0 +
i) + (y0 + j) *
s->bs_width) >> 2] = bs;
822 for (j = 0; j < (1 << log2_trafo_size); j += 4) {
823 int y_pu = (y0 + j) >> log2_min_pu_size;
825 for (
i = 8;
i < (1 << log2_trafo_size);
i += 8) {
826 int xp_pu = (x0 +
i - 1) >> log2_min_pu_size;
827 int xq_pu = (x0 +
i) >> log2_min_pu_size;
828 MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
829 MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
832 s->vertical_bs[((x0 +
i) + (y0 + j) *
s->bs_width) >> 2] = bs;
844 int x_end = x >=
s->ps.sps->width - ctb_size;
858 if (
s->ps.sps->sao_enabled && !skip) {
859 int y_end = y >=
s->ps.sps->height - ctb_size;
869 if (x_end && y_end) {
880 int x_end = x_ctb >=
s->ps.sps->width - ctb_size;
881 int y_end = y_ctb >=
s->ps.sps->height - ctb_size;