36 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1,
37 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4,
38 5, 5, 6, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 20, 22, 24
42 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, 7, 8,
43 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36,
44 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, 58, 60, 62, 64
49 static const int qp_c[] = {
50 29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37
52 int qp, qp_i,
offset, idxt;
56 offset =
s->ps.pps->cb_qp_offset;
58 offset =
s->ps.pps->cr_qp_offset;
61 if (
s->ps.sps->chroma_format_idc == 1) {
77 int xBase,
int yBase,
int log2_cb_size)
79 int ctb_size_mask = (1 <<
s->ps.sps->log2_ctb_size) - 1;
80 int MinCuQpDeltaSizeMask = (1 << (
s->ps.sps->log2_ctb_size -
81 s->ps.pps->diff_cu_qp_delta_depth)) - 1;
82 int xQgBase = xBase - (xBase & MinCuQpDeltaSizeMask);
83 int yQgBase = yBase - (yBase & MinCuQpDeltaSizeMask);
84 int min_cb_width =
s->ps.sps->min_cb_width;
85 int x_cb = xQgBase >>
s->ps.sps->log2_min_cb_size;
86 int y_cb = yQgBase >>
s->ps.sps->log2_min_cb_size;
87 int availableA = (xBase & ctb_size_mask) &&
88 (xQgBase & ctb_size_mask);
89 int availableB = (yBase & ctb_size_mask) &&
90 (yQgBase & ctb_size_mask);
91 int qPy_pred, qPy_a, qPy_b;
96 qPy_pred =
s->sh.slice_qp;
105 qPy_a =
s->qp_y_tab[(x_cb - 1) + y_cb * min_cb_width];
111 qPy_b =
s->qp_y_tab[x_cb + (y_cb - 1) * min_cb_width];
113 av_assert2(qPy_a >= -
s->ps.sps->qp_bd_offset && qPy_a < 52);
114 av_assert2(qPy_b >= -
s->ps.sps->qp_bd_offset && qPy_b < 52);
116 return (qPy_a + qPy_b + 1) >> 1;
125 int off =
s->ps.sps->qp_bd_offset;
134 int log2_min_cb_size =
s->ps.sps->log2_min_cb_size;
135 int x = xC >> log2_min_cb_size;
136 int y = yC >> log2_min_cb_size;
137 return s->qp_y_tab[x + y *
s->ps.sps->min_cb_width];
141 ptrdiff_t stride_dst, ptrdiff_t stride_src)
145 if (((intptr_t)dst | (intptr_t)
src | stride_dst | stride_src) & 15) {
147 for (j = 0; j <
width - 7; j+=8)
157 for (j = 0; j <
width; j++)
165 for (j = 0; j <
width; j+=16)
176 *(uint16_t *)dst = *(uint16_t *)
src;
182 int pixel_shift,
int height,
183 ptrdiff_t stride_dst, ptrdiff_t stride_src)
186 if (pixel_shift == 0) {
194 *(uint16_t *)dst = *(uint16_t *)
src;
202 ptrdiff_t stride_src,
int x,
int y,
int width,
int height,
203 int c_idx,
int x_ctb,
int y_ctb)
205 int sh =
s->ps.sps->pixel_shift;
206 int w =
s->ps.sps->width >>
s->ps.sps->hshift[c_idx];
207 int h =
s->ps.sps->height >>
s->ps.sps->vshift[c_idx];
210 memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb) *
w + x) << sh),
212 memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 1) *
w + x) << sh),
216 copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb) *
h + y) << sh),
src, sh,
height, 1 << sh, stride_src);
218 copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 1) *
h + y) << sh),
src + ((
width - 1) << sh), sh,
height, 1 << sh, stride_src);
222 uint8_t *
src1,
const uint8_t *dst1,
223 ptrdiff_t stride_src, ptrdiff_t stride_dst,
226 if (
s->ps.pps->transquant_bypass_enable_flag ||
227 (
s->ps.sps->pcm_loop_filter_disabled &&
s->ps.sps->pcm_enabled)) {
229 int min_pu_size = 1 <<
s->ps.sps->log2_min_pu_size;
230 int hshift =
s->ps.sps->hshift[c_idx];
231 int vshift =
s->ps.sps->vshift[c_idx];
232 int x_min = ((x0 ) >>
s->ps.sps->log2_min_pu_size);
233 int y_min = ((y0 ) >>
s->ps.sps->log2_min_pu_size);
234 int x_max = ((x0 +
width ) >>
s->ps.sps->log2_min_pu_size);
235 int y_max = ((y0 +
height) >>
s->ps.sps->log2_min_pu_size);
236 int len = (min_pu_size >> hshift) <<
s->ps.sps->pixel_shift;
237 for (y = y_min; y < y_max; y++) {
238 for (x = x_min; x < x_max; x++) {
239 if (
s->is_pcm[y *
s->ps.sps->min_pu_width + x]) {
241 uint8_t *
src =
src1 + (((y <<
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_src + ((((x <<
s->ps.sps->log2_min_pu_size) - x0) >> hshift) <<
s->ps.sps->pixel_shift);
242 const uint8_t *dst = dst1 + (((y <<
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_dst + ((((x <<
s->ps.sps->log2_min_pu_size) - x0) >> hshift) <<
s->ps.sps->pixel_shift);
243 for (n = 0; n < (min_pu_size >> vshift); n++) {
254 #define CTB(tab, x, y) ((tab)[(y) * s->ps.sps->ctb_width + (x)])
258 static const uint8_t sao_tab[8] = { 0, 1, 2, 2, 3, 3, 4, 4 };
261 int x_ctb = x >>
s->ps.sps->log2_ctb_size;
262 int y_ctb = y >>
s->ps.sps->log2_ctb_size;
263 int ctb_addr_rs = y_ctb *
s->ps.sps->ctb_width + x_ctb;
264 int ctb_addr_ts =
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs];
267 uint8_t vert_edge[] = { 0, 0 };
268 uint8_t horiz_edge[] = { 0, 0 };
269 uint8_t diag_edge[] = { 0, 0, 0, 0 };
270 uint8_t lfase =
CTB(
s->filter_slice_edges, x_ctb, y_ctb);
271 uint8_t no_tile_filter =
s->ps.pps->tiles_enabled_flag &&
272 !
s->ps.pps->loop_filter_across_tiles_enabled_flag;
273 uint8_t restore = no_tile_filter || !lfase;
274 uint8_t left_tile_edge = 0;
275 uint8_t right_tile_edge = 0;
276 uint8_t up_tile_edge = 0;
277 uint8_t bottom_tile_edge = 0;
279 edges[0] = x_ctb == 0;
280 edges[1] = y_ctb == 0;
281 edges[2] = x_ctb ==
s->ps.sps->ctb_width - 1;
282 edges[3] = y_ctb ==
s->ps.sps->ctb_height - 1;
286 left_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs-1]];
287 vert_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb)) || left_tile_edge;
290 right_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs+1]];
291 vert_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb)) || right_tile_edge;
294 up_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs -
s->ps.sps->ctb_width]];
295 horiz_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb, y_ctb - 1)) || up_tile_edge;
298 bottom_tile_edge = no_tile_filter &&
s->ps.pps->tile_id[ctb_addr_ts] !=
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs +
s->ps.sps->ctb_width]];
299 horiz_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb, y_ctb + 1)) || bottom_tile_edge;
301 if (!edges[0] && !edges[1]) {
302 diag_edge[0] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb - 1)) || left_tile_edge || up_tile_edge;
304 if (!edges[1] && !edges[2]) {
305 diag_edge[1] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb - 1)) || right_tile_edge || up_tile_edge;
307 if (!edges[2] && !edges[3]) {
308 diag_edge[2] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb + 1)) || right_tile_edge || bottom_tile_edge;
310 if (!edges[0] && !edges[3]) {
311 diag_edge[3] = (!lfase &&
CTB(
s->tab_slice_address, x_ctb, y_ctb) !=
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb + 1)) || left_tile_edge || bottom_tile_edge;
315 for (c_idx = 0; c_idx < (
s->ps.sps->chroma_format_idc ? 3 : 1); c_idx++) {
316 int x0 = x >>
s->ps.sps->hshift[c_idx];
317 int y0 = y >>
s->ps.sps->vshift[c_idx];
318 ptrdiff_t stride_src =
s->frame->linesize[c_idx];
319 int ctb_size_h = (1 << (
s->ps.sps->log2_ctb_size)) >>
s->ps.sps->hshift[c_idx];
320 int ctb_size_v = (1 << (
s->ps.sps->log2_ctb_size)) >>
s->ps.sps->vshift[c_idx];
321 int width =
FFMIN(ctb_size_h, (
s->ps.sps->width >>
s->ps.sps->hshift[c_idx]) - x0);
322 int height =
FFMIN(ctb_size_v, (
s->ps.sps->height >>
s->ps.sps->vshift[c_idx]) - y0);
324 uint8_t *
src = &
s->frame->data[c_idx][y0 * stride_src + (x0 <<
s->ps.sps->pixel_shift)];
325 ptrdiff_t stride_dst;
332 if (
s->ps.pps->transquant_bypass_enable_flag ||
333 (
s->ps.sps->pcm_loop_filter_disabled &&
s->ps.sps->pcm_enabled)) {
337 s->hevcdsp.sao_band_filter[
tab](
src, dst, stride_src, stride_dst,
343 s->hevcdsp.sao_band_filter[
tab](
src,
src, stride_src, stride_src,
351 int w =
s->ps.sps->width >>
s->ps.sps->hshift[c_idx];
352 int h =
s->ps.sps->height >>
s->ps.sps->vshift[c_idx];
353 int left_edge = edges[0];
354 int top_edge = edges[1];
355 int right_edge = edges[2];
356 int bottom_edge = edges[3];
357 int sh =
s->ps.sps->pixel_shift;
358 int left_pixels, right_pixels;
364 int left = 1 - left_edge;
365 int right = 1 - right_edge;
366 const uint8_t *
src1[2];
370 dst1 = dst - stride_dst - (
left << sh);
372 src1[1] =
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb - 1) *
w + x0 -
left) << sh);
375 src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb-1).type_idx[c_idx] ==
380 src_idx = (
CTB(
s->sao, x_ctb, y_ctb-1).type_idx[c_idx] ==
385 src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb-1).type_idx[c_idx] ==
391 int left = 1 - left_edge;
392 int right = 1 - right_edge;
393 const uint8_t *
src1[2];
397 dst1 = dst +
height * stride_dst - (
left << sh);
399 src1[1] =
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 2) *
w + x0 -
left) << sh);
402 src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb+1).type_idx[c_idx] ==
407 src_idx = (
CTB(
s->sao, x_ctb, y_ctb+1).type_idx[c_idx] ==
412 src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb+1).type_idx[c_idx] ==
421 s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb - 1) *
h + y0) << sh),
422 sh,
height, stride_dst, 1 << sh);
431 s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 2) *
h + y0) << sh),
432 sh,
height, stride_dst, 1 << sh);
439 src - (left_pixels << sh),
440 (
width + left_pixels + right_pixels) << sh,
441 height, stride_dst, stride_src);
447 s->hevcdsp.sao_edge_restore[restore](
src, dst,
448 stride_src, stride_dst,
466 int log2_min_pu_size =
s->ps.sps->log2_min_pu_size;
472 x_pu = x >> log2_min_pu_size;
473 y_pu = y >> log2_min_pu_size;
475 if (x_pu >=
s->ps.sps->min_pu_width || y_pu >=
s->ps.sps->min_pu_height)
477 return s->is_pcm[y_pu *
s->ps.sps->min_pu_width + x_pu];
480 #define TC_CALC(qp, bs) \
481 tctable[av_clip((qp) + DEFAULT_INTRA_TC_OFFSET * ((bs) - 1) + \
483 0, MAX_QP + DEFAULT_INTRA_TC_OFFSET)]
491 uint8_t no_p[2] = { 0 };
492 uint8_t no_q[2] = { 0 };
494 int log2_ctb_size =
s->ps.sps->log2_ctb_size;
495 int x_end, x_end2, y_end;
496 int ctb_size = 1 << log2_ctb_size;
497 int ctb = (x0 >> log2_ctb_size) +
498 (y0 >> log2_ctb_size) *
s->ps.sps->ctb_width;
499 int cur_tc_offset =
s->deblock[ctb].tc_offset;
500 int cur_beta_offset =
s->deblock[ctb].beta_offset;
501 int left_tc_offset, left_beta_offset;
502 int tc_offset, beta_offset;
503 int pcmf = (
s->ps.sps->pcm_enabled &&
504 s->ps.sps->pcm_loop_filter_disabled) ||
505 s->ps.pps->transquant_bypass_enable_flag;
508 left_tc_offset =
s->deblock[ctb - 1].tc_offset;
509 left_beta_offset =
s->deblock[ctb - 1].beta_offset;
512 left_beta_offset = 0;
515 x_end = x0 + ctb_size;
516 if (x_end >
s->ps.sps->width)
517 x_end =
s->ps.sps->width;
518 y_end = y0 + ctb_size;
519 if (y_end >
s->ps.sps->height)
520 y_end =
s->ps.sps->height;
522 tc_offset = cur_tc_offset;
523 beta_offset = cur_beta_offset;
526 if (x_end2 !=
s->ps.sps->width)
528 for (y = y0; y < y_end; y += 8) {
530 for (x = x0 ? x0 : 8; x < x_end; x += 8) {
531 const int bs0 =
s->vertical_bs[(x + y *
s->bs_width) >> 2];
532 const int bs1 =
s->vertical_bs[(x + (y + 4) *
s->bs_width) >> 2];
540 src = &
s->frame->data[
LUMA][y *
s->frame->linesize[
LUMA] + (x <<
s->ps.sps->pixel_shift)];
546 s->hevcdsp.hevc_v_loop_filter_luma_c(
src,
547 s->frame->linesize[
LUMA],
548 beta,
tc, no_p, no_q);
550 s->hevcdsp.hevc_v_loop_filter_luma(
src,
551 s->frame->linesize[
LUMA],
552 beta,
tc, no_p, no_q);
560 for (x = x0 ? x0 - 8 : 0; x < x_end2; x += 8) {
561 const int bs0 =
s->horizontal_bs[( x + y *
s->bs_width) >> 2];
562 const int bs1 =
s->horizontal_bs[((x + 4) + y *
s->bs_width) >> 2];
566 tc_offset = x >= x0 ? cur_tc_offset : left_tc_offset;
567 beta_offset = x >= x0 ? cur_beta_offset : left_beta_offset;
572 src = &
s->frame->data[
LUMA][y *
s->frame->linesize[
LUMA] + (x <<
s->ps.sps->pixel_shift)];
578 s->hevcdsp.hevc_h_loop_filter_luma_c(
src,
579 s->frame->linesize[
LUMA],
580 beta,
tc, no_p, no_q);
582 s->hevcdsp.hevc_h_loop_filter_luma(
src,
583 s->frame->linesize[
LUMA],
584 beta,
tc, no_p, no_q);
589 if (
s->ps.sps->chroma_format_idc) {
591 int h = 1 <<
s->ps.sps->hshift[
chroma];
592 int v = 1 <<
s->ps.sps->vshift[
chroma];
595 for (y = y0; y < y_end; y += (8 * v)) {
596 for (x = x0 ? x0 : 8 *
h; x < x_end; x += (8 *
h)) {
597 const int bs0 =
s->vertical_bs[(x + y *
s->bs_width) >> 2];
598 const int bs1 =
s->vertical_bs[(x + (y + (4 * v)) *
s->bs_width) >> 2];
600 if ((bs0 == 2) || (bs1 == 2)) {
602 const int qp1 = (
get_qPy(
s, x - 1, y + (4 * v)) +
get_qPy(
s, x, y + (4 * v)) + 1) >> 1;
606 src = &
s->frame->data[
chroma][(y >>
s->ps.sps->vshift[
chroma]) *
s->frame->linesize[
chroma] + ((x >>
s->ps.sps->hshift[
chroma]) <<
s->ps.sps->pixel_shift)];
609 no_p[1] =
get_pcm(
s, x - 1, y + (4 * v));
611 no_q[1] =
get_pcm(
s, x, y + (4 * v));
612 s->hevcdsp.hevc_v_loop_filter_chroma_c(
src,
616 s->hevcdsp.hevc_v_loop_filter_chroma(
src,
626 tc_offset = x0 ? left_tc_offset : cur_tc_offset;
628 if (x_end !=
s->ps.sps->width)
629 x_end2 = x_end - 8 *
h;
630 for (x = x0 ? x0 - 8 *
h : 0; x < x_end2; x += (8 *
h)) {
631 const int bs0 =
s->horizontal_bs[( x + y *
s->bs_width) >> 2];
632 const int bs1 =
s->horizontal_bs[((x + 4 *
h) + y *
s->bs_width) >> 2];
633 if ((bs0 == 2) || (bs1 == 2)) {
634 const int qp0 = bs0 == 2 ? (
get_qPy(
s, x, y - 1) +
get_qPy(
s, x, y) + 1) >> 1 : 0;
635 const int qp1 = bs1 == 2 ? (
get_qPy(
s, x + (4 *
h), y - 1) +
get_qPy(
s, x + (4 *
h), y) + 1) >> 1 : 0;
639 src = &
s->frame->data[
chroma][(y >>
s->ps.sps->vshift[1]) *
s->frame->linesize[
chroma] + ((x >>
s->ps.sps->hshift[1]) <<
s->ps.sps->pixel_shift)];
642 no_p[1] =
get_pcm(
s, x + (4 *
h), y - 1);
645 s->hevcdsp.hevc_h_loop_filter_chroma_c(
src,
649 s->hevcdsp.hevc_h_loop_filter_chroma(
src,
664 if (
s->ref->refPicList[0].list[curr->
ref_idx[0]] == neigh_refPicList[0].
list[neigh->
ref_idx[0]] &&
665 s->ref->refPicList[0].list[curr->
ref_idx[0]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]] &&
674 }
else if (neigh_refPicList[0].
list[neigh->
ref_idx[0]] ==
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
675 neigh_refPicList[1].
list[neigh->
ref_idx[1]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
681 }
else if (neigh_refPicList[1].
list[neigh->
ref_idx[1]] ==
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
682 neigh_refPicList[0].
list[neigh->
ref_idx[0]] ==
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
697 ref_A =
s->ref->refPicList[0].list[curr->
ref_idx[0]];
700 ref_A =
s->ref->refPicList[1].list[curr->
ref_idx[1]];
705 ref_B = neigh_refPicList[0].
list[neigh->
ref_idx[0]];
708 ref_B = neigh_refPicList[1].
list[neigh->
ref_idx[1]];
711 if (ref_A == ref_B) {
727 const MvField *tab_mvf =
s->ref->tab_mvf;
728 int log2_min_pu_size =
s->ps.sps->log2_min_pu_size;
729 int log2_min_tu_size =
s->ps.sps->log2_min_tb_size;
730 int min_pu_width =
s->ps.sps->min_pu_width;
731 int min_tu_width =
s->ps.sps->min_tb_width;
732 int is_intra = tab_mvf[(y0 >> log2_min_pu_size) * min_pu_width +
734 int boundary_upper, boundary_left;
737 boundary_upper = y0 > 0 && !(y0 & 7);
738 if (boundary_upper &&
739 ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
741 (y0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0) ||
742 (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
744 (y0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0)))
747 if (boundary_upper) {
751 int yp_pu = (y0 - 1) >> log2_min_pu_size;
752 int yq_pu = y0 >> log2_min_pu_size;
753 int yp_tu = (y0 - 1) >> log2_min_tu_size;
754 int yq_tu = y0 >> log2_min_tu_size;
756 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
757 int x_pu = (x0 +
i) >> log2_min_pu_size;
758 int x_tu = (x0 +
i) >> log2_min_tu_size;
759 const MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu];
760 const MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
761 uint8_t top_cbf_luma =
s->cbf_luma[yp_tu * min_tu_width + x_tu];
762 uint8_t curr_cbf_luma =
s->cbf_luma[yq_tu * min_tu_width + x_tu];
766 else if (curr_cbf_luma || top_cbf_luma)
770 s->horizontal_bs[((x0 +
i) + y0 *
s->bs_width) >> 2] = bs;
775 boundary_left = x0 > 0 && !(x0 & 7);
777 ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
779 (x0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0) ||
780 (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
782 (x0 % (1 <<
s->ps.sps->log2_ctb_size)) == 0)))
789 int xp_pu = (x0 - 1) >> log2_min_pu_size;
790 int xq_pu = x0 >> log2_min_pu_size;
791 int xp_tu = (x0 - 1) >> log2_min_tu_size;
792 int xq_tu = x0 >> log2_min_tu_size;
794 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
795 int y_pu = (y0 +
i) >> log2_min_pu_size;
796 int y_tu = (y0 +
i) >> log2_min_tu_size;
797 const MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
798 const MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
799 uint8_t left_cbf_luma =
s->cbf_luma[y_tu * min_tu_width + xp_tu];
800 uint8_t curr_cbf_luma =
s->cbf_luma[y_tu * min_tu_width + xq_tu];
804 else if (curr_cbf_luma || left_cbf_luma)
808 s->vertical_bs[(x0 + (y0 +
i) *
s->bs_width) >> 2] = bs;
812 if (log2_trafo_size > log2_min_pu_size && !is_intra) {
816 for (j = 8; j < (1 << log2_trafo_size); j += 8) {
817 int yp_pu = (y0 + j - 1) >> log2_min_pu_size;
818 int yq_pu = (y0 + j) >> log2_min_pu_size;
820 for (
i = 0;
i < (1 << log2_trafo_size);
i += 4) {
821 int x_pu = (x0 +
i) >> log2_min_pu_size;
822 const MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu];
823 const MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
826 s->horizontal_bs[((x0 +
i) + (y0 + j) *
s->bs_width) >> 2] = bs;
831 for (j = 0; j < (1 << log2_trafo_size); j += 4) {
832 int y_pu = (y0 + j) >> log2_min_pu_size;
834 for (
i = 8;
i < (1 << log2_trafo_size);
i += 8) {
835 int xp_pu = (x0 +
i - 1) >> log2_min_pu_size;
836 int xq_pu = (x0 +
i) >> log2_min_pu_size;
837 const MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
838 const MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
841 s->vertical_bs[((x0 +
i) + (y0 + j) *
s->bs_width) >> 2] = bs;
854 int x_end = x >=
s->ps.sps->width - ctb_size;
868 if (
s->ps.sps->sao_enabled && !
skip) {
869 int y_end = y >=
s->ps.sps->height - ctb_size;
879 if (x_end && y_end) {