36     0, 0, 0, 0, 0, 0, 0,  0,  0,  0,  0,  0,  0,  0,  0,  0, 0, 0, 1, 
 
   37     1, 1, 1, 1, 1, 1, 1,  1,  2,  2,  2,  2,  3,  3,  3,  3, 4, 4, 4, 
 
   38     5, 5, 6, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 20, 22, 24           
 
   42      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  6,  7,  8, 
 
   43      9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 
 
   44     38, 40, 42, 44, 46, 48, 50, 52, 54, 56, 58, 60, 62, 64                      
 
   49     static const int qp_c[] = {
 
   50         29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37
 
   52     int qp, qp_i, 
offset, idxt;
 
   56         offset = 
s->ps.pps->cb_qp_offset;
 
   58         offset = 
s->ps.pps->cr_qp_offset;
 
   61     if (
s->ps.sps->chroma_format_idc == 1) {
 
   77                         int xBase, 
int yBase, 
int log2_cb_size)
 
   79     int ctb_size_mask        = (1 << 
s->ps.sps->log2_ctb_size) - 1;
 
   80     int MinCuQpDeltaSizeMask = (1 << (
s->ps.sps->log2_ctb_size -
 
   81                                       s->ps.pps->diff_cu_qp_delta_depth)) - 1;
 
   82     int xQgBase              = xBase - (xBase & MinCuQpDeltaSizeMask);
 
   83     int yQgBase              = yBase - (yBase & MinCuQpDeltaSizeMask);
 
   84     int min_cb_width         = 
s->ps.sps->min_cb_width;
 
   85     int x_cb                 = xQgBase >> 
s->ps.sps->log2_min_cb_size;
 
   86     int y_cb                 = yQgBase >> 
s->ps.sps->log2_min_cb_size;
 
   87     int availableA           = (xBase   & ctb_size_mask) &&
 
   88                                (xQgBase & ctb_size_mask);
 
   89     int availableB           = (yBase   & ctb_size_mask) &&
 
   90                                (yQgBase & ctb_size_mask);
 
   91     int qPy_pred, qPy_a, qPy_b;
 
   96         qPy_pred = 
s->sh.slice_qp;
 
  105         qPy_a = 
s->qp_y_tab[(x_cb - 1) + y_cb * min_cb_width];
 
  111         qPy_b = 
s->qp_y_tab[x_cb + (y_cb - 1) * min_cb_width];
 
  113     av_assert2(qPy_a >= -
s->ps.sps->qp_bd_offset && qPy_a < 52);
 
  114     av_assert2(qPy_b >= -
s->ps.sps->qp_bd_offset && qPy_b < 52);
 
  116     return (qPy_a + qPy_b + 1) >> 1;
 
  125         int off = 
s->ps.sps->qp_bd_offset;
 
  134     int log2_min_cb_size  = 
s->ps.sps->log2_min_cb_size;
 
  135     int x                 = xC >> log2_min_cb_size;
 
  136     int y                 = yC >> log2_min_cb_size;
 
  137     return s->qp_y_tab[x + y * 
s->ps.sps->min_cb_width];
 
  141                      ptrdiff_t stride_dst, ptrdiff_t stride_src)
 
  145     if (((intptr_t)dst | (intptr_t)
src | stride_dst | stride_src) & 15) {
 
  147             for (j = 0; j < 
width - 7; j+=8)
 
  157                 for (j = 0; j < 
width; j++)
 
  165             for (j = 0; j < 
width; j+=16)
 
  176         *(uint16_t *)dst = *(uint16_t *)
src;
 
  182                       int pixel_shift, 
int height,
 
  183                       ptrdiff_t stride_dst, ptrdiff_t stride_src)
 
  186     if (pixel_shift == 0) {
 
  194             *(uint16_t *)dst = *(uint16_t *)
src;
 
  202                            ptrdiff_t stride_src, 
int x, 
int y, 
int width, 
int height,
 
  203                            int c_idx, 
int x_ctb, 
int y_ctb)
 
  205     int sh = 
s->ps.sps->pixel_shift;
 
  206     int w = 
s->ps.sps->width >> 
s->ps.sps->hshift[c_idx];
 
  207     int h = 
s->ps.sps->height >> 
s->ps.sps->vshift[c_idx];
 
  210     memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb) * 
w + x) << sh),
 
  212     memcpy(
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 1) * 
w + x) << sh),
 
  216     copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb) * 
h + y) << sh), 
src, sh, 
height, 1 << sh, stride_src);
 
  218     copy_vert(
s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 1) * 
h + y) << sh), 
src + ((
width - 1) << sh), sh, 
height, 1 << sh, stride_src);
 
  222                                uint8_t *
src1, 
const uint8_t *dst1,
 
  223                                ptrdiff_t stride_src, ptrdiff_t stride_dst,
 
  226     if ( 
s->ps.pps->transquant_bypass_enable_flag ||
 
  227             (
s->ps.sps->pcm.loop_filter_disable_flag && 
s->ps.sps->pcm_enabled_flag)) {
 
  229         int min_pu_size  = 1 << 
s->ps.sps->log2_min_pu_size;
 
  230         int hshift       = 
s->ps.sps->hshift[c_idx];
 
  231         int vshift       = 
s->ps.sps->vshift[c_idx];
 
  232         int x_min        = ((x0         ) >> 
s->ps.sps->log2_min_pu_size);
 
  233         int y_min        = ((y0         ) >> 
s->ps.sps->log2_min_pu_size);
 
  234         int x_max        = ((x0 + 
width ) >> 
s->ps.sps->log2_min_pu_size);
 
  235         int y_max        = ((y0 + 
height) >> 
s->ps.sps->log2_min_pu_size);
 
  236         int len          = (min_pu_size >> hshift) << 
s->ps.sps->pixel_shift;
 
  237         for (y = y_min; y < y_max; y++) {
 
  238             for (x = x_min; x < x_max; x++) {
 
  239                 if (
s->is_pcm[y * 
s->ps.sps->min_pu_width + x]) {
 
  241                     uint8_t *
src = 
src1 + (((y << 
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_src + ((((x << 
s->ps.sps->log2_min_pu_size) - x0) >> hshift) << 
s->ps.sps->pixel_shift);
 
  242                     const uint8_t *dst = dst1 + (((y << 
s->ps.sps->log2_min_pu_size) - y0) >> vshift) * stride_dst + ((((x << 
s->ps.sps->log2_min_pu_size) - x0) >> hshift) << 
s->ps.sps->pixel_shift);
 
  243                     for (n = 0; n < (min_pu_size >> vshift); n++) {
 
  254 #define CTB(tab, x, y) ((tab)[(y) * s->ps.sps->ctb_width + (x)]) 
  258     static const uint8_t sao_tab[8] = { 0, 1, 2, 2, 3, 3, 4, 4 };
 
  261     int x_ctb                = x >> 
s->ps.sps->log2_ctb_size;
 
  262     int y_ctb                = y >> 
s->ps.sps->log2_ctb_size;
 
  263     int ctb_addr_rs          = y_ctb * 
s->ps.sps->ctb_width + x_ctb;
 
  264     int ctb_addr_ts          = 
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs];
 
  267     uint8_t vert_edge[]      = { 0, 0 };
 
  268     uint8_t horiz_edge[]     = { 0, 0 };
 
  269     uint8_t diag_edge[]      = { 0, 0, 0, 0 };
 
  270     uint8_t lfase            = 
CTB(
s->filter_slice_edges, x_ctb, y_ctb);
 
  271     uint8_t no_tile_filter   = 
s->ps.pps->tiles_enabled_flag &&
 
  272                                !
s->ps.pps->loop_filter_across_tiles_enabled_flag;
 
  273     uint8_t restore          = no_tile_filter || !lfase;
 
  274     uint8_t left_tile_edge   = 0;
 
  275     uint8_t right_tile_edge  = 0;
 
  276     uint8_t up_tile_edge     = 0;
 
  277     uint8_t bottom_tile_edge = 0;
 
  279     edges[0]   = x_ctb == 0;
 
  280     edges[1]   = y_ctb == 0;
 
  281     edges[2]   = x_ctb == 
s->ps.sps->ctb_width  - 1;
 
  282     edges[3]   = y_ctb == 
s->ps.sps->ctb_height - 1;
 
  286             left_tile_edge  = no_tile_filter && 
s->ps.pps->tile_id[ctb_addr_ts] != 
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs-1]];
 
  287             vert_edge[0]    = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb)) || left_tile_edge;
 
  290             right_tile_edge = no_tile_filter && 
s->ps.pps->tile_id[ctb_addr_ts] != 
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs+1]];
 
  291             vert_edge[1]    = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb)) || right_tile_edge;
 
  294             up_tile_edge     = no_tile_filter && 
s->ps.pps->tile_id[ctb_addr_ts] != 
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs - 
s->ps.sps->ctb_width]];
 
  295             horiz_edge[0]    = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb, y_ctb - 1)) || up_tile_edge;
 
  298             bottom_tile_edge = no_tile_filter && 
s->ps.pps->tile_id[ctb_addr_ts] != 
s->ps.pps->tile_id[
s->ps.pps->ctb_addr_rs_to_ts[ctb_addr_rs + 
s->ps.sps->ctb_width]];
 
  299             horiz_edge[1]    = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb, y_ctb + 1)) || bottom_tile_edge;
 
  301         if (!edges[0] && !edges[1]) {
 
  302             diag_edge[0] = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb - 1)) || left_tile_edge || up_tile_edge;
 
  304         if (!edges[1] && !edges[2]) {
 
  305             diag_edge[1] = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb - 1)) || right_tile_edge || up_tile_edge;
 
  307         if (!edges[2] && !edges[3]) {
 
  308             diag_edge[2] = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb + 1, y_ctb + 1)) || right_tile_edge || bottom_tile_edge;
 
  310         if (!edges[0] && !edges[3]) {
 
  311             diag_edge[3] = (!lfase && 
CTB(
s->tab_slice_address, x_ctb, y_ctb) != 
CTB(
s->tab_slice_address, x_ctb - 1, y_ctb + 1)) || left_tile_edge || bottom_tile_edge;
 
  315     for (c_idx = 0; c_idx < (
s->ps.sps->chroma_format_idc ? 3 : 1); c_idx++) {
 
  316         int x0       = x >> 
s->ps.sps->hshift[c_idx];
 
  317         int y0       = y >> 
s->ps.sps->vshift[c_idx];
 
  318         ptrdiff_t stride_src = 
s->frame->linesize[c_idx];
 
  319         int ctb_size_h = (1 << (
s->ps.sps->log2_ctb_size)) >> 
s->ps.sps->hshift[c_idx];
 
  320         int ctb_size_v = (1 << (
s->ps.sps->log2_ctb_size)) >> 
s->ps.sps->vshift[c_idx];
 
  321         int width    = 
FFMIN(ctb_size_h, (
s->ps.sps->width  >> 
s->ps.sps->hshift[c_idx]) - x0);
 
  322         int height   = 
FFMIN(ctb_size_v, (
s->ps.sps->height >> 
s->ps.sps->vshift[c_idx]) - y0);
 
  324         uint8_t *
src = &
s->frame->data[c_idx][y0 * stride_src + (x0 << 
s->ps.sps->pixel_shift)];
 
  325         ptrdiff_t stride_dst;
 
  332             if (
s->ps.pps->transquant_bypass_enable_flag ||
 
  333                 (
s->ps.sps->pcm.loop_filter_disable_flag && 
s->ps.sps->pcm_enabled_flag)) {
 
  337                 s->hevcdsp.sao_band_filter[
tab](
src, dst, stride_src, stride_dst,
 
  343                 s->hevcdsp.sao_band_filter[
tab](
src, 
src, stride_src, stride_src,
 
  351             int w = 
s->ps.sps->width >> 
s->ps.sps->hshift[c_idx];
 
  352             int h = 
s->ps.sps->height >> 
s->ps.sps->vshift[c_idx];
 
  353             int left_edge = edges[0];
 
  354             int top_edge = edges[1];
 
  355             int right_edge = edges[2];
 
  356             int bottom_edge = edges[3];
 
  357             int sh = 
s->ps.sps->pixel_shift;
 
  358             int left_pixels, right_pixels;
 
  364                 int left = 1 - left_edge;
 
  365                 int right = 1 - right_edge;
 
  366                 const uint8_t *
src1[2];
 
  370                 dst1 = dst - stride_dst - (
left << sh);
 
  372                 src1[1] = 
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb - 1) * 
w + x0 - 
left) << sh);
 
  375                     src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb-1).type_idx[c_idx] ==
 
  380                 src_idx = (
CTB(
s->sao, x_ctb, y_ctb-1).type_idx[c_idx] ==
 
  385                     src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb-1).type_idx[c_idx] ==
 
  391                 int left = 1 - left_edge;
 
  392                 int right = 1 - right_edge;
 
  393                 const uint8_t *
src1[2];
 
  397                 dst1 = dst + 
height * stride_dst - (
left << sh);
 
  399                 src1[1] = 
s->sao_pixel_buffer_h[c_idx] + (((2 * y_ctb + 2) * 
w + x0 - 
left) << sh);
 
  402                     src_idx = (
CTB(
s->sao, x_ctb-1, y_ctb+1).type_idx[c_idx] ==
 
  407                 src_idx = (
CTB(
s->sao, x_ctb, y_ctb+1).type_idx[c_idx] ==
 
  412                     src_idx = (
CTB(
s->sao, x_ctb+1, y_ctb+1).type_idx[c_idx] ==
 
  421                               s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb - 1) * 
h + y0) << sh),
 
  422                               sh, 
height, stride_dst, 1 << sh);
 
  431                               s->sao_pixel_buffer_v[c_idx] + (((2 * x_ctb + 2) * 
h + y0) << sh),
 
  432                               sh, 
height, stride_dst, 1 << sh);
 
  439                      src - (left_pixels << sh),
 
  440                      (
width + left_pixels + right_pixels) << sh,
 
  441                      height, stride_dst, stride_src);
 
  447             s->hevcdsp.sao_edge_restore[restore](
src, dst,
 
  448                                                 stride_src, stride_dst,
 
  466     int log2_min_pu_size = 
s->ps.sps->log2_min_pu_size;
 
  472     x_pu = x >> log2_min_pu_size;
 
  473     y_pu = y >> log2_min_pu_size;
 
  475     if (x_pu >= 
s->ps.sps->min_pu_width || y_pu >= 
s->ps.sps->min_pu_height)
 
  477     return s->is_pcm[y_pu * 
s->ps.sps->min_pu_width + x_pu];
 
  480 #define TC_CALC(qp, bs)                                                 \ 
  481     tctable[av_clip((qp) + DEFAULT_INTRA_TC_OFFSET * ((bs) - 1) +       \ 
  483                     0, MAX_QP + DEFAULT_INTRA_TC_OFFSET)] 
  491     uint8_t no_p[2] = { 0 };
 
  492     uint8_t no_q[2] = { 0 };
 
  494     int log2_ctb_size = 
s->ps.sps->log2_ctb_size;
 
  495     int x_end, x_end2, y_end;
 
  496     int ctb_size        = 1 << log2_ctb_size;
 
  497     int ctb             = (x0 >> log2_ctb_size) +
 
  498                           (y0 >> log2_ctb_size) * 
s->ps.sps->ctb_width;
 
  499     int cur_tc_offset   = 
s->deblock[ctb].tc_offset;
 
  500     int cur_beta_offset = 
s->deblock[ctb].beta_offset;
 
  501     int left_tc_offset, left_beta_offset;
 
  502     int tc_offset, beta_offset;
 
  503     int pcmf = (
s->ps.sps->pcm_enabled_flag &&
 
  504                 s->ps.sps->pcm.loop_filter_disable_flag) ||
 
  505                s->ps.pps->transquant_bypass_enable_flag;
 
  508         left_tc_offset   = 
s->deblock[ctb - 1].tc_offset;
 
  509         left_beta_offset = 
s->deblock[ctb - 1].beta_offset;
 
  512         left_beta_offset = 0;
 
  515     x_end = x0 + ctb_size;
 
  516     if (x_end > 
s->ps.sps->width)
 
  517         x_end = 
s->ps.sps->width;
 
  518     y_end = y0 + ctb_size;
 
  519     if (y_end > 
s->ps.sps->height)
 
  520         y_end = 
s->ps.sps->height;
 
  522     tc_offset   = cur_tc_offset;
 
  523     beta_offset = cur_beta_offset;
 
  526     if (x_end2 != 
s->ps.sps->width)
 
  528     for (y = y0; y < y_end; y += 8) {
 
  530         for (x = x0 ? x0 : 8; x < x_end; x += 8) {
 
  531             const int bs0 = 
s->vertical_bs[(x +  y      * 
s->bs_width) >> 2];
 
  532             const int bs1 = 
s->vertical_bs[(x + (y + 4) * 
s->bs_width) >> 2];
 
  540                 src     = &
s->frame->data[
LUMA][y * 
s->frame->linesize[
LUMA] + (x << 
s->ps.sps->pixel_shift)];
 
  546                     s->hevcdsp.hevc_v_loop_filter_luma_c(
src,
 
  547                                                          s->frame->linesize[
LUMA],
 
  548                                                          beta, 
tc, no_p, no_q);
 
  550                     s->hevcdsp.hevc_v_loop_filter_luma(
src,
 
  551                                                        s->frame->linesize[
LUMA],
 
  552                                                        beta, 
tc, no_p, no_q);
 
  560         for (x = x0 ? x0 - 8 : 0; x < x_end2; x += 8) {
 
  561             const int bs0 = 
s->horizontal_bs[( x      + y * 
s->bs_width) >> 2];
 
  562             const int bs1 = 
s->horizontal_bs[((x + 4) + y * 
s->bs_width) >> 2];
 
  566                 tc_offset   = x >= x0 ? cur_tc_offset : left_tc_offset;
 
  567                 beta_offset = x >= x0 ? cur_beta_offset : left_beta_offset;
 
  572                 src     = &
s->frame->data[
LUMA][y * 
s->frame->linesize[
LUMA] + (x << 
s->ps.sps->pixel_shift)];
 
  578                     s->hevcdsp.hevc_h_loop_filter_luma_c(
src,
 
  579                                                          s->frame->linesize[
LUMA],
 
  580                                                          beta, 
tc, no_p, no_q);
 
  582                     s->hevcdsp.hevc_h_loop_filter_luma(
src,
 
  583                                                        s->frame->linesize[
LUMA],
 
  584                                                        beta, 
tc, no_p, no_q);
 
  589     if (
s->ps.sps->chroma_format_idc) {
 
  591             int h = 1 << 
s->ps.sps->hshift[
chroma];
 
  592             int v = 1 << 
s->ps.sps->vshift[
chroma];
 
  595             for (y = y0; y < y_end; y += (8 * v)) {
 
  596                 for (x = x0 ? x0 : 8 * 
h; x < x_end; x += (8 * 
h)) {
 
  597                     const int bs0 = 
s->vertical_bs[(x +  y            * 
s->bs_width) >> 2];
 
  598                     const int bs1 = 
s->vertical_bs[(x + (y + (4 * v)) * 
s->bs_width) >> 2];
 
  600                     if ((bs0 == 2) || (bs1 == 2)) {
 
  602                         const int qp1 = (
get_qPy(
s, x - 1, y + (4 * v)) + 
get_qPy(
s, x, y + (4 * v)) + 1) >> 1;
 
  606                         src       = &
s->frame->data[
chroma][(y >> 
s->ps.sps->vshift[
chroma]) * 
s->frame->linesize[
chroma] + ((x >> 
s->ps.sps->hshift[
chroma]) << 
s->ps.sps->pixel_shift)];
 
  609                             no_p[1] = 
get_pcm(
s, x - 1, y + (4 * v));
 
  611                             no_q[1] = 
get_pcm(
s, x, y + (4 * v));
 
  612                             s->hevcdsp.hevc_v_loop_filter_chroma_c(
src,
 
  616                             s->hevcdsp.hevc_v_loop_filter_chroma(
src,
 
  626                 tc_offset = x0 ? left_tc_offset : cur_tc_offset;
 
  628                 if (x_end != 
s->ps.sps->width)
 
  629                     x_end2 = x_end - 8 * 
h;
 
  630                 for (x = x0 ? x0 - 8 * 
h : 0; x < x_end2; x += (8 * 
h)) {
 
  631                     const int bs0 = 
s->horizontal_bs[( x          + y * 
s->bs_width) >> 2];
 
  632                     const int bs1 = 
s->horizontal_bs[((x + 4 * 
h) + y * 
s->bs_width) >> 2];
 
  633                     if ((bs0 == 2) || (bs1 == 2)) {
 
  634                         const int qp0 = bs0 == 2 ? (
get_qPy(
s, x,           y - 1) + 
get_qPy(
s, x,           y) + 1) >> 1 : 0;
 
  635                         const int qp1 = bs1 == 2 ? (
get_qPy(
s, x + (4 * 
h), y - 1) + 
get_qPy(
s, x + (4 * 
h), y) + 1) >> 1 : 0;
 
  639                         src       = &
s->frame->data[
chroma][(y >> 
s->ps.sps->vshift[1]) * 
s->frame->linesize[
chroma] + ((x >> 
s->ps.sps->hshift[1]) << 
s->ps.sps->pixel_shift)];
 
  642                             no_p[1] = 
get_pcm(
s, x + (4 * 
h), y - 1);
 
  645                             s->hevcdsp.hevc_h_loop_filter_chroma_c(
src,
 
  649                             s->hevcdsp.hevc_h_loop_filter_chroma(
src,
 
  664         if (
s->ref->refPicList[0].list[curr->
ref_idx[0]] == neigh_refPicList[0].
list[neigh->
ref_idx[0]]  &&
 
  665             s->ref->refPicList[0].list[curr->
ref_idx[0]] == 
s->ref->refPicList[1].list[curr->
ref_idx[1]] &&
 
  674         } 
else if (neigh_refPicList[0].
list[neigh->
ref_idx[0]] == 
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
 
  675                    neigh_refPicList[1].
list[neigh->
ref_idx[1]] == 
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
 
  681         } 
else if (neigh_refPicList[1].
list[neigh->
ref_idx[1]] == 
s->ref->refPicList[0].list[curr->
ref_idx[0]] &&
 
  682                    neigh_refPicList[0].
list[neigh->
ref_idx[0]] == 
s->ref->refPicList[1].list[curr->
ref_idx[1]]) {
 
  697             ref_A = 
s->ref->refPicList[0].list[curr->
ref_idx[0]];
 
  700             ref_A = 
s->ref->refPicList[1].list[curr->
ref_idx[1]];
 
  705             ref_B = neigh_refPicList[0].
list[neigh->
ref_idx[0]];
 
  708             ref_B = neigh_refPicList[1].
list[neigh->
ref_idx[1]];
 
  711         if (ref_A == ref_B) {
 
  727     const MvField *tab_mvf = 
s->ref->tab_mvf;
 
  728     int log2_min_pu_size = 
s->ps.sps->log2_min_pu_size;
 
  729     int log2_min_tu_size = 
s->ps.sps->log2_min_tb_size;
 
  730     int min_pu_width     = 
s->ps.sps->min_pu_width;
 
  731     int min_tu_width     = 
s->ps.sps->min_tb_width;
 
  732     int is_intra = tab_mvf[(y0 >> log2_min_pu_size) * min_pu_width +
 
  734     int boundary_upper, boundary_left;
 
  737     boundary_upper = y0 > 0 && !(y0 & 7);
 
  738     if (boundary_upper &&
 
  739         ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
 
  741           (y0 % (1 << 
s->ps.sps->log2_ctb_size)) == 0) ||
 
  742          (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
 
  744           (y0 % (1 << 
s->ps.sps->log2_ctb_size)) == 0)))
 
  747     if (boundary_upper) {
 
  751         int yp_pu = (y0 - 1) >> log2_min_pu_size;
 
  752         int yq_pu =  y0      >> log2_min_pu_size;
 
  753         int yp_tu = (y0 - 1) >> log2_min_tu_size;
 
  754         int yq_tu =  y0      >> log2_min_tu_size;
 
  756             for (
i = 0; 
i < (1 << log2_trafo_size); 
i += 4) {
 
  757                 int x_pu = (x0 + 
i) >> log2_min_pu_size;
 
  758                 int x_tu = (x0 + 
i) >> log2_min_tu_size;
 
  759                 const MvField *top  = &tab_mvf[yp_pu * min_pu_width + x_pu];
 
  760                 const MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
 
  761                 uint8_t top_cbf_luma  = 
s->cbf_luma[yp_tu * min_tu_width + x_tu];
 
  762                 uint8_t curr_cbf_luma = 
s->cbf_luma[yq_tu * min_tu_width + x_tu];
 
  766                 else if (curr_cbf_luma || top_cbf_luma)
 
  770                 s->horizontal_bs[((x0 + 
i) + y0 * 
s->bs_width) >> 2] = bs;
 
  775     boundary_left = x0 > 0 && !(x0 & 7);
 
  777         ((!
s->sh.slice_loop_filter_across_slices_enabled_flag &&
 
  779           (x0 % (1 << 
s->ps.sps->log2_ctb_size)) == 0) ||
 
  780          (!
s->ps.pps->loop_filter_across_tiles_enabled_flag &&
 
  782           (x0 % (1 << 
s->ps.sps->log2_ctb_size)) == 0)))
 
  789         int xp_pu = (x0 - 1) >> log2_min_pu_size;
 
  790         int xq_pu =  x0      >> log2_min_pu_size;
 
  791         int xp_tu = (x0 - 1) >> log2_min_tu_size;
 
  792         int xq_tu =  x0      >> log2_min_tu_size;
 
  794             for (
i = 0; 
i < (1 << log2_trafo_size); 
i += 4) {
 
  795                 int y_pu      = (y0 + 
i) >> log2_min_pu_size;
 
  796                 int y_tu      = (y0 + 
i) >> log2_min_tu_size;
 
  797                 const MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
 
  798                 const MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
 
  799                 uint8_t left_cbf_luma = 
s->cbf_luma[y_tu * min_tu_width + xp_tu];
 
  800                 uint8_t curr_cbf_luma = 
s->cbf_luma[y_tu * min_tu_width + xq_tu];
 
  804                 else if (curr_cbf_luma || left_cbf_luma)
 
  808                 s->vertical_bs[(x0 + (y0 + 
i) * 
s->bs_width) >> 2] = bs;
 
  812     if (log2_trafo_size > log2_min_pu_size && !is_intra) {
 
  816         for (j = 8; j < (1 << log2_trafo_size); j += 8) {
 
  817             int yp_pu = (y0 + j - 1) >> log2_min_pu_size;
 
  818             int yq_pu = (y0 + j)     >> log2_min_pu_size;
 
  820             for (
i = 0; 
i < (1 << log2_trafo_size); 
i += 4) {
 
  821                 int x_pu = (x0 + 
i) >> log2_min_pu_size;
 
  822                 const MvField *top  = &tab_mvf[yp_pu * min_pu_width + x_pu];
 
  823                 const MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu];
 
  826                 s->horizontal_bs[((x0 + 
i) + (y0 + j) * 
s->bs_width) >> 2] = bs;
 
  831         for (j = 0; j < (1 << log2_trafo_size); j += 4) {
 
  832             int y_pu = (y0 + j) >> log2_min_pu_size;
 
  834             for (
i = 8; 
i < (1 << log2_trafo_size); 
i += 8) {
 
  835                 int xp_pu = (x0 + 
i - 1) >> log2_min_pu_size;
 
  836                 int xq_pu = (x0 + 
i)     >> log2_min_pu_size;
 
  837                 const MvField *
left = &tab_mvf[y_pu * min_pu_width + xp_pu];
 
  838                 const MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu];
 
  841                 s->vertical_bs[((x0 + 
i) + (y0 + j) * 
s->bs_width) >> 2] = bs;
 
  854     int x_end = x >= 
s->ps.sps->width  - ctb_size;
 
  868     if (
s->ps.sps->sao_enabled && !
skip) {
 
  869         int y_end = y >= 
s->ps.sps->height - ctb_size;
 
  879         if (x_end && y_end) {